@objectstack/knowledge-ragflow 6.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/index.ts"],"sourcesContent":["// Copyright (c) 2025 ObjectStack. Licensed under the Apache-2.0 license.\n\nimport type { Plugin, PluginContext } from '@objectstack/core';\nimport type {\n IKnowledgeAdapter,\n IKnowledgeService,\n AdapterContext,\n AdapterSearchOptions,\n} from '@objectstack/spec/contracts';\nimport type {\n KnowledgeDocument,\n KnowledgeHit,\n KnowledgeSource,\n} from '@objectstack/spec/ai';\nimport { KNOWLEDGE_SERVICE } from '@objectstack/spec/contracts';\n\n/**\n * Subset of `fetch` used by the adapter. Inject in tests; defaults to\n * the global `fetch`.\n */\nexport type FetchLike = (\n input: string,\n init?: {\n method?: string;\n headers?: Record<string, string>;\n body?: string;\n signal?: AbortSignal;\n },\n) => Promise<{\n ok: boolean;\n status: number;\n statusText: string;\n text(): Promise<string>;\n json(): Promise<unknown>;\n}>;\n\nexport interface KnowledgeRagflowAdapterOptions {\n /** RAGFlow endpoint, e.g. `http://localhost:9380`. */\n endpoint: string;\n /** RAGFlow API key (Bearer token). */\n apiKey: string;\n /** Adapter id. @default 'ragflow' */\n id?: string;\n /** Override `fetch` for tests. */\n fetch?: FetchLike;\n /** Request timeout in milliseconds. @default 30000 */\n timeoutMs?: number;\n}\n\ninterface RagflowSourceOptions {\n datasetId: string;\n /** Optional rerank model id (overrides dataset default). */\n rerankModel?: string;\n /** Optional similarity threshold passed through to RAGFlow. */\n similarityThreshold?: number;\n /** Optional vector vs keyword weight in [0,1]. */\n vectorSimilarityWeight?: number;\n}\n\nfunction extractRagflowOptions(source: KnowledgeSource): RagflowSourceOptions {\n const opts = ((source as unknown as { options?: Record<string, unknown> }).options ?? {}) as\n Record<string, unknown>;\n const datasetId = opts.datasetId;\n if (typeof datasetId !== 'string' || !datasetId) {\n throw new Error(\n `RAGFlow adapter requires source.options.datasetId on source '${source.id}'`,\n );\n }\n return {\n datasetId,\n rerankModel: typeof opts.rerankModel === 'string' ? opts.rerankModel : undefined,\n similarityThreshold:\n typeof opts.similarityThreshold === 'number' ? opts.similarityThreshold : undefined,\n vectorSimilarityWeight:\n typeof opts.vectorSimilarityWeight === 'number'\n ? opts.vectorSimilarityWeight\n : undefined,\n };\n}\n\n/**\n * RAGFlow adapter. Maps {@link KnowledgeDocument} upserts to the\n * dataset's chunk API, delegates retrieval to `/api/v1/retrieval`, and\n * returns {@link KnowledgeHit}s with `sourceRecordId` preserved so the\n * orchestrator can run a permission re-check.\n */\nexport class KnowledgeRagflowAdapter implements IKnowledgeAdapter {\n readonly id: string;\n private readonly endpoint: string;\n private readonly apiKey: string;\n private readonly fetchImpl: FetchLike;\n private readonly timeoutMs: number;\n\n constructor(opts: KnowledgeRagflowAdapterOptions) {\n if (!opts.endpoint) throw new Error('RAGFlow adapter: endpoint required');\n if (!opts.apiKey) throw new Error('RAGFlow adapter: apiKey required');\n this.id = opts.id ?? 'ragflow';\n this.endpoint = opts.endpoint.replace(/\\/+$/, '');\n this.apiKey = opts.apiKey;\n this.fetchImpl = opts.fetch ?? ((globalThis as { fetch?: FetchLike }).fetch as FetchLike);\n this.timeoutMs = opts.timeoutMs ?? 30000;\n if (!this.fetchImpl) {\n throw new Error('RAGFlow adapter: no fetch available; pass options.fetch');\n }\n }\n\n async upsert(docs: KnowledgeDocument[], ctx: AdapterContext): Promise<void> {\n const { datasetId } = extractRagflowOptions(ctx.source);\n // RAGFlow models documents in two layers: documents (file-like) and\n // chunks (text blocks). We treat each KnowledgeDocument as a single\n // chunk-set: delete existing chunks with the same external id, then\n // upload as `content` chunks tagged with our document id.\n for (const doc of docs) {\n await this.deleteChunksByDocumentId(datasetId, doc.id);\n await this.request(`/api/v1/datasets/${datasetId}/chunks`, {\n method: 'POST',\n body: JSON.stringify({\n content: doc.content,\n // RAGFlow accepts arbitrary metadata used for filtering at\n // retrieval time. We always stamp `objectstack_doc_id` so\n // delete() can find these chunks again.\n important_keywords: doc.title ? [doc.title] : undefined,\n metadata: {\n ...(doc.metadata ?? {}),\n objectstack_doc_id: doc.id,\n objectstack_source_id: doc.sourceId,\n objectstack_record_id: doc.sourceRecordId,\n title: doc.title,\n },\n }),\n });\n }\n }\n\n async delete(documentIds: string[], ctx: AdapterContext): Promise<void> {\n const { datasetId } = extractRagflowOptions(ctx.source);\n for (const id of documentIds) {\n await this.deleteChunksByDocumentId(datasetId, id);\n }\n }\n\n async search(query: string, opts: AdapterSearchOptions): Promise<KnowledgeHit[]> {\n const { datasetId, rerankModel, similarityThreshold, vectorSimilarityWeight } =\n extractRagflowOptions(opts.source);\n const body: Record<string, unknown> = {\n question: query,\n dataset_ids: [datasetId],\n top_k: opts.topK,\n keyword: true,\n };\n if (rerankModel) body.rerank_id = rerankModel;\n if (typeof similarityThreshold === 'number') body.similarity_threshold = similarityThreshold;\n if (typeof vectorSimilarityWeight === 'number')\n body.vector_similarity_weight = vectorSimilarityWeight;\n if (opts.filter) body.metadata_condition = { ...opts.filter };\n\n const res = await this.request('/api/v1/retrieval', {\n method: 'POST',\n body: JSON.stringify(body),\n });\n const data = (res?.data ?? {}) as { chunks?: RagflowChunkHit[] };\n const chunks = data.chunks ?? [];\n return chunks.slice(0, opts.topK).map<KnowledgeHit>((c) => {\n const md = (c.metadata ?? {}) as Record<string, unknown>;\n const docId =\n (md.objectstack_doc_id as string | undefined) ??\n c.document_id ??\n c.doc_id ??\n c.id;\n const recordId = md.objectstack_record_id as string | undefined;\n return {\n chunkId: c.id ?? `${docId}#${c.position ?? 0}`,\n documentId: docId ?? c.id ?? 'unknown',\n sourceId: opts.source.id,\n sourceRecordId: recordId,\n score: c.similarity ?? c.score ?? 0,\n snippet: c.content ?? c.content_with_weight ?? '',\n title: (md.title as string | undefined) ?? c.document_name,\n metadata: md,\n };\n });\n }\n\n async healthCheck(): Promise<{ ok: boolean; message?: string }> {\n try {\n await this.request('/api/v1/datasets?page=1&page_size=1', { method: 'GET' });\n return { ok: true };\n } catch (err) {\n return { ok: false, message: err instanceof Error ? err.message : String(err) };\n }\n }\n\n private async deleteChunksByDocumentId(datasetId: string, docId: string): Promise<void> {\n // Find chunks with our stamped metadata, then delete by chunk id.\n const found = (await this.request(`/api/v1/retrieval`, {\n method: 'POST',\n body: JSON.stringify({\n question: docId,\n dataset_ids: [datasetId],\n top_k: 256,\n keyword: false,\n metadata_condition: { objectstack_doc_id: docId },\n }),\n })) as { data?: { chunks?: Array<{ id?: string }> } };\n const ids = (found.data?.chunks ?? [])\n .map((c) => c.id)\n .filter((x): x is string => typeof x === 'string');\n if (ids.length === 0) return;\n await this.request(`/api/v1/datasets/${datasetId}/chunks`, {\n method: 'DELETE',\n body: JSON.stringify({ chunk_ids: ids }),\n });\n }\n\n private async request(\n path: string,\n init: { method: string; body?: string },\n ): Promise<{ data?: unknown; code?: number; message?: string }> {\n const controller = new AbortController();\n const t = setTimeout(() => controller.abort(), this.timeoutMs);\n try {\n const res = await this.fetchImpl(`${this.endpoint}${path}`, {\n method: init.method,\n headers: {\n 'content-type': 'application/json',\n authorization: `Bearer ${this.apiKey}`,\n },\n body: init.body,\n signal: controller.signal,\n });\n const raw = await res.text();\n let parsed: { data?: unknown; code?: number; message?: string } = {};\n if (raw) {\n try {\n parsed = JSON.parse(raw) as typeof parsed;\n } catch {\n if (!res.ok) {\n throw new Error(\n `RAGFlow ${init.method} ${path} → ${res.status} ${res.statusText}: ${raw.slice(0, 200)}`,\n );\n }\n }\n }\n if (!res.ok || (typeof parsed.code === 'number' && parsed.code !== 0 && parsed.code !== 200)) {\n throw new Error(\n `RAGFlow ${init.method} ${path} → ${res.status} ${res.statusText}${\n parsed.message ? ` (${parsed.message})` : ''\n }`,\n );\n }\n return parsed;\n } finally {\n clearTimeout(t);\n }\n }\n}\n\ninterface RagflowChunkHit {\n id?: string;\n document_id?: string;\n doc_id?: string;\n document_name?: string;\n content?: string;\n content_with_weight?: string;\n similarity?: number;\n score?: number;\n position?: number;\n metadata?: Record<string, unknown>;\n}\n\n/* ---------------------------------------------------------------- */\n/* Kernel plugin glue */\n/* ---------------------------------------------------------------- */\n\nexport interface KnowledgeRagflowPluginOptions extends KnowledgeRagflowAdapterOptions {}\n\nexport class KnowledgeRagflowPlugin implements Plugin {\n name = 'com.objectstack.plugin.knowledge-ragflow';\n version = '0.1.0';\n type = 'standard';\n\n private readonly adapter: KnowledgeRagflowAdapter;\n\n constructor(opts: KnowledgeRagflowPluginOptions) {\n this.adapter = new KnowledgeRagflowAdapter(opts);\n }\n\n async init(_ctx: PluginContext): Promise<void> {\n // No-op: actual registration happens in start() once service is available.\n }\n\n async start(ctx: PluginContext): Promise<void> {\n let svc: IKnowledgeService | undefined;\n try {\n svc = ctx.getService<IKnowledgeService>(KNOWLEDGE_SERVICE);\n } catch {\n ctx.logger.warn?.(\n 'KnowledgeRagflowPlugin: IKnowledgeService not registered — install KnowledgeServicePlugin first.',\n );\n return;\n }\n svc.registerAdapter(this.adapter.id, this.adapter);\n ctx.logger.info?.(\n `KnowledgeRagflowPlugin: adapter '${this.adapter.id}' registered (endpoint=${(this.adapter as unknown as { endpoint: string }).endpoint}).`,\n );\n }\n}\n"],"mappings":";;;;;;;;;;;;;;;;;;;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAcA,uBAAkC;AA6ClC,SAAS,sBAAsB,QAA+C;AAC5E,QAAM,OAAS,OAA4D,WAAW,CAAC;AAEvF,QAAM,YAAY,KAAK;AACvB,MAAI,OAAO,cAAc,YAAY,CAAC,WAAW;AAC/C,UAAM,IAAI;AAAA,MACR,gEAAgE,OAAO,EAAE;AAAA,IAC3E;AAAA,EACF;AACA,SAAO;AAAA,IACL;AAAA,IACA,aAAa,OAAO,KAAK,gBAAgB,WAAW,KAAK,cAAc;AAAA,IACvE,qBACE,OAAO,KAAK,wBAAwB,WAAW,KAAK,sBAAsB;AAAA,IAC5E,wBACE,OAAO,KAAK,2BAA2B,WACnC,KAAK,yBACL;AAAA,EACR;AACF;AAQO,IAAM,0BAAN,MAA2D;AAAA,EAOhE,YAAY,MAAsC;AAChD,QAAI,CAAC,KAAK,SAAU,OAAM,IAAI,MAAM,oCAAoC;AACxE,QAAI,CAAC,KAAK,OAAQ,OAAM,IAAI,MAAM,kCAAkC;AACpE,SAAK,KAAK,KAAK,MAAM;AACrB,SAAK,WAAW,KAAK,SAAS,QAAQ,QAAQ,EAAE;AAChD,SAAK,SAAS,KAAK;AACnB,SAAK,YAAY,KAAK,SAAW,WAAqC;AACtE,SAAK,YAAY,KAAK,aAAa;AACnC,QAAI,CAAC,KAAK,WAAW;AACnB,YAAM,IAAI,MAAM,yDAAyD;AAAA,IAC3E;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,MAA2B,KAAoC;AAC1E,UAAM,EAAE,UAAU,IAAI,sBAAsB,IAAI,MAAM;AAKtD,eAAW,OAAO,MAAM;AACtB,YAAM,KAAK,yBAAyB,WAAW,IAAI,EAAE;AACrD,YAAM,KAAK,QAAQ,oBAAoB,SAAS,WAAW;AAAA,QACzD,QAAQ;AAAA,QACR,MAAM,KAAK,UAAU;AAAA,UACnB,SAAS,IAAI;AAAA;AAAA;AAAA;AAAA,UAIb,oBAAoB,IAAI,QAAQ,CAAC,IAAI,KAAK,IAAI;AAAA,UAC9C,UAAU;AAAA,YACR,GAAI,IAAI,YAAY,CAAC;AAAA,YACrB,oBAAoB,IAAI;AAAA,YACxB,uBAAuB,IAAI;AAAA,YAC3B,uBAAuB,IAAI;AAAA,YAC3B,OAAO,IAAI;AAAA,UACb;AAAA,QACF,CAAC;AAAA,MACH,CAAC;AAAA,IACH;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,aAAuB,KAAoC;AACtE,UAAM,EAAE,UAAU,IAAI,sBAAsB,IAAI,MAAM;AACtD,eAAW,MAAM,aAAa;AAC5B,YAAM,KAAK,yBAAyB,WAAW,EAAE;AAAA,IACnD;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,OAAe,MAAqD;AAC/E,UAAM,EAAE,WAAW,aAAa,qBAAqB,uBAAuB,IAC1E,sBAAsB,KAAK,MAAM;AACnC,UAAM,OAAgC;AAAA,MACpC,UAAU;AAAA,MACV,aAAa,CAAC,SAAS;AAAA,MACvB,OAAO,KAAK;AAAA,MACZ,SAAS;AAAA,IACX;AACA,QAAI,YAAa,MAAK,YAAY;AAClC,QAAI,OAAO,wBAAwB,SAAU,MAAK,uBAAuB;AACzE,QAAI,OAAO,2BAA2B;AACpC,WAAK,2BAA2B;AAClC,QAAI,KAAK,OAAQ,MAAK,qBAAqB,EAAE,GAAG,KAAK,OAAO;AAE5D,UAAM,MAAM,MAAM,KAAK,QAAQ,qBAAqB;AAAA,MAClD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU,IAAI;AAAA,IAC3B,CAAC;AACD,UAAM,OAAQ,KAAK,QAAQ,CAAC;AAC5B,UAAM,SAAS,KAAK,UAAU,CAAC;AAC/B,WAAO,OAAO,MAAM,GAAG,KAAK,IAAI,EAAE,IAAkB,CAAC,MAAM;AACzD,YAAM,KAAM,EAAE,YAAY,CAAC;AAC3B,YAAM,QACH,GAAG,sBACJ,EAAE,eACF,EAAE,UACF,EAAE;AACJ,YAAM,WAAW,GAAG;AACpB,aAAO;AAAA,QACL,SAAS,EAAE,MAAM,GAAG,KAAK,IAAI,EAAE,YAAY,CAAC;AAAA,QAC5C,YAAY,SAAS,EAAE,MAAM;AAAA,QAC7B,UAAU,KAAK,OAAO;AAAA,QACtB,gBAAgB;AAAA,QAChB,OAAO,EAAE,cAAc,EAAE,SAAS;AAAA,QAClC,SAAS,EAAE,WAAW,EAAE,uBAAuB;AAAA,QAC/C,OAAQ,GAAG,SAAgC,EAAE;AAAA,QAC7C,UAAU;AAAA,MACZ;AAAA,IACF,CAAC;AAAA,EACH;AAAA,EAEA,MAAM,cAA0D;AAC9D,QAAI;AACF,YAAM,KAAK,QAAQ,uCAAuC,EAAE,QAAQ,MAAM,CAAC;AAC3E,aAAO,EAAE,IAAI,KAAK;AAAA,IACpB,SAAS,KAAK;AACZ,aAAO,EAAE,IAAI,OAAO,SAAS,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,EAAE;AAAA,IAChF;AAAA,EACF;AAAA,EAEA,MAAc,yBAAyB,WAAmB,OAA8B;AAEtF,UAAM,QAAS,MAAM,KAAK,QAAQ,qBAAqB;AAAA,MACrD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU;AAAA,QACnB,UAAU;AAAA,QACV,aAAa,CAAC,SAAS;AAAA,QACvB,OAAO;AAAA,QACP,SAAS;AAAA,QACT,oBAAoB,EAAE,oBAAoB,MAAM;AAAA,MAClD,CAAC;AAAA,IACH,CAAC;AACD,UAAM,OAAO,MAAM,MAAM,UAAU,CAAC,GACjC,IAAI,CAAC,MAAM,EAAE,EAAE,EACf,OAAO,CAAC,MAAmB,OAAO,MAAM,QAAQ;AACnD,QAAI,IAAI,WAAW,EAAG;AACtB,UAAM,KAAK,QAAQ,oBAAoB,SAAS,WAAW;AAAA,MACzD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU,EAAE,WAAW,IAAI,CAAC;AAAA,IACzC,CAAC;AAAA,EACH;AAAA,EAEA,MAAc,QACZ,MACA,MAC8D;AAC9D,UAAM,aAAa,IAAI,gBAAgB;AACvC,UAAM,IAAI,WAAW,MAAM,WAAW,MAAM,GAAG,KAAK,SAAS;AAC7D,QAAI;AACF,YAAM,MAAM,MAAM,KAAK,UAAU,GAAG,KAAK,QAAQ,GAAG,IAAI,IAAI;AAAA,QAC1D,QAAQ,KAAK;AAAA,QACb,SAAS;AAAA,UACP,gBAAgB;AAAA,UAChB,eAAe,UAAU,KAAK,MAAM;AAAA,QACtC;AAAA,QACA,MAAM,KAAK;AAAA,QACX,QAAQ,WAAW;AAAA,MACrB,CAAC;AACD,YAAM,MAAM,MAAM,IAAI,KAAK;AAC3B,UAAI,SAA8D,CAAC;AACnE,UAAI,KAAK;AACP,YAAI;AACF,mBAAS,KAAK,MAAM,GAAG;AAAA,QACzB,QAAQ;AACN,cAAI,CAAC,IAAI,IAAI;AACX,kBAAM,IAAI;AAAA,cACR,WAAW,KAAK,MAAM,IAAI,IAAI,WAAM,IAAI,MAAM,IAAI,IAAI,UAAU,KAAK,IAAI,MAAM,GAAG,GAAG,CAAC;AAAA,YACxF;AAAA,UACF;AAAA,QACF;AAAA,MACF;AACA,UAAI,CAAC,IAAI,MAAO,OAAO,OAAO,SAAS,YAAY,OAAO,SAAS,KAAK,OAAO,SAAS,KAAM;AAC5F,cAAM,IAAI;AAAA,UACR,WAAW,KAAK,MAAM,IAAI,IAAI,WAAM,IAAI,MAAM,IAAI,IAAI,UAAU,GAC9D,OAAO,UAAU,KAAK,OAAO,OAAO,MAAM,EAC5C;AAAA,QACF;AAAA,MACF;AACA,aAAO;AAAA,IACT,UAAE;AACA,mBAAa,CAAC;AAAA,IAChB;AAAA,EACF;AACF;AAqBO,IAAM,yBAAN,MAA+C;AAAA,EAOpD,YAAY,MAAqC;AANjD,gBAAO;AACP,mBAAU;AACV,gBAAO;AAKL,SAAK,UAAU,IAAI,wBAAwB,IAAI;AAAA,EACjD;AAAA,EAEA,MAAM,KAAK,MAAoC;AAAA,EAE/C;AAAA,EAEA,MAAM,MAAM,KAAmC;AAC7C,QAAI;AACJ,QAAI;AACF,YAAM,IAAI,WAA8B,kCAAiB;AAAA,IAC3D,QAAQ;AACN,UAAI,OAAO;AAAA,QACT;AAAA,MACF;AACA;AAAA,IACF;AACA,QAAI,gBAAgB,KAAK,QAAQ,IAAI,KAAK,OAAO;AACjD,QAAI,OAAO;AAAA,MACT,oCAAoC,KAAK,QAAQ,EAAE,0BAA2B,KAAK,QAA4C,QAAQ;AAAA,IACzI;AAAA,EACF;AACF;","names":[]}
package/dist/index.mjs ADDED
@@ -0,0 +1,187 @@
1
+ // src/index.ts
2
+ import { KNOWLEDGE_SERVICE } from "@objectstack/spec/contracts";
3
+ function extractRagflowOptions(source) {
4
+ const opts = source.options ?? {};
5
+ const datasetId = opts.datasetId;
6
+ if (typeof datasetId !== "string" || !datasetId) {
7
+ throw new Error(
8
+ `RAGFlow adapter requires source.options.datasetId on source '${source.id}'`
9
+ );
10
+ }
11
+ return {
12
+ datasetId,
13
+ rerankModel: typeof opts.rerankModel === "string" ? opts.rerankModel : void 0,
14
+ similarityThreshold: typeof opts.similarityThreshold === "number" ? opts.similarityThreshold : void 0,
15
+ vectorSimilarityWeight: typeof opts.vectorSimilarityWeight === "number" ? opts.vectorSimilarityWeight : void 0
16
+ };
17
+ }
18
+ var KnowledgeRagflowAdapter = class {
19
+ constructor(opts) {
20
+ if (!opts.endpoint) throw new Error("RAGFlow adapter: endpoint required");
21
+ if (!opts.apiKey) throw new Error("RAGFlow adapter: apiKey required");
22
+ this.id = opts.id ?? "ragflow";
23
+ this.endpoint = opts.endpoint.replace(/\/+$/, "");
24
+ this.apiKey = opts.apiKey;
25
+ this.fetchImpl = opts.fetch ?? globalThis.fetch;
26
+ this.timeoutMs = opts.timeoutMs ?? 3e4;
27
+ if (!this.fetchImpl) {
28
+ throw new Error("RAGFlow adapter: no fetch available; pass options.fetch");
29
+ }
30
+ }
31
+ async upsert(docs, ctx) {
32
+ const { datasetId } = extractRagflowOptions(ctx.source);
33
+ for (const doc of docs) {
34
+ await this.deleteChunksByDocumentId(datasetId, doc.id);
35
+ await this.request(`/api/v1/datasets/${datasetId}/chunks`, {
36
+ method: "POST",
37
+ body: JSON.stringify({
38
+ content: doc.content,
39
+ // RAGFlow accepts arbitrary metadata used for filtering at
40
+ // retrieval time. We always stamp `objectstack_doc_id` so
41
+ // delete() can find these chunks again.
42
+ important_keywords: doc.title ? [doc.title] : void 0,
43
+ metadata: {
44
+ ...doc.metadata ?? {},
45
+ objectstack_doc_id: doc.id,
46
+ objectstack_source_id: doc.sourceId,
47
+ objectstack_record_id: doc.sourceRecordId,
48
+ title: doc.title
49
+ }
50
+ })
51
+ });
52
+ }
53
+ }
54
+ async delete(documentIds, ctx) {
55
+ const { datasetId } = extractRagflowOptions(ctx.source);
56
+ for (const id of documentIds) {
57
+ await this.deleteChunksByDocumentId(datasetId, id);
58
+ }
59
+ }
60
+ async search(query, opts) {
61
+ const { datasetId, rerankModel, similarityThreshold, vectorSimilarityWeight } = extractRagflowOptions(opts.source);
62
+ const body = {
63
+ question: query,
64
+ dataset_ids: [datasetId],
65
+ top_k: opts.topK,
66
+ keyword: true
67
+ };
68
+ if (rerankModel) body.rerank_id = rerankModel;
69
+ if (typeof similarityThreshold === "number") body.similarity_threshold = similarityThreshold;
70
+ if (typeof vectorSimilarityWeight === "number")
71
+ body.vector_similarity_weight = vectorSimilarityWeight;
72
+ if (opts.filter) body.metadata_condition = { ...opts.filter };
73
+ const res = await this.request("/api/v1/retrieval", {
74
+ method: "POST",
75
+ body: JSON.stringify(body)
76
+ });
77
+ const data = res?.data ?? {};
78
+ const chunks = data.chunks ?? [];
79
+ return chunks.slice(0, opts.topK).map((c) => {
80
+ const md = c.metadata ?? {};
81
+ const docId = md.objectstack_doc_id ?? c.document_id ?? c.doc_id ?? c.id;
82
+ const recordId = md.objectstack_record_id;
83
+ return {
84
+ chunkId: c.id ?? `${docId}#${c.position ?? 0}`,
85
+ documentId: docId ?? c.id ?? "unknown",
86
+ sourceId: opts.source.id,
87
+ sourceRecordId: recordId,
88
+ score: c.similarity ?? c.score ?? 0,
89
+ snippet: c.content ?? c.content_with_weight ?? "",
90
+ title: md.title ?? c.document_name,
91
+ metadata: md
92
+ };
93
+ });
94
+ }
95
+ async healthCheck() {
96
+ try {
97
+ await this.request("/api/v1/datasets?page=1&page_size=1", { method: "GET" });
98
+ return { ok: true };
99
+ } catch (err) {
100
+ return { ok: false, message: err instanceof Error ? err.message : String(err) };
101
+ }
102
+ }
103
+ async deleteChunksByDocumentId(datasetId, docId) {
104
+ const found = await this.request(`/api/v1/retrieval`, {
105
+ method: "POST",
106
+ body: JSON.stringify({
107
+ question: docId,
108
+ dataset_ids: [datasetId],
109
+ top_k: 256,
110
+ keyword: false,
111
+ metadata_condition: { objectstack_doc_id: docId }
112
+ })
113
+ });
114
+ const ids = (found.data?.chunks ?? []).map((c) => c.id).filter((x) => typeof x === "string");
115
+ if (ids.length === 0) return;
116
+ await this.request(`/api/v1/datasets/${datasetId}/chunks`, {
117
+ method: "DELETE",
118
+ body: JSON.stringify({ chunk_ids: ids })
119
+ });
120
+ }
121
+ async request(path, init) {
122
+ const controller = new AbortController();
123
+ const t = setTimeout(() => controller.abort(), this.timeoutMs);
124
+ try {
125
+ const res = await this.fetchImpl(`${this.endpoint}${path}`, {
126
+ method: init.method,
127
+ headers: {
128
+ "content-type": "application/json",
129
+ authorization: `Bearer ${this.apiKey}`
130
+ },
131
+ body: init.body,
132
+ signal: controller.signal
133
+ });
134
+ const raw = await res.text();
135
+ let parsed = {};
136
+ if (raw) {
137
+ try {
138
+ parsed = JSON.parse(raw);
139
+ } catch {
140
+ if (!res.ok) {
141
+ throw new Error(
142
+ `RAGFlow ${init.method} ${path} \u2192 ${res.status} ${res.statusText}: ${raw.slice(0, 200)}`
143
+ );
144
+ }
145
+ }
146
+ }
147
+ if (!res.ok || typeof parsed.code === "number" && parsed.code !== 0 && parsed.code !== 200) {
148
+ throw new Error(
149
+ `RAGFlow ${init.method} ${path} \u2192 ${res.status} ${res.statusText}${parsed.message ? ` (${parsed.message})` : ""}`
150
+ );
151
+ }
152
+ return parsed;
153
+ } finally {
154
+ clearTimeout(t);
155
+ }
156
+ }
157
+ };
158
+ var KnowledgeRagflowPlugin = class {
159
+ constructor(opts) {
160
+ this.name = "com.objectstack.plugin.knowledge-ragflow";
161
+ this.version = "0.1.0";
162
+ this.type = "standard";
163
+ this.adapter = new KnowledgeRagflowAdapter(opts);
164
+ }
165
+ async init(_ctx) {
166
+ }
167
+ async start(ctx) {
168
+ let svc;
169
+ try {
170
+ svc = ctx.getService(KNOWLEDGE_SERVICE);
171
+ } catch {
172
+ ctx.logger.warn?.(
173
+ "KnowledgeRagflowPlugin: IKnowledgeService not registered \u2014 install KnowledgeServicePlugin first."
174
+ );
175
+ return;
176
+ }
177
+ svc.registerAdapter(this.adapter.id, this.adapter);
178
+ ctx.logger.info?.(
179
+ `KnowledgeRagflowPlugin: adapter '${this.adapter.id}' registered (endpoint=${this.adapter.endpoint}).`
180
+ );
181
+ }
182
+ };
183
+ export {
184
+ KnowledgeRagflowAdapter,
185
+ KnowledgeRagflowPlugin
186
+ };
187
+ //# sourceMappingURL=index.mjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/index.ts"],"sourcesContent":["// Copyright (c) 2025 ObjectStack. Licensed under the Apache-2.0 license.\n\nimport type { Plugin, PluginContext } from '@objectstack/core';\nimport type {\n IKnowledgeAdapter,\n IKnowledgeService,\n AdapterContext,\n AdapterSearchOptions,\n} from '@objectstack/spec/contracts';\nimport type {\n KnowledgeDocument,\n KnowledgeHit,\n KnowledgeSource,\n} from '@objectstack/spec/ai';\nimport { KNOWLEDGE_SERVICE } from '@objectstack/spec/contracts';\n\n/**\n * Subset of `fetch` used by the adapter. Inject in tests; defaults to\n * the global `fetch`.\n */\nexport type FetchLike = (\n input: string,\n init?: {\n method?: string;\n headers?: Record<string, string>;\n body?: string;\n signal?: AbortSignal;\n },\n) => Promise<{\n ok: boolean;\n status: number;\n statusText: string;\n text(): Promise<string>;\n json(): Promise<unknown>;\n}>;\n\nexport interface KnowledgeRagflowAdapterOptions {\n /** RAGFlow endpoint, e.g. `http://localhost:9380`. */\n endpoint: string;\n /** RAGFlow API key (Bearer token). */\n apiKey: string;\n /** Adapter id. @default 'ragflow' */\n id?: string;\n /** Override `fetch` for tests. */\n fetch?: FetchLike;\n /** Request timeout in milliseconds. @default 30000 */\n timeoutMs?: number;\n}\n\ninterface RagflowSourceOptions {\n datasetId: string;\n /** Optional rerank model id (overrides dataset default). */\n rerankModel?: string;\n /** Optional similarity threshold passed through to RAGFlow. */\n similarityThreshold?: number;\n /** Optional vector vs keyword weight in [0,1]. */\n vectorSimilarityWeight?: number;\n}\n\nfunction extractRagflowOptions(source: KnowledgeSource): RagflowSourceOptions {\n const opts = ((source as unknown as { options?: Record<string, unknown> }).options ?? {}) as\n Record<string, unknown>;\n const datasetId = opts.datasetId;\n if (typeof datasetId !== 'string' || !datasetId) {\n throw new Error(\n `RAGFlow adapter requires source.options.datasetId on source '${source.id}'`,\n );\n }\n return {\n datasetId,\n rerankModel: typeof opts.rerankModel === 'string' ? opts.rerankModel : undefined,\n similarityThreshold:\n typeof opts.similarityThreshold === 'number' ? opts.similarityThreshold : undefined,\n vectorSimilarityWeight:\n typeof opts.vectorSimilarityWeight === 'number'\n ? opts.vectorSimilarityWeight\n : undefined,\n };\n}\n\n/**\n * RAGFlow adapter. Maps {@link KnowledgeDocument} upserts to the\n * dataset's chunk API, delegates retrieval to `/api/v1/retrieval`, and\n * returns {@link KnowledgeHit}s with `sourceRecordId` preserved so the\n * orchestrator can run a permission re-check.\n */\nexport class KnowledgeRagflowAdapter implements IKnowledgeAdapter {\n readonly id: string;\n private readonly endpoint: string;\n private readonly apiKey: string;\n private readonly fetchImpl: FetchLike;\n private readonly timeoutMs: number;\n\n constructor(opts: KnowledgeRagflowAdapterOptions) {\n if (!opts.endpoint) throw new Error('RAGFlow adapter: endpoint required');\n if (!opts.apiKey) throw new Error('RAGFlow adapter: apiKey required');\n this.id = opts.id ?? 'ragflow';\n this.endpoint = opts.endpoint.replace(/\\/+$/, '');\n this.apiKey = opts.apiKey;\n this.fetchImpl = opts.fetch ?? ((globalThis as { fetch?: FetchLike }).fetch as FetchLike);\n this.timeoutMs = opts.timeoutMs ?? 30000;\n if (!this.fetchImpl) {\n throw new Error('RAGFlow adapter: no fetch available; pass options.fetch');\n }\n }\n\n async upsert(docs: KnowledgeDocument[], ctx: AdapterContext): Promise<void> {\n const { datasetId } = extractRagflowOptions(ctx.source);\n // RAGFlow models documents in two layers: documents (file-like) and\n // chunks (text blocks). We treat each KnowledgeDocument as a single\n // chunk-set: delete existing chunks with the same external id, then\n // upload as `content` chunks tagged with our document id.\n for (const doc of docs) {\n await this.deleteChunksByDocumentId(datasetId, doc.id);\n await this.request(`/api/v1/datasets/${datasetId}/chunks`, {\n method: 'POST',\n body: JSON.stringify({\n content: doc.content,\n // RAGFlow accepts arbitrary metadata used for filtering at\n // retrieval time. We always stamp `objectstack_doc_id` so\n // delete() can find these chunks again.\n important_keywords: doc.title ? [doc.title] : undefined,\n metadata: {\n ...(doc.metadata ?? {}),\n objectstack_doc_id: doc.id,\n objectstack_source_id: doc.sourceId,\n objectstack_record_id: doc.sourceRecordId,\n title: doc.title,\n },\n }),\n });\n }\n }\n\n async delete(documentIds: string[], ctx: AdapterContext): Promise<void> {\n const { datasetId } = extractRagflowOptions(ctx.source);\n for (const id of documentIds) {\n await this.deleteChunksByDocumentId(datasetId, id);\n }\n }\n\n async search(query: string, opts: AdapterSearchOptions): Promise<KnowledgeHit[]> {\n const { datasetId, rerankModel, similarityThreshold, vectorSimilarityWeight } =\n extractRagflowOptions(opts.source);\n const body: Record<string, unknown> = {\n question: query,\n dataset_ids: [datasetId],\n top_k: opts.topK,\n keyword: true,\n };\n if (rerankModel) body.rerank_id = rerankModel;\n if (typeof similarityThreshold === 'number') body.similarity_threshold = similarityThreshold;\n if (typeof vectorSimilarityWeight === 'number')\n body.vector_similarity_weight = vectorSimilarityWeight;\n if (opts.filter) body.metadata_condition = { ...opts.filter };\n\n const res = await this.request('/api/v1/retrieval', {\n method: 'POST',\n body: JSON.stringify(body),\n });\n const data = (res?.data ?? {}) as { chunks?: RagflowChunkHit[] };\n const chunks = data.chunks ?? [];\n return chunks.slice(0, opts.topK).map<KnowledgeHit>((c) => {\n const md = (c.metadata ?? {}) as Record<string, unknown>;\n const docId =\n (md.objectstack_doc_id as string | undefined) ??\n c.document_id ??\n c.doc_id ??\n c.id;\n const recordId = md.objectstack_record_id as string | undefined;\n return {\n chunkId: c.id ?? `${docId}#${c.position ?? 0}`,\n documentId: docId ?? c.id ?? 'unknown',\n sourceId: opts.source.id,\n sourceRecordId: recordId,\n score: c.similarity ?? c.score ?? 0,\n snippet: c.content ?? c.content_with_weight ?? '',\n title: (md.title as string | undefined) ?? c.document_name,\n metadata: md,\n };\n });\n }\n\n async healthCheck(): Promise<{ ok: boolean; message?: string }> {\n try {\n await this.request('/api/v1/datasets?page=1&page_size=1', { method: 'GET' });\n return { ok: true };\n } catch (err) {\n return { ok: false, message: err instanceof Error ? err.message : String(err) };\n }\n }\n\n private async deleteChunksByDocumentId(datasetId: string, docId: string): Promise<void> {\n // Find chunks with our stamped metadata, then delete by chunk id.\n const found = (await this.request(`/api/v1/retrieval`, {\n method: 'POST',\n body: JSON.stringify({\n question: docId,\n dataset_ids: [datasetId],\n top_k: 256,\n keyword: false,\n metadata_condition: { objectstack_doc_id: docId },\n }),\n })) as { data?: { chunks?: Array<{ id?: string }> } };\n const ids = (found.data?.chunks ?? [])\n .map((c) => c.id)\n .filter((x): x is string => typeof x === 'string');\n if (ids.length === 0) return;\n await this.request(`/api/v1/datasets/${datasetId}/chunks`, {\n method: 'DELETE',\n body: JSON.stringify({ chunk_ids: ids }),\n });\n }\n\n private async request(\n path: string,\n init: { method: string; body?: string },\n ): Promise<{ data?: unknown; code?: number; message?: string }> {\n const controller = new AbortController();\n const t = setTimeout(() => controller.abort(), this.timeoutMs);\n try {\n const res = await this.fetchImpl(`${this.endpoint}${path}`, {\n method: init.method,\n headers: {\n 'content-type': 'application/json',\n authorization: `Bearer ${this.apiKey}`,\n },\n body: init.body,\n signal: controller.signal,\n });\n const raw = await res.text();\n let parsed: { data?: unknown; code?: number; message?: string } = {};\n if (raw) {\n try {\n parsed = JSON.parse(raw) as typeof parsed;\n } catch {\n if (!res.ok) {\n throw new Error(\n `RAGFlow ${init.method} ${path} → ${res.status} ${res.statusText}: ${raw.slice(0, 200)}`,\n );\n }\n }\n }\n if (!res.ok || (typeof parsed.code === 'number' && parsed.code !== 0 && parsed.code !== 200)) {\n throw new Error(\n `RAGFlow ${init.method} ${path} → ${res.status} ${res.statusText}${\n parsed.message ? ` (${parsed.message})` : ''\n }`,\n );\n }\n return parsed;\n } finally {\n clearTimeout(t);\n }\n }\n}\n\ninterface RagflowChunkHit {\n id?: string;\n document_id?: string;\n doc_id?: string;\n document_name?: string;\n content?: string;\n content_with_weight?: string;\n similarity?: number;\n score?: number;\n position?: number;\n metadata?: Record<string, unknown>;\n}\n\n/* ---------------------------------------------------------------- */\n/* Kernel plugin glue */\n/* ---------------------------------------------------------------- */\n\nexport interface KnowledgeRagflowPluginOptions extends KnowledgeRagflowAdapterOptions {}\n\nexport class KnowledgeRagflowPlugin implements Plugin {\n name = 'com.objectstack.plugin.knowledge-ragflow';\n version = '0.1.0';\n type = 'standard';\n\n private readonly adapter: KnowledgeRagflowAdapter;\n\n constructor(opts: KnowledgeRagflowPluginOptions) {\n this.adapter = new KnowledgeRagflowAdapter(opts);\n }\n\n async init(_ctx: PluginContext): Promise<void> {\n // No-op: actual registration happens in start() once service is available.\n }\n\n async start(ctx: PluginContext): Promise<void> {\n let svc: IKnowledgeService | undefined;\n try {\n svc = ctx.getService<IKnowledgeService>(KNOWLEDGE_SERVICE);\n } catch {\n ctx.logger.warn?.(\n 'KnowledgeRagflowPlugin: IKnowledgeService not registered — install KnowledgeServicePlugin first.',\n );\n return;\n }\n svc.registerAdapter(this.adapter.id, this.adapter);\n ctx.logger.info?.(\n `KnowledgeRagflowPlugin: adapter '${this.adapter.id}' registered (endpoint=${(this.adapter as unknown as { endpoint: string }).endpoint}).`,\n );\n }\n}\n"],"mappings":";AAcA,SAAS,yBAAyB;AA6ClC,SAAS,sBAAsB,QAA+C;AAC5E,QAAM,OAAS,OAA4D,WAAW,CAAC;AAEvF,QAAM,YAAY,KAAK;AACvB,MAAI,OAAO,cAAc,YAAY,CAAC,WAAW;AAC/C,UAAM,IAAI;AAAA,MACR,gEAAgE,OAAO,EAAE;AAAA,IAC3E;AAAA,EACF;AACA,SAAO;AAAA,IACL;AAAA,IACA,aAAa,OAAO,KAAK,gBAAgB,WAAW,KAAK,cAAc;AAAA,IACvE,qBACE,OAAO,KAAK,wBAAwB,WAAW,KAAK,sBAAsB;AAAA,IAC5E,wBACE,OAAO,KAAK,2BAA2B,WACnC,KAAK,yBACL;AAAA,EACR;AACF;AAQO,IAAM,0BAAN,MAA2D;AAAA,EAOhE,YAAY,MAAsC;AAChD,QAAI,CAAC,KAAK,SAAU,OAAM,IAAI,MAAM,oCAAoC;AACxE,QAAI,CAAC,KAAK,OAAQ,OAAM,IAAI,MAAM,kCAAkC;AACpE,SAAK,KAAK,KAAK,MAAM;AACrB,SAAK,WAAW,KAAK,SAAS,QAAQ,QAAQ,EAAE;AAChD,SAAK,SAAS,KAAK;AACnB,SAAK,YAAY,KAAK,SAAW,WAAqC;AACtE,SAAK,YAAY,KAAK,aAAa;AACnC,QAAI,CAAC,KAAK,WAAW;AACnB,YAAM,IAAI,MAAM,yDAAyD;AAAA,IAC3E;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,MAA2B,KAAoC;AAC1E,UAAM,EAAE,UAAU,IAAI,sBAAsB,IAAI,MAAM;AAKtD,eAAW,OAAO,MAAM;AACtB,YAAM,KAAK,yBAAyB,WAAW,IAAI,EAAE;AACrD,YAAM,KAAK,QAAQ,oBAAoB,SAAS,WAAW;AAAA,QACzD,QAAQ;AAAA,QACR,MAAM,KAAK,UAAU;AAAA,UACnB,SAAS,IAAI;AAAA;AAAA;AAAA;AAAA,UAIb,oBAAoB,IAAI,QAAQ,CAAC,IAAI,KAAK,IAAI;AAAA,UAC9C,UAAU;AAAA,YACR,GAAI,IAAI,YAAY,CAAC;AAAA,YACrB,oBAAoB,IAAI;AAAA,YACxB,uBAAuB,IAAI;AAAA,YAC3B,uBAAuB,IAAI;AAAA,YAC3B,OAAO,IAAI;AAAA,UACb;AAAA,QACF,CAAC;AAAA,MACH,CAAC;AAAA,IACH;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,aAAuB,KAAoC;AACtE,UAAM,EAAE,UAAU,IAAI,sBAAsB,IAAI,MAAM;AACtD,eAAW,MAAM,aAAa;AAC5B,YAAM,KAAK,yBAAyB,WAAW,EAAE;AAAA,IACnD;AAAA,EACF;AAAA,EAEA,MAAM,OAAO,OAAe,MAAqD;AAC/E,UAAM,EAAE,WAAW,aAAa,qBAAqB,uBAAuB,IAC1E,sBAAsB,KAAK,MAAM;AACnC,UAAM,OAAgC;AAAA,MACpC,UAAU;AAAA,MACV,aAAa,CAAC,SAAS;AAAA,MACvB,OAAO,KAAK;AAAA,MACZ,SAAS;AAAA,IACX;AACA,QAAI,YAAa,MAAK,YAAY;AAClC,QAAI,OAAO,wBAAwB,SAAU,MAAK,uBAAuB;AACzE,QAAI,OAAO,2BAA2B;AACpC,WAAK,2BAA2B;AAClC,QAAI,KAAK,OAAQ,MAAK,qBAAqB,EAAE,GAAG,KAAK,OAAO;AAE5D,UAAM,MAAM,MAAM,KAAK,QAAQ,qBAAqB;AAAA,MAClD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU,IAAI;AAAA,IAC3B,CAAC;AACD,UAAM,OAAQ,KAAK,QAAQ,CAAC;AAC5B,UAAM,SAAS,KAAK,UAAU,CAAC;AAC/B,WAAO,OAAO,MAAM,GAAG,KAAK,IAAI,EAAE,IAAkB,CAAC,MAAM;AACzD,YAAM,KAAM,EAAE,YAAY,CAAC;AAC3B,YAAM,QACH,GAAG,sBACJ,EAAE,eACF,EAAE,UACF,EAAE;AACJ,YAAM,WAAW,GAAG;AACpB,aAAO;AAAA,QACL,SAAS,EAAE,MAAM,GAAG,KAAK,IAAI,EAAE,YAAY,CAAC;AAAA,QAC5C,YAAY,SAAS,EAAE,MAAM;AAAA,QAC7B,UAAU,KAAK,OAAO;AAAA,QACtB,gBAAgB;AAAA,QAChB,OAAO,EAAE,cAAc,EAAE,SAAS;AAAA,QAClC,SAAS,EAAE,WAAW,EAAE,uBAAuB;AAAA,QAC/C,OAAQ,GAAG,SAAgC,EAAE;AAAA,QAC7C,UAAU;AAAA,MACZ;AAAA,IACF,CAAC;AAAA,EACH;AAAA,EAEA,MAAM,cAA0D;AAC9D,QAAI;AACF,YAAM,KAAK,QAAQ,uCAAuC,EAAE,QAAQ,MAAM,CAAC;AAC3E,aAAO,EAAE,IAAI,KAAK;AAAA,IACpB,SAAS,KAAK;AACZ,aAAO,EAAE,IAAI,OAAO,SAAS,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,EAAE;AAAA,IAChF;AAAA,EACF;AAAA,EAEA,MAAc,yBAAyB,WAAmB,OAA8B;AAEtF,UAAM,QAAS,MAAM,KAAK,QAAQ,qBAAqB;AAAA,MACrD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU;AAAA,QACnB,UAAU;AAAA,QACV,aAAa,CAAC,SAAS;AAAA,QACvB,OAAO;AAAA,QACP,SAAS;AAAA,QACT,oBAAoB,EAAE,oBAAoB,MAAM;AAAA,MAClD,CAAC;AAAA,IACH,CAAC;AACD,UAAM,OAAO,MAAM,MAAM,UAAU,CAAC,GACjC,IAAI,CAAC,MAAM,EAAE,EAAE,EACf,OAAO,CAAC,MAAmB,OAAO,MAAM,QAAQ;AACnD,QAAI,IAAI,WAAW,EAAG;AACtB,UAAM,KAAK,QAAQ,oBAAoB,SAAS,WAAW;AAAA,MACzD,QAAQ;AAAA,MACR,MAAM,KAAK,UAAU,EAAE,WAAW,IAAI,CAAC;AAAA,IACzC,CAAC;AAAA,EACH;AAAA,EAEA,MAAc,QACZ,MACA,MAC8D;AAC9D,UAAM,aAAa,IAAI,gBAAgB;AACvC,UAAM,IAAI,WAAW,MAAM,WAAW,MAAM,GAAG,KAAK,SAAS;AAC7D,QAAI;AACF,YAAM,MAAM,MAAM,KAAK,UAAU,GAAG,KAAK,QAAQ,GAAG,IAAI,IAAI;AAAA,QAC1D,QAAQ,KAAK;AAAA,QACb,SAAS;AAAA,UACP,gBAAgB;AAAA,UAChB,eAAe,UAAU,KAAK,MAAM;AAAA,QACtC;AAAA,QACA,MAAM,KAAK;AAAA,QACX,QAAQ,WAAW;AAAA,MACrB,CAAC;AACD,YAAM,MAAM,MAAM,IAAI,KAAK;AAC3B,UAAI,SAA8D,CAAC;AACnE,UAAI,KAAK;AACP,YAAI;AACF,mBAAS,KAAK,MAAM,GAAG;AAAA,QACzB,QAAQ;AACN,cAAI,CAAC,IAAI,IAAI;AACX,kBAAM,IAAI;AAAA,cACR,WAAW,KAAK,MAAM,IAAI,IAAI,WAAM,IAAI,MAAM,IAAI,IAAI,UAAU,KAAK,IAAI,MAAM,GAAG,GAAG,CAAC;AAAA,YACxF;AAAA,UACF;AAAA,QACF;AAAA,MACF;AACA,UAAI,CAAC,IAAI,MAAO,OAAO,OAAO,SAAS,YAAY,OAAO,SAAS,KAAK,OAAO,SAAS,KAAM;AAC5F,cAAM,IAAI;AAAA,UACR,WAAW,KAAK,MAAM,IAAI,IAAI,WAAM,IAAI,MAAM,IAAI,IAAI,UAAU,GAC9D,OAAO,UAAU,KAAK,OAAO,OAAO,MAAM,EAC5C;AAAA,QACF;AAAA,MACF;AACA,aAAO;AAAA,IACT,UAAE;AACA,mBAAa,CAAC;AAAA,IAChB;AAAA,EACF;AACF;AAqBO,IAAM,yBAAN,MAA+C;AAAA,EAOpD,YAAY,MAAqC;AANjD,gBAAO;AACP,mBAAU;AACV,gBAAO;AAKL,SAAK,UAAU,IAAI,wBAAwB,IAAI;AAAA,EACjD;AAAA,EAEA,MAAM,KAAK,MAAoC;AAAA,EAE/C;AAAA,EAEA,MAAM,MAAM,KAAmC;AAC7C,QAAI;AACJ,QAAI;AACF,YAAM,IAAI,WAA8B,iBAAiB;AAAA,IAC3D,QAAQ;AACN,UAAI,OAAO;AAAA,QACT;AAAA,MACF;AACA;AAAA,IACF;AACA,QAAI,gBAAgB,KAAK,QAAQ,IAAI,KAAK,OAAO;AACjD,QAAI,OAAO;AAAA,MACT,oCAAoC,KAAK,QAAQ,EAAE,0BAA2B,KAAK,QAA4C,QAAQ;AAAA,IACzI;AAAA,EACF;AACF;","names":[]}
package/package.json ADDED
@@ -0,0 +1,36 @@
1
+ {
2
+ "name": "@objectstack/knowledge-ragflow",
3
+ "version": "6.4.0",
4
+ "license": "Apache-2.0",
5
+ "description": "RAGFlow knowledge adapter for ObjectStack — production-grade RAG via the Apache 2.0 RAGFlow REST API.",
6
+ "main": "dist/index.js",
7
+ "types": "dist/index.d.ts",
8
+ "exports": {
9
+ ".": {
10
+ "types": "./dist/index.d.ts",
11
+ "import": "./dist/index.mjs",
12
+ "require": "./dist/index.js"
13
+ }
14
+ },
15
+ "dependencies": {
16
+ "@objectstack/core": "6.4.0",
17
+ "@objectstack/service-knowledge": "6.4.0",
18
+ "@objectstack/spec": "6.4.0"
19
+ },
20
+ "devDependencies": {
21
+ "@types/node": "^25.9.1",
22
+ "typescript": "^6.0.3",
23
+ "vitest": "^4.1.7"
24
+ },
25
+ "keywords": [
26
+ "objectstack",
27
+ "knowledge",
28
+ "rag",
29
+ "ragflow"
30
+ ],
31
+ "scripts": {
32
+ "build": "tsup --config ../../../tsup.config.ts",
33
+ "dev": "tsc -w",
34
+ "test": "vitest run"
35
+ }
36
+ }
@@ -0,0 +1,160 @@
1
+ // Copyright (c) 2025 ObjectStack. Licensed under the Apache-2.0 license.
2
+
3
+ import { describe, it, expect } from 'vitest';
4
+ import { KnowledgeRagflowAdapter, type FetchLike } from '../index';
5
+ import type { KnowledgeSource, KnowledgeDocument } from '@objectstack/spec/ai';
6
+
7
+ const source: KnowledgeSource = {
8
+ id: 'docs',
9
+ label: 'Docs',
10
+ adapter: 'ragflow',
11
+ source: { kind: 'http', urls: ['https://docs.example.com'] } as KnowledgeSource['source'],
12
+ options: { datasetId: 'ds_42' },
13
+ };
14
+
15
+ function fakeFetch(handler: (url: string, init?: any) => unknown): { fetch: FetchLike; calls: Array<{ url: string; init: any }> } {
16
+ const calls: Array<{ url: string; init: any }> = [];
17
+ const fetch: FetchLike = async (url, init) => {
18
+ calls.push({ url, init });
19
+ const out = await Promise.resolve(handler(url, init));
20
+ const body = typeof out === 'string' ? out : JSON.stringify(out ?? {});
21
+ return {
22
+ ok: true,
23
+ status: 200,
24
+ statusText: 'OK',
25
+ text: async () => body,
26
+ json: async () => JSON.parse(body),
27
+ };
28
+ };
29
+ return { fetch, calls };
30
+ }
31
+
32
+ describe('KnowledgeRagflowAdapter', () => {
33
+ it('rejects sources without datasetId', async () => {
34
+ const { fetch } = fakeFetch(() => ({}));
35
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://x', apiKey: 'k', fetch });
36
+ const bad: KnowledgeSource = { ...source, options: {} as Record<string, unknown> };
37
+ await expect(a.search('q', { source: bad, topK: 1 })).rejects.toThrow(/datasetId/);
38
+ });
39
+
40
+ it('upsert deletes-then-creates chunks and stamps objectstack metadata', async () => {
41
+ const { fetch, calls } = fakeFetch((url) => {
42
+ if (url.includes('/api/v1/retrieval')) return { code: 0, data: { chunks: [] } };
43
+ return { code: 0, data: {} };
44
+ });
45
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
46
+ const doc: KnowledgeDocument = {
47
+ id: 'd1',
48
+ sourceId: 'docs',
49
+ sourceRecordId: 'rec_1',
50
+ content: 'hello world',
51
+ title: 'Greeting',
52
+ metadata: { topic: 'intro' },
53
+ };
54
+ await a.upsert([doc], { source });
55
+ // First call: lookup existing chunks; second: create chunk
56
+ const createCall = calls.find((c) => c.url.endsWith('/api/v1/datasets/ds_42/chunks') && c.init.method === 'POST');
57
+ expect(createCall).toBeDefined();
58
+ const body = JSON.parse(createCall!.init.body);
59
+ expect(body.content).toBe('hello world');
60
+ expect(body.metadata.objectstack_doc_id).toBe('d1');
61
+ expect(body.metadata.objectstack_record_id).toBe('rec_1');
62
+ expect(body.metadata.objectstack_source_id).toBe('docs');
63
+ expect(body.metadata.topic).toBe('intro');
64
+ });
65
+
66
+ it('search maps ragflow chunks to KnowledgeHit shape', async () => {
67
+ const { fetch, calls } = fakeFetch(() => ({
68
+ code: 0,
69
+ data: {
70
+ chunks: [
71
+ {
72
+ id: 'c1',
73
+ content: 'snippet one',
74
+ similarity: 0.91,
75
+ metadata: { objectstack_doc_id: 'd1', objectstack_record_id: 'rec_1', title: 'T1' },
76
+ },
77
+ {
78
+ id: 'c2',
79
+ content: 'snippet two',
80
+ similarity: 0.7,
81
+ metadata: { objectstack_doc_id: 'd2' },
82
+ },
83
+ ],
84
+ },
85
+ }));
86
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
87
+ const hits = await a.search('hello', { source, topK: 5 });
88
+ expect(hits).toHaveLength(2);
89
+ expect(hits[0]).toMatchObject({
90
+ chunkId: 'c1',
91
+ documentId: 'd1',
92
+ sourceId: 'docs',
93
+ sourceRecordId: 'rec_1',
94
+ score: 0.91,
95
+ snippet: 'snippet one',
96
+ title: 'T1',
97
+ });
98
+ expect(hits[1].sourceRecordId).toBeUndefined();
99
+ // Authorization header present
100
+ const last = calls.at(-1)!;
101
+ expect(last.init.headers.authorization).toBe('Bearer k');
102
+ });
103
+
104
+ it('search honours rerankModel + similarityThreshold + filter', async () => {
105
+ const { fetch, calls } = fakeFetch(() => ({ code: 0, data: { chunks: [] } }));
106
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
107
+ const s: KnowledgeSource = {
108
+ ...source,
109
+ options: { datasetId: 'ds_42', rerankModel: 'bge-reranker', similarityThreshold: 0.6 },
110
+ };
111
+ await a.search('q', { source: s, topK: 3, filter: { tag: 'a' } });
112
+ const body = JSON.parse(calls[0].init.body);
113
+ expect(body.rerank_id).toBe('bge-reranker');
114
+ expect(body.similarity_threshold).toBe(0.6);
115
+ expect(body.metadata_condition).toEqual({ tag: 'a' });
116
+ expect(body.top_k).toBe(3);
117
+ });
118
+
119
+ it('delete looks up chunks then issues DELETE with chunk_ids', async () => {
120
+ const { fetch, calls } = fakeFetch((url) => {
121
+ if (url.includes('/api/v1/retrieval')) {
122
+ return { code: 0, data: { chunks: [{ id: 'c1' }, { id: 'c2' }] } };
123
+ }
124
+ return { code: 0, data: {} };
125
+ });
126
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
127
+ await a.delete(['d1'], { source });
128
+ const del = calls.find((c) => c.init.method === 'DELETE');
129
+ expect(del).toBeDefined();
130
+ expect(JSON.parse(del!.init.body)).toEqual({ chunk_ids: ['c1', 'c2'] });
131
+ });
132
+
133
+ it('healthCheck pings dataset list', async () => {
134
+ const { fetch } = fakeFetch(() => ({ code: 0, data: { datasets: [] } }));
135
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
136
+ const h = await a.healthCheck();
137
+ expect(h.ok).toBe(true);
138
+ });
139
+
140
+ it('healthCheck reports failure when request throws', async () => {
141
+ const fetch: FetchLike = async () => {
142
+ throw new Error('boom');
143
+ };
144
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
145
+ const h = await a.healthCheck();
146
+ expect(h.ok).toBe(false);
147
+ expect(h.message).toMatch(/boom/);
148
+ });
149
+
150
+ it('throws on non-zero RAGFlow error code', async () => {
151
+ const { fetch } = fakeFetch(() => ({ code: 102, message: 'bad request' }));
152
+ const a = new KnowledgeRagflowAdapter({ endpoint: 'http://r', apiKey: 'k', fetch });
153
+ await expect(a.search('q', { source, topK: 1 })).rejects.toThrow(/bad request/);
154
+ });
155
+
156
+ it('constructor validates endpoint and apiKey', () => {
157
+ expect(() => new KnowledgeRagflowAdapter({ endpoint: '', apiKey: 'k', fetch: (async () => ({}) as any) })).toThrow(/endpoint/);
158
+ expect(() => new KnowledgeRagflowAdapter({ endpoint: 'http://x', apiKey: '', fetch: (async () => ({}) as any) })).toThrow(/apiKey/);
159
+ });
160
+ });