@objectstack/embedder-openai 6.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.turbo/turbo-build.log +22 -0
- package/CHANGELOG.md +45 -0
- package/LICENSE +202 -0
- package/README.md +121 -0
- package/dist/index.d.mts +132 -0
- package/dist/index.d.ts +132 -0
- package/dist/index.js +124 -0
- package/dist/index.js.map +1 -0
- package/dist/index.mjs +97 -0
- package/dist/index.mjs.map +1 -0
- package/package.json +40 -0
- package/src/__tests__/openai-embedder.test.ts +166 -0
- package/src/index.ts +222 -0
- package/tsconfig.json +20 -0
- package/vitest.config.ts +17 -0
package/dist/index.js
ADDED
|
@@ -0,0 +1,124 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __defProp = Object.defineProperty;
|
|
3
|
+
var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
|
|
4
|
+
var __getOwnPropNames = Object.getOwnPropertyNames;
|
|
5
|
+
var __hasOwnProp = Object.prototype.hasOwnProperty;
|
|
6
|
+
var __export = (target, all) => {
|
|
7
|
+
for (var name in all)
|
|
8
|
+
__defProp(target, name, { get: all[name], enumerable: true });
|
|
9
|
+
};
|
|
10
|
+
var __copyProps = (to, from, except, desc) => {
|
|
11
|
+
if (from && typeof from === "object" || typeof from === "function") {
|
|
12
|
+
for (let key of __getOwnPropNames(from))
|
|
13
|
+
if (!__hasOwnProp.call(to, key) && key !== except)
|
|
14
|
+
__defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
|
|
15
|
+
}
|
|
16
|
+
return to;
|
|
17
|
+
};
|
|
18
|
+
var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
|
|
19
|
+
|
|
20
|
+
// src/index.ts
|
|
21
|
+
var index_exports = {};
|
|
22
|
+
__export(index_exports, {
|
|
23
|
+
OPENAI_COMPATIBLE_PRESETS: () => OPENAI_COMPATIBLE_PRESETS,
|
|
24
|
+
OpenAIEmbedder: () => OpenAIEmbedder,
|
|
25
|
+
createOpenAIEmbedder: () => createOpenAIEmbedder,
|
|
26
|
+
default: () => index_default
|
|
27
|
+
});
|
|
28
|
+
module.exports = __toCommonJS(index_exports);
|
|
29
|
+
var KNOWN_DIMENSIONS = {
|
|
30
|
+
// OpenAI
|
|
31
|
+
"text-embedding-3-small": 1536,
|
|
32
|
+
"text-embedding-3-large": 3072,
|
|
33
|
+
"text-embedding-ada-002": 1536,
|
|
34
|
+
// 阿里通义
|
|
35
|
+
"text-embedding-v3": 1024,
|
|
36
|
+
"text-embedding-v2": 1536,
|
|
37
|
+
"text-embedding-v1": 1536,
|
|
38
|
+
// 智谱
|
|
39
|
+
"embedding-3": 2048,
|
|
40
|
+
"embedding-2": 1024,
|
|
41
|
+
// 硅基流动 / BGE 家族
|
|
42
|
+
"BAAI/bge-m3": 1024,
|
|
43
|
+
"BAAI/bge-large-zh-v1.5": 1024,
|
|
44
|
+
"BAAI/bge-large-en-v1.5": 1024,
|
|
45
|
+
"BAAI/bge-base-zh-v1.5": 768,
|
|
46
|
+
"BAAI/bge-small-zh-v1.5": 512,
|
|
47
|
+
"bge-m3": 1024,
|
|
48
|
+
// 火山 Doubao
|
|
49
|
+
"doubao-embedding-large-text-240915": 4096,
|
|
50
|
+
"doubao-embedding-text-240715": 2048,
|
|
51
|
+
// Nomic / Ollama defaults
|
|
52
|
+
"nomic-embed-text": 768,
|
|
53
|
+
// MiniMax
|
|
54
|
+
"embo-01": 1536
|
|
55
|
+
};
|
|
56
|
+
var OpenAIEmbedder = class {
|
|
57
|
+
constructor(opts) {
|
|
58
|
+
if (!opts.apiKey) throw new Error("OpenAIEmbedder: apiKey required");
|
|
59
|
+
this.apiKey = opts.apiKey;
|
|
60
|
+
this.id = opts.id ?? "openai";
|
|
61
|
+
this.model = opts.model ?? "text-embedding-3-small";
|
|
62
|
+
this.baseUrl = (opts.baseUrl ?? "https://api.openai.com/v1").replace(/\/+$/, "");
|
|
63
|
+
this.fetchImpl = opts.fetch ?? globalThis.fetch;
|
|
64
|
+
this.requestedDims = opts.dimensions;
|
|
65
|
+
this.extraHeaders = opts.headers ?? {};
|
|
66
|
+
this.dimensions = opts.dimensions ?? KNOWN_DIMENSIONS[this.model] ?? 1536;
|
|
67
|
+
if (!this.fetchImpl) {
|
|
68
|
+
throw new Error(
|
|
69
|
+
"OpenAIEmbedder: no fetch available; pass options.fetch or run on Node 18+ / a fetch-capable runtime"
|
|
70
|
+
);
|
|
71
|
+
}
|
|
72
|
+
}
|
|
73
|
+
async embed(texts) {
|
|
74
|
+
if (texts.length === 0) return [];
|
|
75
|
+
const body = { model: this.model, input: texts };
|
|
76
|
+
if (this.requestedDims) body.dimensions = this.requestedDims;
|
|
77
|
+
const res = await this.fetchImpl(`${this.baseUrl}/embeddings`, {
|
|
78
|
+
method: "POST",
|
|
79
|
+
headers: {
|
|
80
|
+
"content-type": "application/json",
|
|
81
|
+
authorization: `Bearer ${this.apiKey}`,
|
|
82
|
+
...this.extraHeaders
|
|
83
|
+
},
|
|
84
|
+
body: JSON.stringify(body)
|
|
85
|
+
});
|
|
86
|
+
if (!res.ok) {
|
|
87
|
+
const text = await res.text().catch(() => "");
|
|
88
|
+
throw new Error(
|
|
89
|
+
`OpenAIEmbedder (${this.baseUrl}) \u2192 ${res.status} ${res.statusText}${text ? `: ${text.slice(0, 200)}` : ""}`
|
|
90
|
+
);
|
|
91
|
+
}
|
|
92
|
+
const json = await res.json();
|
|
93
|
+
const data = json.data ?? [];
|
|
94
|
+
if (data.length !== texts.length) {
|
|
95
|
+
throw new Error(
|
|
96
|
+
`OpenAIEmbedder: expected ${texts.length} vectors, got ${data.length}`
|
|
97
|
+
);
|
|
98
|
+
}
|
|
99
|
+
return data.map((d) => d.embedding);
|
|
100
|
+
}
|
|
101
|
+
};
|
|
102
|
+
var OPENAI_COMPATIBLE_PRESETS = {
|
|
103
|
+
openai: "https://api.openai.com/v1",
|
|
104
|
+
azure: "",
|
|
105
|
+
// user must provide full deployment URL via baseUrl
|
|
106
|
+
dashscope: "https://dashscope.aliyuncs.com/compatible-mode/v1",
|
|
107
|
+
zhipu: "https://open.bigmodel.cn/api/paas/v4",
|
|
108
|
+
siliconflow: "https://api.siliconflow.cn/v1",
|
|
109
|
+
doubao: "https://ark.cn-beijing.volces.com/api/v3",
|
|
110
|
+
minimax: "https://api.minimax.chat/v1",
|
|
111
|
+
ollama: "http://localhost:11434/v1"
|
|
112
|
+
};
|
|
113
|
+
function createOpenAIEmbedder(opts) {
|
|
114
|
+
const baseUrl = opts.baseUrl ?? (opts.preset ? OPENAI_COMPATIBLE_PRESETS[opts.preset] : void 0);
|
|
115
|
+
return new OpenAIEmbedder({ ...opts, baseUrl, id: opts.id ?? opts.preset ?? "openai" });
|
|
116
|
+
}
|
|
117
|
+
var index_default = OpenAIEmbedder;
|
|
118
|
+
// Annotate the CommonJS export names for ESM import in node:
|
|
119
|
+
0 && (module.exports = {
|
|
120
|
+
OPENAI_COMPATIBLE_PRESETS,
|
|
121
|
+
OpenAIEmbedder,
|
|
122
|
+
createOpenAIEmbedder
|
|
123
|
+
});
|
|
124
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../src/index.ts"],"sourcesContent":["// Copyright (c) 2026 ObjectStack. Licensed under the Apache-2.0 license.\n\n/**\n * `@objectstack/embedder-openai`\n *\n * OpenAI-compatible embedder. Drop-in for any endpoint that speaks the\n * `POST /v1/embeddings` shape:\n *\n * - OpenAI https://api.openai.com/v1\n * - Azure OpenAI https://{resource}.openai.azure.com/openai/deployments/{deployment}\n * - 阿里通义 DashScope https://dashscope.aliyuncs.com/compatible-mode/v1\n * - 智谱 BigModel https://open.bigmodel.cn/api/paas/v4\n * - 硅基流动 SiliconFlow https://api.siliconflow.cn/v1\n * - 火山引擎 Doubao https://ark.cn-beijing.volces.com/api/v3\n * - MiniMax https://api.minimax.chat/v1\n * - Ollama (openai shim) http://localhost:11434/v1\n * - LiteLLM / vLLM / 任何兼容服务\n *\n * Implements the `IEmbedder` contract from `@objectstack/spec/contracts`.\n */\n\nimport type { IEmbedder } from '@objectstack/spec/contracts';\n\nexport interface OpenAIEmbedderOptions {\n /** Bearer token sent as `Authorization: Bearer <apiKey>`. Required. */\n apiKey: string;\n /**\n * Model id sent in the request body. Choose to match your provider:\n * - OpenAI: `'text-embedding-3-small'` (default), `'text-embedding-3-large'`\n * - 阿里通义: `'text-embedding-v3'`\n * - 智谱: `'embedding-3'`\n * - 硅基流动: `'BAAI/bge-m3'`, `'BAAI/bge-large-zh-v1.5'`\n * - 火山 Doubao: `'doubao-embedding-large-text-240915'`\n * - Ollama: `'bge-m3'`, `'nomic-embed-text'`\n *\n * @default 'text-embedding-3-small'\n */\n model?: string;\n /**\n * Override dimensions. Only Matryoshka-style models (OpenAI v3, 智谱 embedding-3,\n * BGE-m3 dense) support truncation. When set, also forwarded to the upstream\n * `dimensions` body field for providers that honour it.\n */\n dimensions?: number;\n /**\n * Endpoint base URL (without `/embeddings`). Defaults to OpenAI's. Set this\n * to point at any compatible provider.\n *\n * @default 'https://api.openai.com/v1'\n */\n baseUrl?: string;\n /** Stable id surfaced as `IEmbedder.id`. @default 'openai' */\n id?: string;\n /** Inject for tests. Defaults to `globalThis.fetch`. */\n fetch?: typeof fetch;\n /** Additional headers (e.g. provider-specific keys, tracing). */\n headers?: Record<string, string>;\n}\n\n/**\n * Known dimensions for popular models. Used as the default when the\n * caller doesn't pass `dimensions` explicitly.\n */\nconst KNOWN_DIMENSIONS: Record<string, number> = {\n // OpenAI\n 'text-embedding-3-small': 1536,\n 'text-embedding-3-large': 3072,\n 'text-embedding-ada-002': 1536,\n // 阿里通义\n 'text-embedding-v3': 1024,\n 'text-embedding-v2': 1536,\n 'text-embedding-v1': 1536,\n // 智谱\n 'embedding-3': 2048,\n 'embedding-2': 1024,\n // 硅基流动 / BGE 家族\n 'BAAI/bge-m3': 1024,\n 'BAAI/bge-large-zh-v1.5': 1024,\n 'BAAI/bge-large-en-v1.5': 1024,\n 'BAAI/bge-base-zh-v1.5': 768,\n 'BAAI/bge-small-zh-v1.5': 512,\n 'bge-m3': 1024,\n // 火山 Doubao\n 'doubao-embedding-large-text-240915': 4096,\n 'doubao-embedding-text-240715': 2048,\n // Nomic / Ollama defaults\n 'nomic-embed-text': 768,\n // MiniMax\n 'embo-01': 1536,\n};\n\n/**\n * `OpenAIEmbedder` — OpenAI-compatible embedder. One instance per\n * upstream provider + model combination. Pass into any knowledge\n * adapter that expects `IEmbedder`.\n *\n * @example\n * // OpenAI\n * new OpenAIEmbedder({ apiKey: process.env.OPENAI_API_KEY! });\n *\n * @example\n * // 阿里通义 DashScope\n * new OpenAIEmbedder({\n * apiKey: process.env.DASHSCOPE_API_KEY!,\n * baseUrl: 'https://dashscope.aliyuncs.com/compatible-mode/v1',\n * model: 'text-embedding-v3',\n * });\n *\n * @example\n * // 硅基流动 SiliconFlow + BGE-m3\n * new OpenAIEmbedder({\n * apiKey: process.env.SILICONFLOW_API_KEY!,\n * baseUrl: 'https://api.siliconflow.cn/v1',\n * model: 'BAAI/bge-m3',\n * });\n *\n * @example\n * // Local Ollama\n * new OpenAIEmbedder({\n * apiKey: 'ollama',\n * baseUrl: 'http://localhost:11434/v1',\n * model: 'bge-m3',\n * });\n */\nexport class OpenAIEmbedder implements IEmbedder {\n readonly id: string;\n readonly dimensions: number;\n private readonly model: string;\n private readonly baseUrl: string;\n private readonly apiKey: string;\n private readonly fetchImpl: typeof fetch;\n private readonly requestedDims?: number;\n private readonly extraHeaders: Record<string, string>;\n\n constructor(opts: OpenAIEmbedderOptions) {\n if (!opts.apiKey) throw new Error('OpenAIEmbedder: apiKey required');\n this.apiKey = opts.apiKey;\n this.id = opts.id ?? 'openai';\n this.model = opts.model ?? 'text-embedding-3-small';\n this.baseUrl = (opts.baseUrl ?? 'https://api.openai.com/v1').replace(/\\/+$/, '');\n this.fetchImpl = opts.fetch ?? (globalThis.fetch as typeof fetch);\n this.requestedDims = opts.dimensions;\n this.extraHeaders = opts.headers ?? {};\n this.dimensions =\n opts.dimensions ?? KNOWN_DIMENSIONS[this.model] ?? 1536;\n if (!this.fetchImpl) {\n throw new Error(\n 'OpenAIEmbedder: no fetch available; pass options.fetch or run on Node 18+ / a fetch-capable runtime',\n );\n }\n }\n\n async embed(texts: string[]): Promise<number[][]> {\n if (texts.length === 0) return [];\n const body: Record<string, unknown> = { model: this.model, input: texts };\n if (this.requestedDims) body.dimensions = this.requestedDims;\n const res = await this.fetchImpl(`${this.baseUrl}/embeddings`, {\n method: 'POST',\n headers: {\n 'content-type': 'application/json',\n authorization: `Bearer ${this.apiKey}`,\n ...this.extraHeaders,\n },\n body: JSON.stringify(body),\n });\n if (!res.ok) {\n const text = await res.text().catch(() => '');\n throw new Error(\n `OpenAIEmbedder (${this.baseUrl}) → ${res.status} ${res.statusText}${text ? `: ${text.slice(0, 200)}` : ''}`,\n );\n }\n const json = (await res.json()) as { data?: Array<{ embedding: number[] }> };\n const data = json.data ?? [];\n if (data.length !== texts.length) {\n throw new Error(\n `OpenAIEmbedder: expected ${texts.length} vectors, got ${data.length}`,\n );\n }\n return data.map((d) => d.embedding);\n }\n}\n\n/**\n * Convenience presets for popular Chinese providers — saves callers\n * from memorising base URLs. Pass through `createXxxEmbedder({...})`.\n */\nexport const OPENAI_COMPATIBLE_PRESETS = {\n openai: 'https://api.openai.com/v1',\n azure: '', // user must provide full deployment URL via baseUrl\n dashscope: 'https://dashscope.aliyuncs.com/compatible-mode/v1',\n zhipu: 'https://open.bigmodel.cn/api/paas/v4',\n siliconflow: 'https://api.siliconflow.cn/v1',\n doubao: 'https://ark.cn-beijing.volces.com/api/v3',\n minimax: 'https://api.minimax.chat/v1',\n ollama: 'http://localhost:11434/v1',\n} as const;\n\nexport type OpenAICompatiblePreset = keyof typeof OPENAI_COMPATIBLE_PRESETS;\n\nexport interface PresetEmbedderOptions\n extends Omit<OpenAIEmbedderOptions, 'baseUrl'> {\n /** Pick a known provider; sets `baseUrl` automatically. */\n preset?: OpenAICompatiblePreset;\n /** Explicit override; takes precedence over `preset`. */\n baseUrl?: string;\n}\n\n/**\n * Helper: pick a provider by preset name. Equivalent to constructing\n * `OpenAIEmbedder` with the matching `baseUrl`.\n *\n * @example\n * createOpenAIEmbedder({ preset: 'dashscope', apiKey, model: 'text-embedding-v3' })\n */\nexport function createOpenAIEmbedder(opts: PresetEmbedderOptions): OpenAIEmbedder {\n const baseUrl =\n opts.baseUrl ??\n (opts.preset ? OPENAI_COMPATIBLE_PRESETS[opts.preset] : undefined);\n return new OpenAIEmbedder({ ...opts, baseUrl, id: opts.id ?? opts.preset ?? 'openai' });\n}\n\nexport default OpenAIEmbedder;\n"],"mappings":";;;;;;;;;;;;;;;;;;;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AA+DA,IAAM,mBAA2C;AAAA;AAAA,EAE/C,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA;AAAA,EAE1B,qBAAqB;AAAA,EACrB,qBAAqB;AAAA,EACrB,qBAAqB;AAAA;AAAA,EAErB,eAAe;AAAA,EACf,eAAe;AAAA;AAAA,EAEf,eAAe;AAAA,EACf,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA,EAC1B,yBAAyB;AAAA,EACzB,0BAA0B;AAAA,EAC1B,UAAU;AAAA;AAAA,EAEV,sCAAsC;AAAA,EACtC,gCAAgC;AAAA;AAAA,EAEhC,oBAAoB;AAAA;AAAA,EAEpB,WAAW;AACb;AAmCO,IAAM,iBAAN,MAA0C;AAAA,EAU/C,YAAY,MAA6B;AACvC,QAAI,CAAC,KAAK,OAAQ,OAAM,IAAI,MAAM,iCAAiC;AACnE,SAAK,SAAS,KAAK;AACnB,SAAK,KAAK,KAAK,MAAM;AACrB,SAAK,QAAQ,KAAK,SAAS;AAC3B,SAAK,WAAW,KAAK,WAAW,6BAA6B,QAAQ,QAAQ,EAAE;AAC/E,SAAK,YAAY,KAAK,SAAU,WAAW;AAC3C,SAAK,gBAAgB,KAAK;AAC1B,SAAK,eAAe,KAAK,WAAW,CAAC;AACrC,SAAK,aACH,KAAK,cAAc,iBAAiB,KAAK,KAAK,KAAK;AACrD,QAAI,CAAC,KAAK,WAAW;AACnB,YAAM,IAAI;AAAA,QACR;AAAA,MACF;AAAA,IACF;AAAA,EACF;AAAA,EAEA,MAAM,MAAM,OAAsC;AAChD,QAAI,MAAM,WAAW,EAAG,QAAO,CAAC;AAChC,UAAM,OAAgC,EAAE,OAAO,KAAK,OAAO,OAAO,MAAM;AACxE,QAAI,KAAK,cAAe,MAAK,aAAa,KAAK;AAC/C,UAAM,MAAM,MAAM,KAAK,UAAU,GAAG,KAAK,OAAO,eAAe;AAAA,MAC7D,QAAQ;AAAA,MACR,SAAS;AAAA,QACP,gBAAgB;AAAA,QAChB,eAAe,UAAU,KAAK,MAAM;AAAA,QACpC,GAAG,KAAK;AAAA,MACV;AAAA,MACA,MAAM,KAAK,UAAU,IAAI;AAAA,IAC3B,CAAC;AACD,QAAI,CAAC,IAAI,IAAI;AACX,YAAM,OAAO,MAAM,IAAI,KAAK,EAAE,MAAM,MAAM,EAAE;AAC5C,YAAM,IAAI;AAAA,QACR,mBAAmB,KAAK,OAAO,YAAO,IAAI,MAAM,IAAI,IAAI,UAAU,GAAG,OAAO,KAAK,KAAK,MAAM,GAAG,GAAG,CAAC,KAAK,EAAE;AAAA,MAC5G;AAAA,IACF;AACA,UAAM,OAAQ,MAAM,IAAI,KAAK;AAC7B,UAAM,OAAO,KAAK,QAAQ,CAAC;AAC3B,QAAI,KAAK,WAAW,MAAM,QAAQ;AAChC,YAAM,IAAI;AAAA,QACR,4BAA4B,MAAM,MAAM,iBAAiB,KAAK,MAAM;AAAA,MACtE;AAAA,IACF;AACA,WAAO,KAAK,IAAI,CAAC,MAAM,EAAE,SAAS;AAAA,EACpC;AACF;AAMO,IAAM,4BAA4B;AAAA,EACvC,QAAQ;AAAA,EACR,OAAO;AAAA;AAAA,EACP,WAAW;AAAA,EACX,OAAO;AAAA,EACP,aAAa;AAAA,EACb,QAAQ;AAAA,EACR,SAAS;AAAA,EACT,QAAQ;AACV;AAmBO,SAAS,qBAAqB,MAA6C;AAChF,QAAM,UACJ,KAAK,YACJ,KAAK,SAAS,0BAA0B,KAAK,MAAM,IAAI;AAC1D,SAAO,IAAI,eAAe,EAAE,GAAG,MAAM,SAAS,IAAI,KAAK,MAAM,KAAK,UAAU,SAAS,CAAC;AACxF;AAEA,IAAO,gBAAQ;","names":[]}
|
package/dist/index.mjs
ADDED
|
@@ -0,0 +1,97 @@
|
|
|
1
|
+
// src/index.ts
|
|
2
|
+
var KNOWN_DIMENSIONS = {
|
|
3
|
+
// OpenAI
|
|
4
|
+
"text-embedding-3-small": 1536,
|
|
5
|
+
"text-embedding-3-large": 3072,
|
|
6
|
+
"text-embedding-ada-002": 1536,
|
|
7
|
+
// 阿里通义
|
|
8
|
+
"text-embedding-v3": 1024,
|
|
9
|
+
"text-embedding-v2": 1536,
|
|
10
|
+
"text-embedding-v1": 1536,
|
|
11
|
+
// 智谱
|
|
12
|
+
"embedding-3": 2048,
|
|
13
|
+
"embedding-2": 1024,
|
|
14
|
+
// 硅基流动 / BGE 家族
|
|
15
|
+
"BAAI/bge-m3": 1024,
|
|
16
|
+
"BAAI/bge-large-zh-v1.5": 1024,
|
|
17
|
+
"BAAI/bge-large-en-v1.5": 1024,
|
|
18
|
+
"BAAI/bge-base-zh-v1.5": 768,
|
|
19
|
+
"BAAI/bge-small-zh-v1.5": 512,
|
|
20
|
+
"bge-m3": 1024,
|
|
21
|
+
// 火山 Doubao
|
|
22
|
+
"doubao-embedding-large-text-240915": 4096,
|
|
23
|
+
"doubao-embedding-text-240715": 2048,
|
|
24
|
+
// Nomic / Ollama defaults
|
|
25
|
+
"nomic-embed-text": 768,
|
|
26
|
+
// MiniMax
|
|
27
|
+
"embo-01": 1536
|
|
28
|
+
};
|
|
29
|
+
var OpenAIEmbedder = class {
|
|
30
|
+
constructor(opts) {
|
|
31
|
+
if (!opts.apiKey) throw new Error("OpenAIEmbedder: apiKey required");
|
|
32
|
+
this.apiKey = opts.apiKey;
|
|
33
|
+
this.id = opts.id ?? "openai";
|
|
34
|
+
this.model = opts.model ?? "text-embedding-3-small";
|
|
35
|
+
this.baseUrl = (opts.baseUrl ?? "https://api.openai.com/v1").replace(/\/+$/, "");
|
|
36
|
+
this.fetchImpl = opts.fetch ?? globalThis.fetch;
|
|
37
|
+
this.requestedDims = opts.dimensions;
|
|
38
|
+
this.extraHeaders = opts.headers ?? {};
|
|
39
|
+
this.dimensions = opts.dimensions ?? KNOWN_DIMENSIONS[this.model] ?? 1536;
|
|
40
|
+
if (!this.fetchImpl) {
|
|
41
|
+
throw new Error(
|
|
42
|
+
"OpenAIEmbedder: no fetch available; pass options.fetch or run on Node 18+ / a fetch-capable runtime"
|
|
43
|
+
);
|
|
44
|
+
}
|
|
45
|
+
}
|
|
46
|
+
async embed(texts) {
|
|
47
|
+
if (texts.length === 0) return [];
|
|
48
|
+
const body = { model: this.model, input: texts };
|
|
49
|
+
if (this.requestedDims) body.dimensions = this.requestedDims;
|
|
50
|
+
const res = await this.fetchImpl(`${this.baseUrl}/embeddings`, {
|
|
51
|
+
method: "POST",
|
|
52
|
+
headers: {
|
|
53
|
+
"content-type": "application/json",
|
|
54
|
+
authorization: `Bearer ${this.apiKey}`,
|
|
55
|
+
...this.extraHeaders
|
|
56
|
+
},
|
|
57
|
+
body: JSON.stringify(body)
|
|
58
|
+
});
|
|
59
|
+
if (!res.ok) {
|
|
60
|
+
const text = await res.text().catch(() => "");
|
|
61
|
+
throw new Error(
|
|
62
|
+
`OpenAIEmbedder (${this.baseUrl}) \u2192 ${res.status} ${res.statusText}${text ? `: ${text.slice(0, 200)}` : ""}`
|
|
63
|
+
);
|
|
64
|
+
}
|
|
65
|
+
const json = await res.json();
|
|
66
|
+
const data = json.data ?? [];
|
|
67
|
+
if (data.length !== texts.length) {
|
|
68
|
+
throw new Error(
|
|
69
|
+
`OpenAIEmbedder: expected ${texts.length} vectors, got ${data.length}`
|
|
70
|
+
);
|
|
71
|
+
}
|
|
72
|
+
return data.map((d) => d.embedding);
|
|
73
|
+
}
|
|
74
|
+
};
|
|
75
|
+
var OPENAI_COMPATIBLE_PRESETS = {
|
|
76
|
+
openai: "https://api.openai.com/v1",
|
|
77
|
+
azure: "",
|
|
78
|
+
// user must provide full deployment URL via baseUrl
|
|
79
|
+
dashscope: "https://dashscope.aliyuncs.com/compatible-mode/v1",
|
|
80
|
+
zhipu: "https://open.bigmodel.cn/api/paas/v4",
|
|
81
|
+
siliconflow: "https://api.siliconflow.cn/v1",
|
|
82
|
+
doubao: "https://ark.cn-beijing.volces.com/api/v3",
|
|
83
|
+
minimax: "https://api.minimax.chat/v1",
|
|
84
|
+
ollama: "http://localhost:11434/v1"
|
|
85
|
+
};
|
|
86
|
+
function createOpenAIEmbedder(opts) {
|
|
87
|
+
const baseUrl = opts.baseUrl ?? (opts.preset ? OPENAI_COMPATIBLE_PRESETS[opts.preset] : void 0);
|
|
88
|
+
return new OpenAIEmbedder({ ...opts, baseUrl, id: opts.id ?? opts.preset ?? "openai" });
|
|
89
|
+
}
|
|
90
|
+
var index_default = OpenAIEmbedder;
|
|
91
|
+
export {
|
|
92
|
+
OPENAI_COMPATIBLE_PRESETS,
|
|
93
|
+
OpenAIEmbedder,
|
|
94
|
+
createOpenAIEmbedder,
|
|
95
|
+
index_default as default
|
|
96
|
+
};
|
|
97
|
+
//# sourceMappingURL=index.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../src/index.ts"],"sourcesContent":["// Copyright (c) 2026 ObjectStack. Licensed under the Apache-2.0 license.\n\n/**\n * `@objectstack/embedder-openai`\n *\n * OpenAI-compatible embedder. Drop-in for any endpoint that speaks the\n * `POST /v1/embeddings` shape:\n *\n * - OpenAI https://api.openai.com/v1\n * - Azure OpenAI https://{resource}.openai.azure.com/openai/deployments/{deployment}\n * - 阿里通义 DashScope https://dashscope.aliyuncs.com/compatible-mode/v1\n * - 智谱 BigModel https://open.bigmodel.cn/api/paas/v4\n * - 硅基流动 SiliconFlow https://api.siliconflow.cn/v1\n * - 火山引擎 Doubao https://ark.cn-beijing.volces.com/api/v3\n * - MiniMax https://api.minimax.chat/v1\n * - Ollama (openai shim) http://localhost:11434/v1\n * - LiteLLM / vLLM / 任何兼容服务\n *\n * Implements the `IEmbedder` contract from `@objectstack/spec/contracts`.\n */\n\nimport type { IEmbedder } from '@objectstack/spec/contracts';\n\nexport interface OpenAIEmbedderOptions {\n /** Bearer token sent as `Authorization: Bearer <apiKey>`. Required. */\n apiKey: string;\n /**\n * Model id sent in the request body. Choose to match your provider:\n * - OpenAI: `'text-embedding-3-small'` (default), `'text-embedding-3-large'`\n * - 阿里通义: `'text-embedding-v3'`\n * - 智谱: `'embedding-3'`\n * - 硅基流动: `'BAAI/bge-m3'`, `'BAAI/bge-large-zh-v1.5'`\n * - 火山 Doubao: `'doubao-embedding-large-text-240915'`\n * - Ollama: `'bge-m3'`, `'nomic-embed-text'`\n *\n * @default 'text-embedding-3-small'\n */\n model?: string;\n /**\n * Override dimensions. Only Matryoshka-style models (OpenAI v3, 智谱 embedding-3,\n * BGE-m3 dense) support truncation. When set, also forwarded to the upstream\n * `dimensions` body field for providers that honour it.\n */\n dimensions?: number;\n /**\n * Endpoint base URL (without `/embeddings`). Defaults to OpenAI's. Set this\n * to point at any compatible provider.\n *\n * @default 'https://api.openai.com/v1'\n */\n baseUrl?: string;\n /** Stable id surfaced as `IEmbedder.id`. @default 'openai' */\n id?: string;\n /** Inject for tests. Defaults to `globalThis.fetch`. */\n fetch?: typeof fetch;\n /** Additional headers (e.g. provider-specific keys, tracing). */\n headers?: Record<string, string>;\n}\n\n/**\n * Known dimensions for popular models. Used as the default when the\n * caller doesn't pass `dimensions` explicitly.\n */\nconst KNOWN_DIMENSIONS: Record<string, number> = {\n // OpenAI\n 'text-embedding-3-small': 1536,\n 'text-embedding-3-large': 3072,\n 'text-embedding-ada-002': 1536,\n // 阿里通义\n 'text-embedding-v3': 1024,\n 'text-embedding-v2': 1536,\n 'text-embedding-v1': 1536,\n // 智谱\n 'embedding-3': 2048,\n 'embedding-2': 1024,\n // 硅基流动 / BGE 家族\n 'BAAI/bge-m3': 1024,\n 'BAAI/bge-large-zh-v1.5': 1024,\n 'BAAI/bge-large-en-v1.5': 1024,\n 'BAAI/bge-base-zh-v1.5': 768,\n 'BAAI/bge-small-zh-v1.5': 512,\n 'bge-m3': 1024,\n // 火山 Doubao\n 'doubao-embedding-large-text-240915': 4096,\n 'doubao-embedding-text-240715': 2048,\n // Nomic / Ollama defaults\n 'nomic-embed-text': 768,\n // MiniMax\n 'embo-01': 1536,\n};\n\n/**\n * `OpenAIEmbedder` — OpenAI-compatible embedder. One instance per\n * upstream provider + model combination. Pass into any knowledge\n * adapter that expects `IEmbedder`.\n *\n * @example\n * // OpenAI\n * new OpenAIEmbedder({ apiKey: process.env.OPENAI_API_KEY! });\n *\n * @example\n * // 阿里通义 DashScope\n * new OpenAIEmbedder({\n * apiKey: process.env.DASHSCOPE_API_KEY!,\n * baseUrl: 'https://dashscope.aliyuncs.com/compatible-mode/v1',\n * model: 'text-embedding-v3',\n * });\n *\n * @example\n * // 硅基流动 SiliconFlow + BGE-m3\n * new OpenAIEmbedder({\n * apiKey: process.env.SILICONFLOW_API_KEY!,\n * baseUrl: 'https://api.siliconflow.cn/v1',\n * model: 'BAAI/bge-m3',\n * });\n *\n * @example\n * // Local Ollama\n * new OpenAIEmbedder({\n * apiKey: 'ollama',\n * baseUrl: 'http://localhost:11434/v1',\n * model: 'bge-m3',\n * });\n */\nexport class OpenAIEmbedder implements IEmbedder {\n readonly id: string;\n readonly dimensions: number;\n private readonly model: string;\n private readonly baseUrl: string;\n private readonly apiKey: string;\n private readonly fetchImpl: typeof fetch;\n private readonly requestedDims?: number;\n private readonly extraHeaders: Record<string, string>;\n\n constructor(opts: OpenAIEmbedderOptions) {\n if (!opts.apiKey) throw new Error('OpenAIEmbedder: apiKey required');\n this.apiKey = opts.apiKey;\n this.id = opts.id ?? 'openai';\n this.model = opts.model ?? 'text-embedding-3-small';\n this.baseUrl = (opts.baseUrl ?? 'https://api.openai.com/v1').replace(/\\/+$/, '');\n this.fetchImpl = opts.fetch ?? (globalThis.fetch as typeof fetch);\n this.requestedDims = opts.dimensions;\n this.extraHeaders = opts.headers ?? {};\n this.dimensions =\n opts.dimensions ?? KNOWN_DIMENSIONS[this.model] ?? 1536;\n if (!this.fetchImpl) {\n throw new Error(\n 'OpenAIEmbedder: no fetch available; pass options.fetch or run on Node 18+ / a fetch-capable runtime',\n );\n }\n }\n\n async embed(texts: string[]): Promise<number[][]> {\n if (texts.length === 0) return [];\n const body: Record<string, unknown> = { model: this.model, input: texts };\n if (this.requestedDims) body.dimensions = this.requestedDims;\n const res = await this.fetchImpl(`${this.baseUrl}/embeddings`, {\n method: 'POST',\n headers: {\n 'content-type': 'application/json',\n authorization: `Bearer ${this.apiKey}`,\n ...this.extraHeaders,\n },\n body: JSON.stringify(body),\n });\n if (!res.ok) {\n const text = await res.text().catch(() => '');\n throw new Error(\n `OpenAIEmbedder (${this.baseUrl}) → ${res.status} ${res.statusText}${text ? `: ${text.slice(0, 200)}` : ''}`,\n );\n }\n const json = (await res.json()) as { data?: Array<{ embedding: number[] }> };\n const data = json.data ?? [];\n if (data.length !== texts.length) {\n throw new Error(\n `OpenAIEmbedder: expected ${texts.length} vectors, got ${data.length}`,\n );\n }\n return data.map((d) => d.embedding);\n }\n}\n\n/**\n * Convenience presets for popular Chinese providers — saves callers\n * from memorising base URLs. Pass through `createXxxEmbedder({...})`.\n */\nexport const OPENAI_COMPATIBLE_PRESETS = {\n openai: 'https://api.openai.com/v1',\n azure: '', // user must provide full deployment URL via baseUrl\n dashscope: 'https://dashscope.aliyuncs.com/compatible-mode/v1',\n zhipu: 'https://open.bigmodel.cn/api/paas/v4',\n siliconflow: 'https://api.siliconflow.cn/v1',\n doubao: 'https://ark.cn-beijing.volces.com/api/v3',\n minimax: 'https://api.minimax.chat/v1',\n ollama: 'http://localhost:11434/v1',\n} as const;\n\nexport type OpenAICompatiblePreset = keyof typeof OPENAI_COMPATIBLE_PRESETS;\n\nexport interface PresetEmbedderOptions\n extends Omit<OpenAIEmbedderOptions, 'baseUrl'> {\n /** Pick a known provider; sets `baseUrl` automatically. */\n preset?: OpenAICompatiblePreset;\n /** Explicit override; takes precedence over `preset`. */\n baseUrl?: string;\n}\n\n/**\n * Helper: pick a provider by preset name. Equivalent to constructing\n * `OpenAIEmbedder` with the matching `baseUrl`.\n *\n * @example\n * createOpenAIEmbedder({ preset: 'dashscope', apiKey, model: 'text-embedding-v3' })\n */\nexport function createOpenAIEmbedder(opts: PresetEmbedderOptions): OpenAIEmbedder {\n const baseUrl =\n opts.baseUrl ??\n (opts.preset ? OPENAI_COMPATIBLE_PRESETS[opts.preset] : undefined);\n return new OpenAIEmbedder({ ...opts, baseUrl, id: opts.id ?? opts.preset ?? 'openai' });\n}\n\nexport default OpenAIEmbedder;\n"],"mappings":";AA+DA,IAAM,mBAA2C;AAAA;AAAA,EAE/C,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA;AAAA,EAE1B,qBAAqB;AAAA,EACrB,qBAAqB;AAAA,EACrB,qBAAqB;AAAA;AAAA,EAErB,eAAe;AAAA,EACf,eAAe;AAAA;AAAA,EAEf,eAAe;AAAA,EACf,0BAA0B;AAAA,EAC1B,0BAA0B;AAAA,EAC1B,yBAAyB;AAAA,EACzB,0BAA0B;AAAA,EAC1B,UAAU;AAAA;AAAA,EAEV,sCAAsC;AAAA,EACtC,gCAAgC;AAAA;AAAA,EAEhC,oBAAoB;AAAA;AAAA,EAEpB,WAAW;AACb;AAmCO,IAAM,iBAAN,MAA0C;AAAA,EAU/C,YAAY,MAA6B;AACvC,QAAI,CAAC,KAAK,OAAQ,OAAM,IAAI,MAAM,iCAAiC;AACnE,SAAK,SAAS,KAAK;AACnB,SAAK,KAAK,KAAK,MAAM;AACrB,SAAK,QAAQ,KAAK,SAAS;AAC3B,SAAK,WAAW,KAAK,WAAW,6BAA6B,QAAQ,QAAQ,EAAE;AAC/E,SAAK,YAAY,KAAK,SAAU,WAAW;AAC3C,SAAK,gBAAgB,KAAK;AAC1B,SAAK,eAAe,KAAK,WAAW,CAAC;AACrC,SAAK,aACH,KAAK,cAAc,iBAAiB,KAAK,KAAK,KAAK;AACrD,QAAI,CAAC,KAAK,WAAW;AACnB,YAAM,IAAI;AAAA,QACR;AAAA,MACF;AAAA,IACF;AAAA,EACF;AAAA,EAEA,MAAM,MAAM,OAAsC;AAChD,QAAI,MAAM,WAAW,EAAG,QAAO,CAAC;AAChC,UAAM,OAAgC,EAAE,OAAO,KAAK,OAAO,OAAO,MAAM;AACxE,QAAI,KAAK,cAAe,MAAK,aAAa,KAAK;AAC/C,UAAM,MAAM,MAAM,KAAK,UAAU,GAAG,KAAK,OAAO,eAAe;AAAA,MAC7D,QAAQ;AAAA,MACR,SAAS;AAAA,QACP,gBAAgB;AAAA,QAChB,eAAe,UAAU,KAAK,MAAM;AAAA,QACpC,GAAG,KAAK;AAAA,MACV;AAAA,MACA,MAAM,KAAK,UAAU,IAAI;AAAA,IAC3B,CAAC;AACD,QAAI,CAAC,IAAI,IAAI;AACX,YAAM,OAAO,MAAM,IAAI,KAAK,EAAE,MAAM,MAAM,EAAE;AAC5C,YAAM,IAAI;AAAA,QACR,mBAAmB,KAAK,OAAO,YAAO,IAAI,MAAM,IAAI,IAAI,UAAU,GAAG,OAAO,KAAK,KAAK,MAAM,GAAG,GAAG,CAAC,KAAK,EAAE;AAAA,MAC5G;AAAA,IACF;AACA,UAAM,OAAQ,MAAM,IAAI,KAAK;AAC7B,UAAM,OAAO,KAAK,QAAQ,CAAC;AAC3B,QAAI,KAAK,WAAW,MAAM,QAAQ;AAChC,YAAM,IAAI;AAAA,QACR,4BAA4B,MAAM,MAAM,iBAAiB,KAAK,MAAM;AAAA,MACtE;AAAA,IACF;AACA,WAAO,KAAK,IAAI,CAAC,MAAM,EAAE,SAAS;AAAA,EACpC;AACF;AAMO,IAAM,4BAA4B;AAAA,EACvC,QAAQ;AAAA,EACR,OAAO;AAAA;AAAA,EACP,WAAW;AAAA,EACX,OAAO;AAAA,EACP,aAAa;AAAA,EACb,QAAQ;AAAA,EACR,SAAS;AAAA,EACT,QAAQ;AACV;AAmBO,SAAS,qBAAqB,MAA6C;AAChF,QAAM,UACJ,KAAK,YACJ,KAAK,SAAS,0BAA0B,KAAK,MAAM,IAAI;AAC1D,SAAO,IAAI,eAAe,EAAE,GAAG,MAAM,SAAS,IAAI,KAAK,MAAM,KAAK,UAAU,SAAS,CAAC;AACxF;AAEA,IAAO,gBAAQ;","names":[]}
|
package/package.json
ADDED
|
@@ -0,0 +1,40 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "@objectstack/embedder-openai",
|
|
3
|
+
"version": "6.7.0",
|
|
4
|
+
"license": "Apache-2.0",
|
|
5
|
+
"description": "OpenAI-compatible embedder for ObjectStack — works against OpenAI, 阿里通义 DashScope, 智谱 BigModel, 硅基流动 SiliconFlow, 火山引擎 Doubao, MiniMax, Ollama, and any drop-in OpenAI-shape endpoint.",
|
|
6
|
+
"main": "dist/index.js",
|
|
7
|
+
"types": "dist/index.d.ts",
|
|
8
|
+
"exports": {
|
|
9
|
+
".": {
|
|
10
|
+
"types": "./dist/index.d.ts",
|
|
11
|
+
"import": "./dist/index.mjs",
|
|
12
|
+
"require": "./dist/index.js"
|
|
13
|
+
}
|
|
14
|
+
},
|
|
15
|
+
"dependencies": {
|
|
16
|
+
"@objectstack/spec": "6.7.0"
|
|
17
|
+
},
|
|
18
|
+
"devDependencies": {
|
|
19
|
+
"@types/node": "^25.9.1",
|
|
20
|
+
"typescript": "^6.0.3",
|
|
21
|
+
"vitest": "^4.1.7"
|
|
22
|
+
},
|
|
23
|
+
"keywords": [
|
|
24
|
+
"objectstack",
|
|
25
|
+
"embedder",
|
|
26
|
+
"embedding",
|
|
27
|
+
"openai",
|
|
28
|
+
"rag",
|
|
29
|
+
"vector",
|
|
30
|
+
"dashscope",
|
|
31
|
+
"zhipu",
|
|
32
|
+
"siliconflow",
|
|
33
|
+
"ollama"
|
|
34
|
+
],
|
|
35
|
+
"scripts": {
|
|
36
|
+
"build": "tsup --config ../../../tsup.config.ts",
|
|
37
|
+
"dev": "tsc -w",
|
|
38
|
+
"test": "vitest run"
|
|
39
|
+
}
|
|
40
|
+
}
|
|
@@ -0,0 +1,166 @@
|
|
|
1
|
+
// Copyright (c) 2026 ObjectStack. Licensed under the Apache-2.0 license.
|
|
2
|
+
|
|
3
|
+
import { describe, it, expect, vi } from 'vitest';
|
|
4
|
+
import {
|
|
5
|
+
OpenAIEmbedder,
|
|
6
|
+
createOpenAIEmbedder,
|
|
7
|
+
OPENAI_COMPATIBLE_PRESETS,
|
|
8
|
+
} from '../index';
|
|
9
|
+
|
|
10
|
+
function mockFetch(body: unknown, status = 200): typeof fetch {
|
|
11
|
+
return vi.fn(async () =>
|
|
12
|
+
new Response(JSON.stringify(body), {
|
|
13
|
+
status,
|
|
14
|
+
headers: { 'content-type': 'application/json' },
|
|
15
|
+
}),
|
|
16
|
+
) as unknown as typeof fetch;
|
|
17
|
+
}
|
|
18
|
+
|
|
19
|
+
describe('OpenAIEmbedder', () => {
|
|
20
|
+
it('requires apiKey', () => {
|
|
21
|
+
expect(() => new OpenAIEmbedder({ apiKey: '' })).toThrow(/apiKey required/);
|
|
22
|
+
});
|
|
23
|
+
|
|
24
|
+
it('exposes id and known dimensions for default model', () => {
|
|
25
|
+
const e = new OpenAIEmbedder({ apiKey: 'k', fetch: mockFetch({ data: [] }) });
|
|
26
|
+
expect(e.id).toBe('openai');
|
|
27
|
+
expect(e.dimensions).toBe(1536);
|
|
28
|
+
});
|
|
29
|
+
|
|
30
|
+
it('looks up dimensions for known Chinese models', () => {
|
|
31
|
+
const e = new OpenAIEmbedder({
|
|
32
|
+
apiKey: 'k',
|
|
33
|
+
model: 'text-embedding-v3',
|
|
34
|
+
fetch: mockFetch({ data: [] }),
|
|
35
|
+
});
|
|
36
|
+
expect(e.dimensions).toBe(1024);
|
|
37
|
+
});
|
|
38
|
+
|
|
39
|
+
it('honours explicit dimensions override', () => {
|
|
40
|
+
const e = new OpenAIEmbedder({
|
|
41
|
+
apiKey: 'k',
|
|
42
|
+
dimensions: 256,
|
|
43
|
+
fetch: mockFetch({ data: [] }),
|
|
44
|
+
});
|
|
45
|
+
expect(e.dimensions).toBe(256);
|
|
46
|
+
});
|
|
47
|
+
|
|
48
|
+
it('returns [] for empty input without calling fetch', async () => {
|
|
49
|
+
const fetchImpl = vi.fn() as unknown as typeof fetch;
|
|
50
|
+
const e = new OpenAIEmbedder({ apiKey: 'k', fetch: fetchImpl });
|
|
51
|
+
const out = await e.embed([]);
|
|
52
|
+
expect(out).toEqual([]);
|
|
53
|
+
expect(fetchImpl).not.toHaveBeenCalled();
|
|
54
|
+
});
|
|
55
|
+
|
|
56
|
+
it('POSTs to the configured baseUrl with bearer auth', async () => {
|
|
57
|
+
const fetchImpl = vi.fn(async () =>
|
|
58
|
+
new Response(JSON.stringify({ data: [{ embedding: [0.1, 0.2] }] }), {
|
|
59
|
+
status: 200,
|
|
60
|
+
headers: { 'content-type': 'application/json' },
|
|
61
|
+
}),
|
|
62
|
+
) as unknown as typeof fetch;
|
|
63
|
+
|
|
64
|
+
const e = new OpenAIEmbedder({
|
|
65
|
+
apiKey: 'sk-test',
|
|
66
|
+
baseUrl: 'https://api.siliconflow.cn/v1',
|
|
67
|
+
model: 'BAAI/bge-m3',
|
|
68
|
+
fetch: fetchImpl,
|
|
69
|
+
});
|
|
70
|
+
const out = await e.embed(['hello']);
|
|
71
|
+
|
|
72
|
+
expect(out).toEqual([[0.1, 0.2]]);
|
|
73
|
+
const call = (fetchImpl as unknown as ReturnType<typeof vi.fn>).mock.calls[0];
|
|
74
|
+
expect(call[0]).toBe('https://api.siliconflow.cn/v1/embeddings');
|
|
75
|
+
const init = call[1] as RequestInit;
|
|
76
|
+
expect(init.method).toBe('POST');
|
|
77
|
+
expect((init.headers as Record<string, string>).authorization).toBe('Bearer sk-test');
|
|
78
|
+
expect(JSON.parse(init.body as string)).toEqual({ model: 'BAAI/bge-m3', input: ['hello'] });
|
|
79
|
+
});
|
|
80
|
+
|
|
81
|
+
it('forwards dimensions in the request body when overridden', async () => {
|
|
82
|
+
const fetchImpl = mockFetch({ data: [{ embedding: [1, 2] }] });
|
|
83
|
+
const e = new OpenAIEmbedder({
|
|
84
|
+
apiKey: 'k',
|
|
85
|
+
dimensions: 512,
|
|
86
|
+
fetch: fetchImpl,
|
|
87
|
+
});
|
|
88
|
+
await e.embed(['x']);
|
|
89
|
+
const body = JSON.parse(
|
|
90
|
+
(fetchImpl as unknown as ReturnType<typeof vi.fn>).mock.calls[0][1].body as string,
|
|
91
|
+
);
|
|
92
|
+
expect(body.dimensions).toBe(512);
|
|
93
|
+
});
|
|
94
|
+
|
|
95
|
+
it('throws a useful error on non-2xx', async () => {
|
|
96
|
+
const fetchImpl = mockFetch({ error: 'bad key' }, 401);
|
|
97
|
+
const e = new OpenAIEmbedder({ apiKey: 'k', fetch: fetchImpl });
|
|
98
|
+
await expect(e.embed(['x'])).rejects.toThrow(/401/);
|
|
99
|
+
});
|
|
100
|
+
|
|
101
|
+
it('throws when response vector count mismatches input', async () => {
|
|
102
|
+
const fetchImpl = mockFetch({ data: [{ embedding: [1] }] });
|
|
103
|
+
const e = new OpenAIEmbedder({ apiKey: 'k', fetch: fetchImpl });
|
|
104
|
+
await expect(e.embed(['a', 'b'])).rejects.toThrow(/expected 2 vectors/);
|
|
105
|
+
});
|
|
106
|
+
|
|
107
|
+
it('strips trailing slashes from baseUrl', async () => {
|
|
108
|
+
const fetchImpl = mockFetch({ data: [{ embedding: [1] }] });
|
|
109
|
+
const e = new OpenAIEmbedder({
|
|
110
|
+
apiKey: 'k',
|
|
111
|
+
baseUrl: 'https://x.example/v1///',
|
|
112
|
+
fetch: fetchImpl,
|
|
113
|
+
});
|
|
114
|
+
await e.embed(['x']);
|
|
115
|
+
expect(
|
|
116
|
+
(fetchImpl as unknown as ReturnType<typeof vi.fn>).mock.calls[0][0],
|
|
117
|
+
).toBe('https://x.example/v1/embeddings');
|
|
118
|
+
});
|
|
119
|
+
|
|
120
|
+
it('merges extra headers', async () => {
|
|
121
|
+
const fetchImpl = mockFetch({ data: [{ embedding: [1] }] });
|
|
122
|
+
const e = new OpenAIEmbedder({
|
|
123
|
+
apiKey: 'k',
|
|
124
|
+
fetch: fetchImpl,
|
|
125
|
+
headers: { 'x-trace-id': 't1' },
|
|
126
|
+
});
|
|
127
|
+
await e.embed(['x']);
|
|
128
|
+
const headers = (fetchImpl as unknown as ReturnType<typeof vi.fn>).mock
|
|
129
|
+
.calls[0][1].headers as Record<string, string>;
|
|
130
|
+
expect(headers['x-trace-id']).toBe('t1');
|
|
131
|
+
expect(headers.authorization).toBe('Bearer k');
|
|
132
|
+
});
|
|
133
|
+
});
|
|
134
|
+
|
|
135
|
+
describe('createOpenAIEmbedder presets', () => {
|
|
136
|
+
it('maps preset names to baseUrl', () => {
|
|
137
|
+
const e = createOpenAIEmbedder({
|
|
138
|
+
preset: 'dashscope',
|
|
139
|
+
apiKey: 'k',
|
|
140
|
+
model: 'text-embedding-v3',
|
|
141
|
+
fetch: mockFetch({ data: [] }),
|
|
142
|
+
});
|
|
143
|
+
expect(e.id).toBe('dashscope');
|
|
144
|
+
expect(e.dimensions).toBe(1024);
|
|
145
|
+
});
|
|
146
|
+
|
|
147
|
+
it('exposes well-known preset URLs', () => {
|
|
148
|
+
expect(OPENAI_COMPATIBLE_PRESETS.siliconflow).toContain('siliconflow.cn');
|
|
149
|
+
expect(OPENAI_COMPATIBLE_PRESETS.zhipu).toContain('bigmodel.cn');
|
|
150
|
+
expect(OPENAI_COMPATIBLE_PRESETS.ollama).toContain('localhost:11434');
|
|
151
|
+
});
|
|
152
|
+
|
|
153
|
+
it('explicit baseUrl wins over preset', async () => {
|
|
154
|
+
const fetchImpl = mockFetch({ data: [{ embedding: [1] }] });
|
|
155
|
+
const e = createOpenAIEmbedder({
|
|
156
|
+
preset: 'openai',
|
|
157
|
+
baseUrl: 'https://my-proxy.example/v1',
|
|
158
|
+
apiKey: 'k',
|
|
159
|
+
fetch: fetchImpl,
|
|
160
|
+
});
|
|
161
|
+
await e.embed(['x']);
|
|
162
|
+
expect(
|
|
163
|
+
(fetchImpl as unknown as ReturnType<typeof vi.fn>).mock.calls[0][0],
|
|
164
|
+
).toBe('https://my-proxy.example/v1/embeddings');
|
|
165
|
+
});
|
|
166
|
+
});
|