@cmdoss/memwal-sdk 0.6.2 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (247)
  1. package/ARCHITECTURE.md +547 -547
  2. package/BENCHMARKS.md +238 -238
  3. package/README.md +310 -181
  4. package/dist/ai-sdk/tools.d.ts +2 -2
  5. package/dist/ai-sdk/tools.js +2 -2
  6. package/dist/client/ClientMemoryManager.js +2 -2
  7. package/dist/client/ClientMemoryManager.js.map +1 -1
  8. package/dist/client/PersonalDataWallet.d.ts.map +1 -1
  9. package/dist/client/SimplePDWClient.d.ts +29 -1
  10. package/dist/client/SimplePDWClient.d.ts.map +1 -1
  11. package/dist/client/SimplePDWClient.js +45 -13
  12. package/dist/client/SimplePDWClient.js.map +1 -1
  13. package/dist/client/namespaces/EmbeddingsNamespace.d.ts +1 -1
  14. package/dist/client/namespaces/EmbeddingsNamespace.js +1 -1
  15. package/dist/client/namespaces/MemoryNamespace.d.ts +31 -0
  16. package/dist/client/namespaces/MemoryNamespace.d.ts.map +1 -1
  17. package/dist/client/namespaces/MemoryNamespace.js +272 -39
  18. package/dist/client/namespaces/MemoryNamespace.js.map +1 -1
  19. package/dist/client/namespaces/consolidated/AINamespace.d.ts +2 -2
  20. package/dist/client/namespaces/consolidated/AINamespace.js +2 -2
  21. package/dist/client/namespaces/consolidated/BlockchainNamespace.d.ts +12 -2
  22. package/dist/client/namespaces/consolidated/BlockchainNamespace.d.ts.map +1 -1
  23. package/dist/client/namespaces/consolidated/BlockchainNamespace.js +62 -4
  24. package/dist/client/namespaces/consolidated/BlockchainNamespace.js.map +1 -1
  25. package/dist/client/namespaces/consolidated/StorageNamespace.d.ts +67 -2
  26. package/dist/client/namespaces/consolidated/StorageNamespace.d.ts.map +1 -1
  27. package/dist/client/namespaces/consolidated/StorageNamespace.js +549 -16
  28. package/dist/client/namespaces/consolidated/StorageNamespace.js.map +1 -1
  29. package/dist/config/ConfigurationHelper.js +61 -61
  30. package/dist/config/defaults.js +2 -2
  31. package/dist/config/defaults.js.map +1 -1
  32. package/dist/graph/GraphService.js +21 -21
  33. package/dist/graph/GraphService.js.map +1 -1
  34. package/dist/index.d.ts +3 -1
  35. package/dist/index.d.ts.map +1 -1
  36. package/dist/index.js +3 -1
  37. package/dist/index.js.map +1 -1
  38. package/dist/infrastructure/seal/EncryptionService.d.ts +9 -5
  39. package/dist/infrastructure/seal/EncryptionService.d.ts.map +1 -1
  40. package/dist/infrastructure/seal/EncryptionService.js +37 -15
  41. package/dist/infrastructure/seal/EncryptionService.js.map +1 -1
  42. package/dist/infrastructure/seal/SealService.d.ts +13 -5
  43. package/dist/infrastructure/seal/SealService.d.ts.map +1 -1
  44. package/dist/infrastructure/seal/SealService.js +36 -34
  45. package/dist/infrastructure/seal/SealService.js.map +1 -1
  46. package/dist/langchain/createPDWRAG.js +30 -30
  47. package/dist/retrieval/MemoryDecryptionPipeline.d.ts.map +1 -1
  48. package/dist/retrieval/MemoryDecryptionPipeline.js +2 -1
  49. package/dist/retrieval/MemoryDecryptionPipeline.js.map +1 -1
  50. package/dist/retrieval/MemoryRetrievalService.d.ts +31 -0
  51. package/dist/retrieval/MemoryRetrievalService.d.ts.map +1 -1
  52. package/dist/retrieval/MemoryRetrievalService.js +44 -4
  53. package/dist/retrieval/MemoryRetrievalService.js.map +1 -1
  54. package/dist/services/CapabilityService.d.ts.map +1 -1
  55. package/dist/services/CapabilityService.js +30 -14
  56. package/dist/services/CapabilityService.js.map +1 -1
  57. package/dist/services/CrossContextPermissionService.d.ts.map +1 -1
  58. package/dist/services/CrossContextPermissionService.js +9 -7
  59. package/dist/services/CrossContextPermissionService.js.map +1 -1
  60. package/dist/services/EmbeddingService.d.ts +28 -1
  61. package/dist/services/EmbeddingService.d.ts.map +1 -1
  62. package/dist/services/EmbeddingService.js +54 -0
  63. package/dist/services/EmbeddingService.js.map +1 -1
  64. package/dist/services/EncryptionService.d.ts.map +1 -1
  65. package/dist/services/EncryptionService.js +6 -5
  66. package/dist/services/EncryptionService.js.map +1 -1
  67. package/dist/services/GeminiAIService.js +309 -309
  68. package/dist/services/IndexManager.d.ts +5 -1
  69. package/dist/services/IndexManager.d.ts.map +1 -1
  70. package/dist/services/IndexManager.js +17 -40
  71. package/dist/services/IndexManager.js.map +1 -1
  72. package/dist/services/QueryService.js +1 -1
  73. package/dist/services/QueryService.js.map +1 -1
  74. package/dist/services/StorageService.d.ts +11 -0
  75. package/dist/services/StorageService.d.ts.map +1 -1
  76. package/dist/services/StorageService.js +73 -10
  77. package/dist/services/StorageService.js.map +1 -1
  78. package/dist/services/TransactionService.d.ts +20 -0
  79. package/dist/services/TransactionService.d.ts.map +1 -1
  80. package/dist/services/TransactionService.js +43 -0
  81. package/dist/services/TransactionService.js.map +1 -1
  82. package/dist/services/ViewService.js +2 -2
  83. package/dist/services/ViewService.js.map +1 -1
  84. package/dist/services/storage/QuiltBatchManager.d.ts +101 -1
  85. package/dist/services/storage/QuiltBatchManager.d.ts.map +1 -1
  86. package/dist/services/storage/QuiltBatchManager.js +410 -20
  87. package/dist/services/storage/QuiltBatchManager.js.map +1 -1
  88. package/dist/services/storage/index.d.ts +1 -1
  89. package/dist/services/storage/index.d.ts.map +1 -1
  90. package/dist/services/storage/index.js.map +1 -1
  91. package/dist/utils/LRUCache.d.ts +106 -0
  92. package/dist/utils/LRUCache.d.ts.map +1 -0
  93. package/dist/utils/LRUCache.js +281 -0
  94. package/dist/utils/LRUCache.js.map +1 -0
  95. package/dist/utils/index.d.ts +1 -0
  96. package/dist/utils/index.d.ts.map +1 -1
  97. package/dist/utils/index.js +2 -0
  98. package/dist/utils/index.js.map +1 -1
  99. package/dist/utils/memoryIndexOnChain.d.ts +212 -0
  100. package/dist/utils/memoryIndexOnChain.d.ts.map +1 -0
  101. package/dist/utils/memoryIndexOnChain.js +312 -0
  102. package/dist/utils/memoryIndexOnChain.js.map +1 -0
  103. package/dist/utils/rebuildIndexNode.d.ts +29 -0
  104. package/dist/utils/rebuildIndexNode.d.ts.map +1 -1
  105. package/dist/utils/rebuildIndexNode.js +366 -98
  106. package/dist/utils/rebuildIndexNode.js.map +1 -1
  107. package/dist/vector/HnswWasmService.d.ts +20 -5
  108. package/dist/vector/HnswWasmService.d.ts.map +1 -1
  109. package/dist/vector/HnswWasmService.js +73 -40
  110. package/dist/vector/HnswWasmService.js.map +1 -1
  111. package/dist/vector/IHnswService.d.ts +10 -1
  112. package/dist/vector/IHnswService.d.ts.map +1 -1
  113. package/dist/vector/IHnswService.js.map +1 -1
  114. package/dist/vector/NodeHnswService.d.ts +16 -0
  115. package/dist/vector/NodeHnswService.d.ts.map +1 -1
  116. package/dist/vector/NodeHnswService.js +84 -5
  117. package/dist/vector/NodeHnswService.js.map +1 -1
  118. package/dist/vector/createHnswService.d.ts +1 -1
  119. package/dist/vector/createHnswService.js +1 -1
  120. package/dist/vector/index.d.ts +1 -1
  121. package/dist/vector/index.js +1 -1
  122. package/package.json +157 -157
  123. package/src/access/PermissionService.ts +635 -635
  124. package/src/aggregation/AggregationService.ts +389 -389
  125. package/src/ai-sdk/PDWVectorStore.ts +715 -715
  126. package/src/ai-sdk/index.ts +65 -65
  127. package/src/ai-sdk/tools.ts +460 -460
  128. package/src/ai-sdk/types.ts +404 -404
  129. package/src/batch/BatchManager.ts +597 -597
  130. package/src/batch/BatchingService.ts +429 -429
  131. package/src/batch/MemoryProcessingCache.ts +492 -492
  132. package/src/batch/index.ts +30 -30
  133. package/src/browser.ts +200 -200
  134. package/src/client/ClientMemoryManager.ts +987 -987
  135. package/src/client/PersonalDataWallet.ts +345 -345
  136. package/src/client/SimplePDWClient.ts +1289 -1222
  137. package/src/client/factory.ts +154 -154
  138. package/src/client/namespaces/AnalyticsNamespace.ts +377 -377
  139. package/src/client/namespaces/BatchNamespace.ts +356 -356
  140. package/src/client/namespaces/CacheNamespace.ts +123 -123
  141. package/src/client/namespaces/CapabilityNamespace.ts +217 -217
  142. package/src/client/namespaces/ClassifyNamespace.ts +169 -169
  143. package/src/client/namespaces/ContextNamespace.ts +297 -297
  144. package/src/client/namespaces/EmbeddingsNamespace.ts +99 -99
  145. package/src/client/namespaces/EncryptionNamespace.ts +221 -221
  146. package/src/client/namespaces/GraphNamespace.ts +468 -468
  147. package/src/client/namespaces/IndexNamespace.ts +361 -361
  148. package/src/client/namespaces/MemoryNamespace.ts +1422 -1135
  149. package/src/client/namespaces/PermissionsNamespace.ts +254 -254
  150. package/src/client/namespaces/PipelineNamespace.ts +220 -220
  151. package/src/client/namespaces/SearchNamespace.ts +1049 -1049
  152. package/src/client/namespaces/StorageNamespace.ts +458 -458
  153. package/src/client/namespaces/TxNamespace.ts +260 -260
  154. package/src/client/namespaces/WalletNamespace.ts +243 -243
  155. package/src/client/namespaces/consolidated/AINamespace.ts +449 -449
  156. package/src/client/namespaces/consolidated/BlockchainNamespace.ts +607 -546
  157. package/src/client/namespaces/consolidated/SecurityNamespace.ts +648 -648
  158. package/src/client/namespaces/consolidated/StorageNamespace.ts +1141 -497
  159. package/src/client/namespaces/consolidated/index.ts +39 -39
  160. package/src/client/signers/KeypairSigner.ts +108 -108
  161. package/src/client/signers/UnifiedSigner.ts +110 -110
  162. package/src/client/signers/WalletAdapterSigner.ts +159 -159
  163. package/src/client/signers/index.ts +26 -26
  164. package/src/config/ConfigurationHelper.ts +412 -412
  165. package/src/config/defaults.ts +51 -51
  166. package/src/config/index.ts +8 -8
  167. package/src/config/validation.ts +70 -70
  168. package/src/core/index.ts +14 -14
  169. package/src/core/interfaces/IService.ts +307 -307
  170. package/src/core/interfaces/index.ts +8 -8
  171. package/src/core/types/capability.ts +297 -297
  172. package/src/core/types/index.ts +870 -870
  173. package/src/core/types/wallet.ts +270 -270
  174. package/src/core/types.ts +9 -9
  175. package/src/core/wallet.ts +222 -222
  176. package/src/embedding/index.ts +19 -19
  177. package/src/embedding/types.ts +357 -357
  178. package/src/errors/index.ts +602 -602
  179. package/src/errors/recovery.ts +461 -461
  180. package/src/errors/validation.ts +567 -567
  181. package/src/generated/pdw/capability.ts +319 -319
  182. package/src/graph/GraphService.ts +887 -887
  183. package/src/graph/KnowledgeGraphManager.ts +728 -728
  184. package/src/graph/index.ts +25 -25
  185. package/src/index.ts +498 -474
  186. package/src/infrastructure/index.ts +22 -22
  187. package/src/infrastructure/seal/EncryptionService.ts +628 -603
  188. package/src/infrastructure/seal/SealService.ts +613 -615
  189. package/src/infrastructure/seal/index.ts +9 -9
  190. package/src/infrastructure/sui/BlockchainManager.ts +627 -627
  191. package/src/infrastructure/sui/SuiService.ts +888 -888
  192. package/src/infrastructure/sui/index.ts +9 -9
  193. package/src/infrastructure/walrus/StorageManager.ts +604 -604
  194. package/src/infrastructure/walrus/WalrusStorageService.ts +612 -612
  195. package/src/infrastructure/walrus/index.ts +9 -9
  196. package/src/langchain/PDWEmbeddings.ts +145 -145
  197. package/src/langchain/PDWVectorStore.ts +456 -456
  198. package/src/langchain/createPDWRAG.ts +303 -303
  199. package/src/langchain/index.ts +47 -47
  200. package/src/permissions/ConsentRepository.browser.ts +249 -249
  201. package/src/permissions/ConsentRepository.ts +364 -364
  202. package/src/pipeline/MemoryPipeline.ts +862 -862
  203. package/src/pipeline/PipelineManager.ts +683 -683
  204. package/src/pipeline/index.ts +26 -26
  205. package/src/retrieval/AdvancedSearchService.ts +629 -629
  206. package/src/retrieval/MemoryAnalyticsService.ts +711 -711
  207. package/src/retrieval/MemoryDecryptionPipeline.ts +825 -824
  208. package/src/retrieval/MemoryRetrievalService.ts +904 -830
  209. package/src/retrieval/index.ts +42 -42
  210. package/src/services/BatchService.ts +352 -352
  211. package/src/services/CapabilityService.ts +464 -448
  212. package/src/services/ClassifierService.ts +465 -465
  213. package/src/services/CrossContextPermissionService.ts +486 -484
  214. package/src/services/EmbeddingService.ts +771 -706
  215. package/src/services/EncryptionService.ts +712 -711
  216. package/src/services/GeminiAIService.ts +753 -753
  217. package/src/services/IndexManager.ts +977 -1004
  218. package/src/services/MemoryIndexService.ts +1003 -1003
  219. package/src/services/MemoryService.ts +369 -369
  220. package/src/services/QueryService.ts +890 -890
  221. package/src/services/StorageService.ts +1182 -1111
  222. package/src/services/TransactionService.ts +838 -790
  223. package/src/services/VectorService.ts +462 -462
  224. package/src/services/ViewService.ts +484 -484
  225. package/src/services/index.ts +25 -25
  226. package/src/services/storage/BlobAttributesManager.ts +333 -333
  227. package/src/services/storage/KnowledgeGraphManager.ts +425 -425
  228. package/src/services/storage/MemorySearchManager.ts +387 -387
  229. package/src/services/storage/QuiltBatchManager.ts +1130 -660
  230. package/src/services/storage/WalrusMetadataManager.ts +268 -268
  231. package/src/services/storage/WalrusStorageManager.ts +287 -287
  232. package/src/services/storage/index.ts +57 -52
  233. package/src/types/index.ts +13 -13
  234. package/src/utils/LRUCache.ts +378 -0
  235. package/src/utils/index.ts +76 -68
  236. package/src/utils/memoryIndexOnChain.ts +507 -0
  237. package/src/utils/rebuildIndex.ts +290 -290
  238. package/src/utils/rebuildIndexNode.ts +771 -424
  239. package/src/vector/BrowserHnswIndexService.ts +758 -758
  240. package/src/vector/HnswWasmService.ts +731 -679
  241. package/src/vector/IHnswService.ts +233 -224
  242. package/src/vector/NodeHnswService.ts +833 -735
  243. package/src/vector/VectorManager.ts +478 -478
  244. package/src/vector/createHnswService.ts +135 -135
  245. package/src/vector/index.ts +56 -56
  246. package/src/wallet/ContextWalletService.ts +656 -656
  247. package/src/wallet/MainWalletService.ts +317 -317
package/src/services/EmbeddingService.ts
@@ -1,706 +1,771 @@
1
- /**
2
- * EmbeddingService - AI SDK Integration
3
- *
4
- * Refactored to use Vercel AI SDK as the underlying embedding provider.
5
- * Supports any AI SDK compatible provider (OpenAI, Google, Cohere, etc.)
6
- * while maintaining backward compatibility with existing PDW code.
7
- *
8
- * OpenRouter now uses the official @openrouter/sdk instead of raw fetch calls.
9
- *
10
- * Key features:
11
- * - Provider-agnostic: Accept any ai-sdk EmbeddingModel
12
- * - Backward compatible: Existing code continues to work
13
- * - Flexible configuration: Direct model OR provider config
14
- */
15
-
16
- import type { EmbeddingModelV2 } from '@ai-sdk/provider';
17
- import { embed, embedMany } from 'ai';
18
- import { createGoogleGenerativeAI } from '@ai-sdk/google';
19
- import { createOpenAI } from '@ai-sdk/openai';
20
- import { OpenRouter } from '@openrouter/sdk';
21
-
22
- // Type alias for embedding models - V2 is the default in AI SDK v5
23
- type EmbeddingModel<VALUE> = EmbeddingModelV2<VALUE>;
24
-
25
- // Provider instances (lazily initialized)
26
- let googleProvider: ReturnType<typeof createGoogleGenerativeAI> | null = null;
27
- let openaiProvider: ReturnType<typeof createOpenAI> | null = null;
28
- let openrouterProvider: ReturnType<typeof createOpenAI> | null = null;
29
- let cohereProvider: any = null;
30
-
31
- export interface EmbeddingConfig {
32
- /**
33
- * Option 1: Direct ai-sdk model (most flexible)
34
- * User provides their own EmbeddingModel from any provider
35
- *
36
- * For backward compatibility, also accepts string (treated as modelName)
37
- *
38
- * @example
39
- * ```typescript
40
- * import { openai } from '@ai-sdk/openai';
41
- * const service = new EmbeddingService({
42
- * model: openai.embedding('text-embedding-3-large')
43
- * });
44
- *
45
- * // Backward compatible:
46
- * const service = new EmbeddingService({
47
- * model: 'text-embedding-004', // Treated as modelName
48
- * apiKey: 'your-key'
49
- * });
50
- * ```
51
- */
52
- model?: EmbeddingModel<string> | string;
53
-
54
- /**
55
- * Option 2: Provider-based configuration
56
- * PDW creates the model from provider settings
57
- *
58
- * - google: Direct Google AI API
59
- * - openai: Direct OpenAI API
60
- * - openrouter: OpenRouter API gateway (supports multiple models)
61
- * - cohere: Direct Cohere API
62
- */
63
- provider?: 'google' | 'openai' | 'openrouter' | 'cohere';
64
-
65
- /**
66
- * API key for the provider
67
- * Falls back to environment variables:
68
- * - GEMINI_API_KEY or GOOGLE_AI_API_KEY (for google)
69
- * - OPENAI_API_KEY (for openai)
70
- * - OPENROUTER_API_KEY (for openrouter)
71
- * - COHERE_API_KEY (for cohere)
72
- */
73
- apiKey?: string;
74
-
75
- /**
76
- * Model name to use
77
- * - Google: 'text-embedding-004', 'gemini-embedding-001'
78
- * - OpenAI: 'text-embedding-3-small', 'text-embedding-3-large'
79
- * - OpenRouter: 'google/gemini-embedding-001', 'openai/text-embedding-3-small', etc.
80
- * - Cohere: 'embed-english-v3.0', 'embed-multilingual-v3.0'
81
- */
82
- modelName?: string;
83
-
84
- /**
85
- * Embedding dimensions (optional, provider-dependent)
86
- * - Google: Up to 768
87
- * - OpenAI: 256, 512, 1024, 1536, 3072 (depending on model)
88
- * - OpenRouter: Depends on the underlying model
89
- * - Cohere: Model-specific
90
- */
91
- dimensions?: number;
92
-
93
- /**
94
- * Rate limiting
95
- */
96
- requestsPerMinute?: number;
97
- }
98
-
99
- export interface EmbeddingOptions {
100
- text: string;
101
- type?: 'content' | 'metadata' | 'query';
102
- taskType?: 'RETRIEVAL_QUERY' | 'RETRIEVAL_DOCUMENT' | 'SEMANTIC_SIMILARITY';
103
- }
104
-
105
- export interface EmbeddingResult {
106
- vector: number[];
107
- dimension: number;
108
- model: string;
109
- processingTime: number;
110
- tokenCount?: number;
111
- }
112
-
113
- export interface BatchEmbeddingResult {
114
- vectors: number[][];
115
- dimension: number;
116
- model: string;
117
- totalProcessingTime: number;
118
- averageProcessingTime: number;
119
- successCount: number;
120
- failedCount: number;
121
- }
122
-
123
- /**
124
- * Embedding service using Vercel AI SDK
125
- * Supports all AI SDK compatible providers
126
- * OpenRouter uses the official @openrouter/sdk for better type safety
127
- */
128
- export class EmbeddingService {
129
- private embeddingModel: EmbeddingModel<string> | null = null;
130
- private modelName: string;
131
- private dimensions: number;
132
- private requestCount = 0;
133
- private lastReset = Date.now();
134
- private readonly maxRequestsPerMinute: number;
135
- private provider: 'google' | 'openai' | 'openrouter' | 'cohere' | 'custom';
136
- private apiKey: string = '';
137
- private openRouterClient: OpenRouter | null = null;
138
-
139
- constructor(config: EmbeddingConfig = {}) {
140
- this.maxRequestsPerMinute = config.requestsPerMinute || 1500;
141
-
142
- // Case 1: Direct model provided (most flexible)
143
- if (config.model) {
144
- // Backward compatibility: If model is a string, treat as modelName
145
- if (typeof config.model === 'string') {
146
- const modelNameFromString = config.model;
147
- console.log(`🔄 Backward compatibility: treating model string "${modelNameFromString}" as modelName`);
148
-
149
- // Treat string as modelName and use provider config path
150
- const provider = config.provider || 'google';
151
- this.apiKey = this.resolveApiKey(provider, config.apiKey);
152
-
153
- if (!this.apiKey) {
154
- throw new Error(
155
- `API key is required for ${provider} provider. ` +
156
- `Provide it via config.apiKey or environment variable.`
157
- );
158
- }
159
-
160
- this.provider = provider;
161
- this.modelName = modelNameFromString;
162
- this.dimensions = config.dimensions || this.getDefaultDimensions(provider);
163
-
164
- // OpenRouter uses SDK, others use AI SDK
165
- if (provider === 'openrouter') {
166
- this.openRouterClient = new OpenRouter({ apiKey: this.apiKey });
167
- } else {
168
- this.embeddingModel = this.createModel(provider, this.apiKey, this.modelName);
169
- }
170
-
171
- console.log(`✅ EmbeddingService initialized with ${provider} provider (${this.modelName}) [backward compat mode]`);
172
- return;
173
- }
174
-
175
- // New behavior: Direct EmbeddingModel from ai-sdk
176
- this.embeddingModel = config.model;
177
- this.modelName = 'custom';
178
- this.dimensions = config.dimensions || 3072;
179
- this.provider = 'custom';
180
- console.log('✅ EmbeddingService initialized with custom ai-sdk model');
181
- return;
182
- }
183
-
184
- // Case 2: Provider-based configuration
185
- const provider = config.provider || 'google'; // Default to google for backward compat
186
- this.apiKey = this.resolveApiKey(provider, config.apiKey);
187
-
188
- if (!this.apiKey) {
189
- throw new Error(
190
- `API key is required for ${provider} provider. ` +
191
- `Provide it via config.apiKey or environment variable.`
192
- );
193
- }
194
-
195
- this.provider = provider;
196
- this.modelName = config.modelName || this.getDefaultModelName(provider);
197
- this.dimensions = config.dimensions || this.getDefaultDimensions(provider);
198
-
199
- // OpenRouter uses SDK, others use AI SDK
200
- if (provider === 'openrouter') {
201
- this.openRouterClient = new OpenRouter({ apiKey: this.apiKey });
202
- } else {
203
- this.embeddingModel = this.createModel(provider, this.apiKey, this.modelName);
204
- }
205
-
206
- console.log(`✅ EmbeddingService initialized with ${provider} provider (${this.modelName})`);
207
- }
208
-
209
- /**
210
- * Resolve API key from config or environment
211
- */
212
- private resolveApiKey(provider: string, configKey?: string): string {
213
- if (configKey) return configKey;
214
-
215
- switch (provider) {
216
- case 'google':
217
- return process.env.GEMINI_API_KEY || process.env.GOOGLE_AI_API_KEY || '';
218
- case 'openai':
219
- return process.env.OPENAI_API_KEY || '';
220
- case 'openrouter':
221
- return process.env.OPENROUTER_API_KEY || '';
222
- case 'cohere':
223
- return process.env.COHERE_API_KEY || '';
224
- default:
225
- return '';
226
- }
227
- }
228
-
229
- /**
230
- * Get default model name for provider
231
- */
232
- private getDefaultModelName(provider: string): string {
233
- switch (provider) {
234
- case 'google':
235
- return 'text-embedding-004';
236
- case 'openai':
237
- return 'text-embedding-3-small';
238
- case 'openrouter':
239
- return 'google/gemini-embedding-001'; // Default OpenRouter embedding model
240
- case 'cohere':
241
- return 'embed-english-v3.0';
242
- default:
243
- return 'text-embedding-004';
244
- }
245
- }
246
-
247
- /**
248
- * Get default dimensions for provider
249
- */
250
- private getDefaultDimensions(provider: string): number {
251
- switch (provider) {
252
- case 'google':
253
- return 3072;
254
- case 'openai':
255
- return 1536; // text-embedding-3-small default
256
- case 'openrouter':
257
- return 3072; // google/gemini-embedding-001 returns 3072 dimensions
258
- case 'cohere':
259
- return 1024;
260
- default:
261
- return 3072;
262
- }
263
- }
264
-
265
- /**
266
- * Create embedding model from provider
267
- */
268
- private createModel(
269
- provider: string,
270
- apiKey: string,
271
- modelName: string
272
- ): EmbeddingModel<string> {
273
- switch (provider) {
274
- case 'google': {
275
- if (!googleProvider) {
276
- googleProvider = createGoogleGenerativeAI({ apiKey });
277
- }
278
- return googleProvider.textEmbeddingModel(modelName);
279
- }
280
-
281
- case 'openai': {
282
- if (!openaiProvider) {
283
- openaiProvider = createOpenAI({ apiKey });
284
- }
285
- // OpenAI returns EmbeddingModelV2 but is compatible with ai SDK
286
- return openaiProvider.textEmbeddingModel(modelName) as unknown as EmbeddingModel<string>;
287
- }
288
-
289
- case 'openrouter': {
290
- // OpenRouter uses OpenAI-compatible API with custom baseURL
291
- if (!openrouterProvider) {
292
- openrouterProvider = createOpenAI({
293
- baseURL: 'https://openrouter.ai/api/v1',
294
- apiKey,
295
- });
296
- }
297
- // OpenRouter embedding models use the same interface as OpenAI
298
- return openrouterProvider.textEmbeddingModel(modelName) as unknown as EmbeddingModel<string>;
299
- }
300
-
301
- case 'cohere': {
302
- if (!cohereProvider) {
303
- throw new Error(
304
- 'Cohere provider requires manual initialization. ' +
305
- 'Import createCohere from @ai-sdk/cohere and set cohereProvider before use.'
306
- );
307
- }
308
- return cohereProvider.textEmbedding(modelName);
309
- }
310
-
311
- default:
312
- throw new Error(`Unsupported provider: ${provider}`);
313
- }
314
- }
315
-
316
- /**
317
- * Generate embedding for a single text
318
- */
319
- async embedText(options: EmbeddingOptions): Promise<EmbeddingResult> {
320
- const startTime = Date.now();
321
-
322
- // Validate input
323
- if (!options.text || typeof options.text !== 'string' || options.text.trim().length === 0) {
324
- throw new Error('Invalid or empty text provided for embedding');
325
- }
326
-
327
- await this.checkRateLimit();
328
-
329
- try {
330
- // OpenRouter uses native fetch API for better compatibility
331
- if (this.provider === 'openrouter') {
332
- return await this.embedTextOpenRouter(options.text, startTime);
333
- }
334
-
335
- // Other providers use AI SDK
336
- if (!this.embeddingModel) {
337
- throw new Error('Embedding model not initialized');
338
- }
339
-
340
- const result = await embed({
341
- model: this.embeddingModel,
342
- value: options.text,
343
- ...this.getProviderOptions(options),
344
- });
345
-
346
- this.requestCount++;
347
-
348
- return {
349
- vector: result.embedding,
350
- dimension: result.embedding.length,
351
- model: this.modelName,
352
- processingTime: Date.now() - startTime,
353
- tokenCount: result.usage?.tokens,
354
- };
355
- } catch (error) {
356
- throw new Error(
357
- `Embedding generation failed: ${error instanceof Error ? error.message : 'Unknown error'}`
358
- );
359
- }
360
- }
361
-
362
- /**
363
- * Generate embedding using OpenRouter SDK
364
- * Uses official @openrouter/sdk for embeddings
365
- */
366
- private async embedTextOpenRouter(text: string, startTime: number): Promise<EmbeddingResult> {
367
- if (!this.openRouterClient) {
368
- throw new Error('OpenRouter client not initialized');
369
- }
370
-
371
- const result = await this.openRouterClient.embeddings.generate({
372
- model: this.modelName,
373
- input: text
374
- });
375
-
376
- // Handle union type - result can be string or object
377
- if (typeof result === 'string') {
378
- throw new Error('Unexpected string response from OpenRouter embeddings API');
379
- }
380
-
381
- const data = (result as any).data;
382
- if (!data || !data[0] || !data[0].embedding) {
383
- throw new Error('Invalid response from OpenRouter embeddings API');
384
- }
385
-
386
- this.requestCount++;
387
-
388
- // Handle embedding which can be string or number[]
389
- const embedding = data[0].embedding;
390
- const vector = typeof embedding === 'string'
391
- ? JSON.parse(embedding) as number[]
392
- : embedding as number[];
393
-
394
- const usage = (result as any).usage;
395
-
396
- return {
397
- vector,
398
- dimension: vector.length,
399
- model: this.modelName,
400
- processingTime: Date.now() - startTime,
401
- tokenCount: usage?.totalTokens
402
- };
403
- }
404
-
405
- /**
406
- * Generate embeddings for multiple texts (batched)
407
- */
408
- async embedBatch(
409
- texts: string[],
410
- options: Omit<EmbeddingOptions, 'text'> = {}
411
- ): Promise<BatchEmbeddingResult> {
412
- const startTime = Date.now();
413
- let successCount = 0;
414
- let failedCount = 0;
415
-
416
- try {
417
- await this.checkRateLimit();
418
-
419
- // OpenRouter uses native fetch API for better compatibility
420
- if (this.provider === 'openrouter') {
421
- return await this.embedBatchOpenRouter(texts, startTime);
422
- }
423
-
424
- // Other providers use AI SDK
425
- if (!this.embeddingModel) {
426
- throw new Error('Embedding model not initialized');
427
- }
428
-
429
- const result = await embedMany({
430
- model: this.embeddingModel,
431
- values: texts,
432
- ...this.getProviderOptions(options as EmbeddingOptions),
433
- });
434
-
435
- successCount = result.embeddings.length;
436
- const totalTime = Date.now() - startTime;
437
-
438
- return {
439
- vectors: result.embeddings,
440
- dimension: result.embeddings[0]?.length || this.dimensions,
441
- model: this.modelName,
442
- totalProcessingTime: totalTime,
443
- averageProcessingTime: totalTime / texts.length,
444
- successCount,
445
- failedCount,
446
- };
447
- } catch (error) {
448
- throw new Error(
449
- `Batch embedding failed: ${error instanceof Error ? error.message : 'Unknown error'}`
450
- );
451
- }
452
- }
453
-
454
- /**
455
- * Generate batch embeddings using OpenRouter SDK
456
- */
457
- private async embedBatchOpenRouter(texts: string[], startTime: number): Promise<BatchEmbeddingResult> {
458
- if (!this.openRouterClient) {
459
- throw new Error('OpenRouter client not initialized');
460
- }
461
-
462
- const result = await this.openRouterClient.embeddings.generate({
463
- model: this.modelName,
464
- input: texts
465
- });
466
-
467
- // Handle union type - result can be string or object
468
- if (typeof result === 'string') {
469
- throw new Error('Unexpected string response from OpenRouter embeddings API');
470
- }
471
-
472
- const data = (result as any).data;
473
- if (!data || !Array.isArray(data)) {
474
- throw new Error('Invalid response from OpenRouter embeddings API');
475
- }
476
-
477
- // Sort by index to ensure correct order
478
- const sortedData = [...data].sort((a: any, b: any) => (a.index || 0) - (b.index || 0));
479
- const vectors = sortedData.map((item: any) => {
480
- const embedding = item.embedding;
481
- return typeof embedding === 'string'
482
- ? JSON.parse(embedding) as number[]
483
- : embedding as number[];
484
- });
485
-
486
- this.requestCount++;
487
- const totalTime = Date.now() - startTime;
488
-
489
- return {
490
- vectors,
491
- dimension: vectors[0]?.length || this.dimensions,
492
- model: this.modelName,
493
- totalProcessingTime: totalTime,
494
- averageProcessingTime: totalTime / texts.length,
495
- successCount: vectors.length,
496
- failedCount: texts.length - vectors.length
497
- };
498
- }
499
-
500
- /**
501
- * Get provider-specific options
502
- */
503
- private getProviderOptions(options: EmbeddingOptions): any {
504
- const providerOpts: any = {};
505
-
506
- if (this.provider === 'google') {
507
- providerOpts.providerOptions = {
508
- google: {
509
- outputDimensionality: this.dimensions,
510
- taskType: this.getGoogleTaskType(options.type),
511
- },
512
- };
513
- } else if (this.provider === 'openai') {
514
- providerOpts.providerOptions = {
515
- openai: {
516
- dimensions: this.dimensions,
517
- },
518
- };
519
- } else if (this.provider === 'openrouter') {
520
- // OpenRouter uses OpenAI-compatible options
521
- // Note: dimensions may not be supported for all models via OpenRouter
522
- providerOpts.providerOptions = {
523
- openai: {
524
- dimensions: this.dimensions,
525
- },
526
- };
527
- } else if (this.provider === 'cohere') {
528
- providerOpts.providerOptions = {
529
- cohere: {
530
- inputType: this.getCohereInputType(options.type),
531
- },
532
- };
533
- }
534
-
535
- return providerOpts;
536
- }
537
-
538
/**
 * Translate a PDW embedding type into a Google task type string.
 *
 * `'query'` maps to `RETRIEVAL_QUERY`, `'metadata'` to
 * `SEMANTIC_SIMILARITY`; `'content'` and anything else (including
 * `undefined`) map to `RETRIEVAL_DOCUMENT`.
 */
private getGoogleTaskType(type?: string): string {
  if (type === 'query') {
    return 'RETRIEVAL_QUERY';
  }
  if (type === 'metadata') {
    return 'SEMANTIC_SIMILARITY';
  }
  return 'RETRIEVAL_DOCUMENT';
}
553
-
554
/**
 * Translate a PDW embedding type into a Cohere input type string.
 *
 * Only `'query'` yields `search_query`; every other value (including
 * `undefined`) yields `search_document`.
 */
private getCohereInputType(type?: string): string {
  return type === 'query' ? 'search_query' : 'search_document';
}
567
-
568
/**
 * Cosine similarity of two equal-length vectors.
 *
 * @returns `dot(a, b) / (|a| * |b|)`, or `0` when either vector has zero
 *          magnitude.
 * @throws Error when the vectors differ in length.
 */
calculateCosineSimilarity(vectorA: number[], vectorB: number[]): number {
  const size = vectorA.length;
  if (size !== vectorB.length) {
    throw new Error(`Vector dimension mismatch: ${vectorA.length} vs ${vectorB.length}`);
  }

  let dot = 0;
  let squaredA = 0;
  let squaredB = 0;
  let idx = 0;

  // Single pass accumulating the dot product and both squared norms.
  while (idx < size) {
    const a = vectorA[idx];
    const b = vectorB[idx];
    dot += a * b;
    squaredA += a * a;
    squaredB += b * b;
    idx++;
  }

  const denominator = Math.sqrt(squaredA) * Math.sqrt(squaredB);

  // A zero-magnitude vector has no direction; report no similarity.
  return denominator === 0 ? 0 : dot / denominator;
}
594
-
595
/**
 * Euclidean (L2) distance between two equal-length vectors.
 *
 * @throws Error when the vectors differ in length.
 */
calculateEuclideanDistance(vectorA: number[], vectorB: number[]): number {
  const size = vectorA.length;
  if (size !== vectorB.length) {
    throw new Error(`Vector dimension mismatch: ${vectorA.length} vs ${vectorB.length}`);
  }

  let squaredTotal = 0;
  let idx = 0;
  while (idx < size) {
    const delta = vectorA[idx] - vectorB[idx];
    squaredTotal += delta * delta;
    idx++;
  }

  return Math.sqrt(squaredTotal);
}
611
-
612
/**
 * Scale a vector to unit length.
 *
 * A zero-magnitude vector cannot be scaled and is handed back as the same
 * array instance; otherwise a new array is returned.
 */
normalizeVector(vector: number[]): number[] {
  const squaredNorm = vector.reduce((acc, component) => acc + component * component, 0);
  const length = Math.sqrt(squaredNorm);

  return length === 0 ? vector : vector.map(component => component / length);
}
624
-
625
/**
 * Rank candidate vectors against a query vector.
 *
 * Each candidate is scored with cosine similarity and Euclidean distance;
 * results are ordered by descending similarity and cut to the first `k`.
 *
 * @param queryVector      Vector to compare against.
 * @param candidateVectors Vectors to rank; `index` in the result refers to
 *                         positions in this array.
 * @param k                Number of results to keep (default 5).
 */
findMostSimilar(
  queryVector: number[],
  candidateVectors: number[][],
  k: number = 5
): Array<{ index: number; similarity: number; distance: number }> {
  const scored: Array<{ index: number; similarity: number; distance: number }> = [];

  for (let index = 0; index < candidateVectors.length; index++) {
    const candidate = candidateVectors[index];
    const similarity = this.calculateCosineSimilarity(queryVector, candidate);
    const distance = this.calculateEuclideanDistance(queryVector, candidate);
    scored.push({ index, similarity, distance });
  }

  // Highest similarity first.
  scored.sort((left, right) => right.similarity - left.similarity);

  return scored.slice(0, k);
}
644
-
645
/**
 * Snapshot of this service's configuration and request counters.
 *
 * `requestsThisMinute` is the current counter while the last reset is less
 * than 60 seconds old, otherwise `0`. `totalRequests` reports that same
 * counter as-is.
 */
getStats(): {
  totalRequests: number;
  requestsThisMinute: number;
  model: string;
  dimensions: number;
  rateLimit: number;
  provider: string;
} {
  const elapsedSinceReset = Date.now() - this.lastReset;
  const withinWindow = elapsedSinceReset < 60000;

  return {
    totalRequests: this.requestCount,
    requestsThisMinute: withinWindow ? this.requestCount : 0,
    model: this.modelName,
    dimensions: this.dimensions,
    rateLimit: this.maxRequestsPerMinute,
    provider: this.provider,
  };
}
668
-
669
/**
 * Start a new rate-limit window once the current one is at least
 * 60 seconds old: zero the counter and stamp the new window start.
 */
private resetRateLimit(): void {
  const timestamp = Date.now();
  const windowExpired = timestamp - this.lastReset >= 60000;
  if (!windowExpired) {
    return;
  }

  this.requestCount = 0;
  this.lastReset = timestamp;
}
679
-
680
/**
 * Enforce the requests-per-minute budget.
 *
 * Rolls the window over if it has expired; if the budget is still used up,
 * sleeps for the remainder of the window and then rolls it over again.
 */
private async checkRateLimit(): Promise<void> {
  this.resetRateLimit();

  const budgetLeft = this.requestCount < this.maxRequestsPerMinute;
  if (budgetLeft) {
    return;
  }

  const waitTime = 60000 - (Date.now() - this.lastReset);
  if (waitTime <= 0) {
    return;
  }

  // Only surface the wait in development to keep production logs quiet.
  if (process.env.NODE_ENV === 'development') {
    console.warn(`Rate limit reached, waiting ${waitTime}ms`);
  }

  await this.delay(waitTime);
  this.resetRateLimit();
}
697
-
698
/**
 * Promise-based sleep.
 *
 * @param ms Time to wait, in milliseconds.
 */
private delay(ms: number): Promise<void> {
  return new Promise<void>((done) => {
    setTimeout(done, ms);
  });
}
704
- }
705
-
706
- export default EmbeddingService;
1
+ /**
2
+ * EmbeddingService - AI SDK Integration
3
+ *
4
+ * Refactored to use Vercel AI SDK as the underlying embedding provider.
5
+ * Supports any AI SDK compatible provider (OpenAI, Google, Cohere, etc.)
6
+ * while maintaining backward compatibility with existing PDW code.
7
+ *
8
+ * OpenRouter now uses the official @openrouter/sdk instead of raw fetch calls.
9
+ *
10
+ * Key features:
11
+ * - Provider-agnostic: Accept any ai-sdk EmbeddingModel
12
+ * - Backward compatible: Existing code continues to work
13
+ * - Flexible configuration: Direct model OR provider config
14
+ */
15
+
16
+ import type { EmbeddingModelV2 } from '@ai-sdk/provider';
17
+ import { embed, embedMany } from 'ai';
18
+ import { createGoogleGenerativeAI } from '@ai-sdk/google';
19
+ import { createOpenAI } from '@ai-sdk/openai';
20
+ import { OpenRouter } from '@openrouter/sdk';
21
+
22
// Type alias for embedding models - V2 is the default in AI SDK v5
type EmbeddingModel<VALUE> = EmbeddingModelV2<VALUE>;

// Provider instances (lazily initialized).
// These are module-level, so they are shared by every EmbeddingService
// instance; EmbeddingService.createModel populates them on first use.
let googleProvider: ReturnType<typeof createGoogleGenerativeAI> | null = null;
let openaiProvider: ReturnType<typeof createOpenAI> | null = null;
// OpenRouter is reached through the OpenAI-compatible factory (custom baseURL).
let openrouterProvider: ReturnType<typeof createOpenAI> | null = null;
// NOTE(review): nothing in this file assigns cohereProvider and it is not
// exported, so createModel('cohere', ...) throws — confirm intended wiring.
let cohereProvider: any = null;
30
+
31
/**
 * Configuration accepted by the EmbeddingService constructor.
 *
 * Either pass a ready-made ai-sdk model via `model`, or describe a provider
 * (`provider`, `apiKey`, `modelName`) and let the service build the model.
 */
export interface EmbeddingConfig {
  /**
   * Option 1: Direct ai-sdk model (most flexible)
   * User provides their own EmbeddingModel from any provider
   *
   * For backward compatibility, also accepts string (treated as modelName).
   * When a non-empty string is given it takes precedence over `modelName`,
   * and an API key is required exactly as in the provider-based path.
   *
   * @example
   * ```typescript
   * import { openai } from '@ai-sdk/openai';
   * const service = new EmbeddingService({
   *   model: openai.embedding('text-embedding-3-large')
   * });
   *
   * // Backward compatible:
   * const service = new EmbeddingService({
   *   model: 'text-embedding-004', // Treated as modelName
   *   apiKey: 'your-key'
   * });
   * ```
   */
  model?: EmbeddingModel<string> | string;

  /**
   * Option 2: Provider-based configuration
   * PDW creates the model from provider settings.
   * Defaults to 'google' when omitted.
   *
   * - google: Direct Google AI API
   * - openai: Direct OpenAI API
   * - openrouter: OpenRouter API gateway (supports multiple models)
   * - cohere: Direct Cohere API
   *   NOTE(review): in this file the Cohere provider instance is never
   *   assigned, so selecting 'cohere' throws during construction — confirm.
   */
  provider?: 'google' | 'openai' | 'openrouter' | 'cohere';

  /**
   * API key for the provider
   * Falls back to environment variables:
   * - GEMINI_API_KEY or GOOGLE_AI_API_KEY (for google)
   * - OPENAI_API_KEY (for openai)
   * - OPENROUTER_API_KEY (for openrouter)
   * - COHERE_API_KEY (for cohere)
   *
   * The constructor throws when no key can be resolved, unless a model
   * object was passed via `model`.
   */
  apiKey?: string;

  /**
   * Model name to use
   * - Google: 'text-embedding-004', 'gemini-embedding-001'
   * - OpenAI: 'text-embedding-3-small', 'text-embedding-3-large'
   * - OpenRouter: 'google/gemini-embedding-001', 'openai/text-embedding-3-small', etc.
   * - Cohere: 'embed-english-v3.0', 'embed-multilingual-v3.0'
   *
   * Defaults per provider: 'text-embedding-004' (google),
   * 'text-embedding-3-small' (openai), 'google/gemini-embedding-001'
   * (openrouter), 'embed-english-v3.0' (cohere).
   */
  modelName?: string;

  /**
   * Embedding dimensions (optional, provider-dependent)
   * - Google: Up to 3072
   * - OpenAI: 256, 512, 1024, 1536, 3072 (depending on model)
   * - OpenRouter: Depends on the underlying model
   * - Cohere: Model-specific
   *
   * Defaults when omitted: 3072 (google, openrouter, custom model object),
   * 1536 (openai), 1024 (cohere).
   */
  dimensions?: number;

  /**
   * Rate limiting: maximum requests per minute for this service instance.
   * Defaults to 1500.
   */
  requestsPerMinute?: number;
}
98
+
99
/**
 * Per-call options for generating an embedding.
 */
export interface EmbeddingOptions {
  /** Text to embed; must be a non-empty, non-whitespace string. */
  text: string;
  /** PDW-level purpose of the text; mapped to provider-specific task/input types. */
  type?: 'content' | 'metadata' | 'query';
  /** Google-style task type hint. */
  taskType?: 'RETRIEVAL_QUERY' | 'RETRIEVAL_DOCUMENT' | 'SEMANTIC_SIMILARITY';
}
104
+
105
/**
 * Result of embedding a single text.
 */
export interface EmbeddingResult {
  /** The embedding vector. */
  vector: number[];
  /** Length of `vector`. */
  dimension: number;
  /** Model name the service was configured with ('custom' for a user-supplied model). */
  model: string;
  /** Wall-clock time for the call, in milliseconds. */
  processingTime: number;
  /** Token usage reported by the provider, when available. */
  tokenCount?: number;
}
112
+
113
/**
 * Result of embedding a batch of texts.
 */
export interface BatchEmbeddingResult {
  /** One embedding vector per successfully embedded text. */
  vectors: number[][];
  /** Length of the first vector, or the configured dimensions when there is none. */
  dimension: number;
  /** Model name the service was configured with. */
  model: string;
  /** Wall-clock time for the whole batch, in milliseconds. */
  totalProcessingTime: number;
  /** `totalProcessingTime` divided by the number of input texts. */
  averageProcessingTime: number;
  /** Number of vectors returned. */
  successCount: number;
  /** Number of input texts for which no vector was returned. */
  failedCount: number;
}
122
+
123
/**
 * Embedding service backed by the Vercel AI SDK (`embed` / `embedMany`).
 * OpenRouter is the exception: it is served through the `@openrouter/sdk`
 * client rather than an AI SDK model.
 *
 * Besides generating embeddings the class offers small vector helpers
 * (cosine similarity, Euclidean distance, normalization, top-k search) and a
 * per-instance requests-per-minute limiter.
 */
export class EmbeddingService {
  /**
   * API key each module-level provider cache entry was built with, keyed by
   * provider name. Lets createModel detect that a cached provider belongs to
   * a different key and rebuild it instead of silently reusing the old key.
   */
  private static readonly providerApiKeys = new Map<string, string>();

  private embeddingModel: EmbeddingModel<string> | null = null;
  private modelName: string;
  private dimensions: number;
  /** Requests issued in the current rate-limit window (reset every minute). */
  private requestCount = 0;
  /** Requests issued over the lifetime of this instance (never reset). */
  private totalRequestCount = 0;
  private lastReset = Date.now();
  private readonly maxRequestsPerMinute: number;
  private provider: 'google' | 'openai' | 'openrouter' | 'cohere' | 'custom';
  private apiKey: string = '';
  private openRouterClient: OpenRouter | null = null;

  /**
   * @param config See EmbeddingConfig. A model object in `config.model` is
   *               used as-is; otherwise a provider-based model is created.
   * @throws Error when a provider-based configuration has no API key, or the
   *               provider model cannot be created.
   */
  constructor(config: EmbeddingConfig = {}) {
    this.maxRequestsPerMinute = config.requestsPerMinute || 1500;

    // Case 1: a ready-made ai-sdk model object was supplied.
    if (config.model && typeof config.model !== 'string') {
      this.embeddingModel = config.model;
      this.modelName = 'custom';
      this.dimensions = config.dimensions || 3072;
      this.provider = 'custom';
      console.log('✅ EmbeddingService initialized with custom ai-sdk model');
      return;
    }

    // Case 2: provider-based configuration. A non-empty string in
    // `config.model` is the legacy spelling of `modelName` and wins over it.
    const legacyModelName =
      typeof config.model === 'string' && config.model ? config.model : undefined;
    if (legacyModelName !== undefined) {
      console.log(`🔄 Backward compatibility: treating model string "${legacyModelName}" as modelName`);
    }

    const provider = config.provider || 'google'; // Default to google for backward compat
    this.apiKey = this.resolveApiKey(provider, config.apiKey);

    if (!this.apiKey) {
      throw new Error(
        `API key is required for ${provider} provider. ` +
        `Provide it via config.apiKey or environment variable.`
      );
    }

    this.provider = provider;
    this.modelName = legacyModelName ?? (config.modelName || this.getDefaultModelName(provider));
    this.dimensions = config.dimensions || this.getDefaultDimensions(provider);

    // OpenRouter goes through its own SDK client; everything else through the AI SDK.
    if (provider === 'openrouter') {
      this.openRouterClient = new OpenRouter({ apiKey: this.apiKey });
    } else {
      this.embeddingModel = this.createModel(provider, this.apiKey, this.modelName);
    }

    const suffix = legacyModelName !== undefined ? ' [backward compat mode]' : '';
    console.log(`✅ EmbeddingService initialized with ${provider} provider (${this.modelName})${suffix}`);
  }

  /**
   * Resolve the API key: the explicit config value wins, otherwise the
   * provider's environment variable(s). Returns '' when nothing is found.
   */
  private resolveApiKey(provider: string, configKey?: string): string {
    if (configKey) return configKey;

    switch (provider) {
      case 'google':
        return process.env.GEMINI_API_KEY || process.env.GOOGLE_AI_API_KEY || '';
      case 'openai':
        return process.env.OPENAI_API_KEY || '';
      case 'openrouter':
        return process.env.OPENROUTER_API_KEY || '';
      case 'cohere':
        return process.env.COHERE_API_KEY || '';
      default:
        return '';
    }
  }

  /**
   * Default model name for a provider (falls back to the Google default).
   */
  private getDefaultModelName(provider: string): string {
    switch (provider) {
      case 'google':
        return 'text-embedding-004';
      case 'openai':
        return 'text-embedding-3-small';
      case 'openrouter':
        return 'google/gemini-embedding-001'; // Default OpenRouter embedding model
      case 'cohere':
        return 'embed-english-v3.0';
      default:
        return 'text-embedding-004';
    }
  }

  /**
   * Default embedding dimensions for a provider (falls back to 3072).
   */
  private getDefaultDimensions(provider: string): number {
    switch (provider) {
      case 'google':
        return 3072;
      case 'openai':
        return 1536; // text-embedding-3-small default
      case 'openrouter':
        return 3072; // google/gemini-embedding-001 returns 3072 dimensions
      case 'cohere':
        return 1024;
      default:
        return 3072;
    }
  }

  /**
   * Create an AI SDK embedding model for a provider.
   *
   * Provider factories are cached at module level. A cached factory is only
   * reused when it was built with the same API key; otherwise it is rebuilt,
   * so a second service with a different key does not inherit the first key.
   *
   * @throws Error for 'cohere' when no Cohere provider instance is available,
   *               and for unknown providers.
   */
  private createModel(
    provider: string,
    apiKey: string,
    modelName: string
  ): EmbeddingModel<string> {
    const cachedKeyMatches = EmbeddingService.providerApiKeys.get(provider) === apiKey;

    switch (provider) {
      case 'google': {
        if (!googleProvider || !cachedKeyMatches) {
          googleProvider = createGoogleGenerativeAI({ apiKey });
          EmbeddingService.providerApiKeys.set(provider, apiKey);
        }
        return googleProvider.textEmbeddingModel(modelName);
      }

      case 'openai': {
        if (!openaiProvider || !cachedKeyMatches) {
          openaiProvider = createOpenAI({ apiKey });
          EmbeddingService.providerApiKeys.set(provider, apiKey);
        }
        // OpenAI returns EmbeddingModelV2 but is compatible with ai SDK
        return openaiProvider.textEmbeddingModel(modelName) as unknown as EmbeddingModel<string>;
      }

      case 'openrouter': {
        // OpenRouter uses OpenAI-compatible API with custom baseURL
        if (!openrouterProvider || !cachedKeyMatches) {
          openrouterProvider = createOpenAI({
            baseURL: 'https://openrouter.ai/api/v1',
            apiKey,
          });
          EmbeddingService.providerApiKeys.set(provider, apiKey);
        }
        // OpenRouter embedding models use the same interface as OpenAI
        return openrouterProvider.textEmbeddingModel(modelName) as unknown as EmbeddingModel<string>;
      }

      case 'cohere': {
        if (!cohereProvider) {
          throw new Error(
            'Cohere provider requires manual initialization. ' +
            'Import createCohere from @ai-sdk/cohere and set cohereProvider before use.'
          );
        }
        return cohereProvider.textEmbedding(modelName);
      }

      default:
        throw new Error(`Unsupported provider: ${provider}`);
    }
  }

  /**
   * Generate an embedding for a single text.
   *
   * @throws Error when the text is empty/whitespace or not a string, and
   *               (wrapped as "Embedding generation failed: ...") when the
   *               provider call fails.
   */
  async embedText(options: EmbeddingOptions): Promise<EmbeddingResult> {
    const startTime = Date.now();

    // Validate input
    if (!options.text || typeof options.text !== 'string' || options.text.trim().length === 0) {
      throw new Error('Invalid or empty text provided for embedding');
    }

    await this.checkRateLimit();

    try {
      // OpenRouter is served by the @openrouter/sdk client
      if (this.provider === 'openrouter') {
        return await this.embedTextOpenRouter(options.text, startTime);
      }

      // Other providers use AI SDK
      if (!this.embeddingModel) {
        throw new Error('Embedding model not initialized');
      }

      const result = await embed({
        model: this.embeddingModel,
        value: options.text,
        ...this.getProviderOptions(options),
      });

      this.recordRequest();

      return {
        vector: result.embedding,
        dimension: result.embedding.length,
        model: this.modelName,
        processingTime: Date.now() - startTime,
        tokenCount: result.usage?.tokens,
      };
    } catch (error) {
      throw new Error(
        `Embedding generation failed: ${error instanceof Error ? error.message : 'Unknown error'}`
      );
    }
  }

  /**
   * Generate a single embedding through the OpenRouter SDK client.
   *
   * @throws Error when the client is missing or the response has no usable
   *               first embedding.
   */
  private async embedTextOpenRouter(text: string, startTime: number): Promise<EmbeddingResult> {
    if (!this.openRouterClient) {
      throw new Error('OpenRouter client not initialized');
    }

    const result = await this.openRouterClient.embeddings.generate({
      model: this.modelName,
      input: text
    });

    // Handle union type - result can be string or object
    if (typeof result === 'string') {
      throw new Error('Unexpected string response from OpenRouter embeddings API');
    }

    const data = (result as any).data;
    if (!data || !data[0] || !data[0].embedding) {
      throw new Error('Invalid response from OpenRouter embeddings API');
    }

    this.recordRequest();

    const vector = this.parseOpenRouterEmbedding(data[0].embedding);
    const usage = (result as any).usage;

    return {
      vector,
      dimension: vector.length,
      model: this.modelName,
      processingTime: Date.now() - startTime,
      tokenCount: usage?.totalTokens
    };
  }

  /**
   * Generate embeddings for multiple texts in one provider call.
   *
   * An empty `texts` array returns an empty result without contacting the
   * provider (and without a NaN average).
   *
   * @throws Error (wrapped as "Batch embedding failed: ...") when the
   *               provider call fails.
   */
  async embedBatch(
    texts: string[],
    options: Omit<EmbeddingOptions, 'text'> = {}
  ): Promise<BatchEmbeddingResult> {
    const startTime = Date.now();

    if (texts.length === 0) {
      return {
        vectors: [],
        dimension: this.dimensions,
        model: this.modelName,
        totalProcessingTime: 0,
        averageProcessingTime: 0,
        successCount: 0,
        failedCount: 0,
      };
    }

    try {
      await this.checkRateLimit();

      // OpenRouter is served by the @openrouter/sdk client
      if (this.provider === 'openrouter') {
        return await this.embedBatchOpenRouter(texts, startTime);
      }

      // Other providers use AI SDK
      if (!this.embeddingModel) {
        throw new Error('Embedding model not initialized');
      }

      const result = await embedMany({
        model: this.embeddingModel,
        values: texts,
        ...this.getProviderOptions(options as EmbeddingOptions),
      });

      // Count the call so the rate limiter sees batch traffic too.
      this.recordRequest();

      const successCount = result.embeddings.length;
      const totalTime = Date.now() - startTime;

      return {
        vectors: result.embeddings,
        dimension: result.embeddings[0]?.length || this.dimensions,
        model: this.modelName,
        totalProcessingTime: totalTime,
        averageProcessingTime: totalTime / texts.length,
        successCount,
        failedCount: Math.max(0, texts.length - successCount),
      };
    } catch (error) {
      throw new Error(
        `Batch embedding failed: ${error instanceof Error ? error.message : 'Unknown error'}`
      );
    }
  }

  /**
   * Generate batch embeddings through the OpenRouter SDK client.
   * Response items are ordered by their `index` field before being returned.
   */
  private async embedBatchOpenRouter(texts: string[], startTime: number): Promise<BatchEmbeddingResult> {
    if (!this.openRouterClient) {
      throw new Error('OpenRouter client not initialized');
    }

    const result = await this.openRouterClient.embeddings.generate({
      model: this.modelName,
      input: texts
    });

    // Handle union type - result can be string or object
    if (typeof result === 'string') {
      throw new Error('Unexpected string response from OpenRouter embeddings API');
    }

    const data = (result as any).data;
    if (!data || !Array.isArray(data)) {
      throw new Error('Invalid response from OpenRouter embeddings API');
    }

    // Sort by index to ensure correct order (copy first; do not mutate the response)
    const sortedData = [...data].sort((a: any, b: any) => (a.index ?? 0) - (b.index ?? 0));
    const vectors = sortedData.map((item: any) => this.parseOpenRouterEmbedding(item.embedding));

    this.recordRequest();
    const totalTime = Date.now() - startTime;

    return {
      vectors,
      dimension: vectors[0]?.length || this.dimensions,
      model: this.modelName,
      totalProcessingTime: totalTime,
      // Guard the division so an empty input can never produce NaN.
      averageProcessingTime: texts.length > 0 ? totalTime / texts.length : 0,
      successCount: vectors.length,
      failedCount: Math.max(0, texts.length - vectors.length)
    };
  }

  /**
   * OpenRouter may return an embedding as a JSON string or as a number array.
   */
  private parseOpenRouterEmbedding(embedding: unknown): number[] {
    return typeof embedding === 'string'
      ? JSON.parse(embedding) as number[]
      : embedding as number[];
  }

  /**
   * Build the provider-specific extra options spread into embed/embedMany.
   *
   * For Google an explicit `options.taskType` takes precedence over the task
   * type derived from `options.type`. Returns `{}` for providers without
   * specific options (e.g. 'custom').
   */
  private getProviderOptions(options: EmbeddingOptions): any {
    const providerOpts: any = {};

    if (this.provider === 'google') {
      providerOpts.providerOptions = {
        google: {
          outputDimensionality: this.dimensions,
          taskType: options.taskType ?? this.getGoogleTaskType(options.type),
        },
      };
    } else if (this.provider === 'openai') {
      providerOpts.providerOptions = {
        openai: {
          dimensions: this.dimensions,
        },
      };
    } else if (this.provider === 'openrouter') {
      // OpenRouter uses OpenAI-compatible options
      // Note: dimensions may not be supported for all models via OpenRouter
      providerOpts.providerOptions = {
        openai: {
          dimensions: this.dimensions,
        },
      };
    } else if (this.provider === 'cohere') {
      providerOpts.providerOptions = {
        cohere: {
          inputType: this.getCohereInputType(options.type),
        },
      };
    }

    return providerOpts;
  }

  /**
   * Map PDW type to Google task type ('content' and unknown values map to
   * RETRIEVAL_DOCUMENT).
   */
  private getGoogleTaskType(type?: string): string {
    switch (type) {
      case 'query':
        return 'RETRIEVAL_QUERY';
      case 'content':
        return 'RETRIEVAL_DOCUMENT';
      case 'metadata':
        return 'SEMANTIC_SIMILARITY';
      default:
        return 'RETRIEVAL_DOCUMENT';
    }
  }

  /**
   * Map PDW type to Cohere input type (everything except 'query' maps to
   * search_document).
   */
  private getCohereInputType(type?: string): string {
    switch (type) {
      case 'query':
        return 'search_query';
      case 'content':
        return 'search_document';
      default:
        return 'search_document';
    }
  }

  /**
   * Calculate cosine similarity between two vectors.
   *
   * @returns The similarity, or 0 when either vector has zero magnitude.
   * @throws Error when the vectors differ in length.
   */
  calculateCosineSimilarity(vectorA: number[], vectorB: number[]): number {
    if (vectorA.length !== vectorB.length) {
      throw new Error(`Vector dimension mismatch: ${vectorA.length} vs ${vectorB.length}`);
    }

    let dotProduct = 0;
    let normA = 0;
    let normB = 0;

    for (let i = 0; i < vectorA.length; i++) {
      dotProduct += vectorA[i] * vectorB[i];
      normA += vectorA[i] * vectorA[i];
      normB += vectorB[i] * vectorB[i];
    }

    const magnitude = Math.sqrt(normA) * Math.sqrt(normB);

    if (magnitude === 0) {
      return 0;
    }

    return dotProduct / magnitude;
  }

  /**
   * Calculate Euclidean distance between two vectors.
   *
   * @throws Error when the vectors differ in length.
   */
  calculateEuclideanDistance(vectorA: number[], vectorB: number[]): number {
    if (vectorA.length !== vectorB.length) {
      throw new Error(`Vector dimension mismatch: ${vectorA.length} vs ${vectorB.length}`);
    }

    let sum = 0;
    for (let i = 0; i < vectorA.length; i++) {
      const diff = vectorA[i] - vectorB[i];
      sum += diff * diff;
    }

    return Math.sqrt(sum);
  }

  /**
   * Normalize a vector to unit length.
   *
   * Always returns a new array; a zero-magnitude vector is returned as an
   * unchanged copy so callers can mutate the result without touching the input.
   */
  normalizeVector(vector: number[]): number[] {
    const magnitude = Math.sqrt(vector.reduce((sum, val) => sum + val * val, 0));

    if (magnitude === 0) {
      return [...vector];
    }

    return vector.map(val => val / magnitude);
  }

  /**
   * Find the most similar vectors to a query vector.
   *
   * @param k Maximum number of results (default 5); negative values are
   *          treated as 0.
   * @returns Candidates ordered by descending cosine similarity, each with
   *          its position in `candidateVectors`.
   */
  findMostSimilar(
    queryVector: number[],
    candidateVectors: number[][],
    k: number = 5
  ): Array<{ index: number; similarity: number; distance: number }> {
    const similarities = candidateVectors.map((vector, index) => {
      const similarity = this.calculateCosineSimilarity(queryVector, vector);
      const distance = this.calculateEuclideanDistance(queryVector, vector);

      return { index, similarity, distance };
    });

    similarities.sort((a, b) => b.similarity - a.similarity);

    // A negative k would make slice() drop items from the end instead.
    return similarities.slice(0, Math.max(0, k));
  }

  /**
   * Get embedding statistics.
   *
   * `totalRequests` is the lifetime count for this instance;
   * `requestsThisMinute` is the count inside the current rate-limit window.
   */
  getStats(): {
    totalRequests: number;
    requestsThisMinute: number;
    model: string;
    dimensions: number;
    rateLimit: number;
    provider: string;
  } {
    const now = Date.now();
    const requestsThisMinute = (now - this.lastReset) < 60000 ? this.requestCount : 0;

    return {
      totalRequests: this.totalRequestCount,
      requestsThisMinute,
      model: this.modelName,
      dimensions: this.dimensions,
      rateLimit: this.maxRequestsPerMinute,
      provider: this.provider,
    };
  }

  /**
   * Record one completed provider request in both counters.
   */
  private recordRequest(): void {
    this.requestCount++;
    this.totalRequestCount++;
  }

  /**
   * Reset the per-minute counter once the current window is 60s old.
   */
  private resetRateLimit(): void {
    const now = Date.now();
    if (now - this.lastReset >= 60000) {
      this.requestCount = 0;
      this.lastReset = now;
    }
  }

  /**
   * Check rate limiting and wait for the rest of the window if the budget
   * is exhausted.
   */
  private async checkRateLimit(): Promise<void> {
    this.resetRateLimit();

    if (this.requestCount >= this.maxRequestsPerMinute) {
      const waitTime = 60000 - (Date.now() - this.lastReset);
      if (waitTime > 0) {
        if (process.env.NODE_ENV === 'development') {
          console.warn(`Rate limit reached, waiting ${waitTime}ms`);
        }
        await this.delay(waitTime);
        this.resetRateLimit();
      }
    }
  }

  /**
   * Utility delay function (resolves after `ms` milliseconds).
   */
  private delay(ms: number): Promise<void> {
    return new Promise(resolve => setTimeout(resolve, ms));
  }
}
705
+
706
+ export default EmbeddingService;
707
+
708
+ // ==================== Singleton Pattern ====================
709
+
710
/**
 * Identity tags for custom model objects passed via `config.model`.
 * A WeakMap keeps the tag stable per object without keeping the model alive.
 */
const customModelIds = new WeakMap<object, number>();
let nextCustomModelId = 1;

/**
 * Generate config key for singleton cache.
 *
 * - Provider-based configs (including the legacy string `model`) keep the
 *   `provider:modelName:dimensions` form.
 * - A custom ai-sdk model object gets a key derived from the object's
 *   identity, so two different model objects never share a cached service
 *   and never collide with the default provider configuration.
 *
 * NOTE: `apiKey` is not part of the key; configs that differ only in API key
 * map to the same cache entry.
 */
function getConfigKey(config: EmbeddingConfig): string {
  const dimensions = config.dimensions || 'default';
  const model = config.model;

  if (model && typeof model !== 'string') {
    let id = customModelIds.get(model);
    if (id === undefined) {
      id = nextCustomModelId++;
      customModelIds.set(model, id);
    }
    return `custom:model#${id}:${dimensions}`;
  }

  const provider = config.provider || 'google';
  const modelName = typeof model === 'string'
    ? model
    : (config.modelName || 'default');
  return `${provider}:${modelName}:${dimensions}`;
}
721
+
722
/** Cache of shared services, keyed by the string produced by getConfigKey. */
const sharedInstances = new Map<string, EmbeddingService>();

/**
 * Return the shared EmbeddingService for a configuration, creating and
 * caching it on first request.
 *
 * Configurations that produce the same cache key receive the same instance,
 * which avoids constructing a new service per client.
 *
 * @example
 * ```typescript
 * // Instead of: new EmbeddingService({ apiKey, modelName })
 * const embedding = getSharedEmbeddingService({ apiKey, modelName });
 * ```
 */
export function getSharedEmbeddingService(config: EmbeddingConfig): EmbeddingService {
  const key = getConfigKey(config);

  const cached = sharedInstances.get(key);
  if (cached) {
    return cached;
  }

  console.log(`🔧 [Singleton] Creating shared EmbeddingService: ${key}`);
  const created = new EmbeddingService(config);
  sharedInstances.set(key, created);
  return created;
}
749
+
750
/**
 * Clear all shared instances (for testing).
 *
 * Only empties the cache map; services already handed out keep working, and
 * the next getSharedEmbeddingService call builds a fresh instance.
 */
export function clearSharedEmbeddingServices(): void {
  sharedInstances.clear();
}
756
+
757
/**
 * Report how many shared services exist, with each one's cache key and its
 * current getStats() snapshot.
 */
export function getSharedEmbeddingStats(): {
  instanceCount: number;
  instances: Array<{ key: string; stats: ReturnType<EmbeddingService['getStats']> }>;
} {
  const instances: Array<{ key: string; stats: ReturnType<EmbeddingService['getStats']> }> = [];

  for (const [key, service] of sharedInstances.entries()) {
    instances.push({ key, stats: service.getStats() });
  }

  return {
    instanceCount: sharedInstances.size,
    instances,
  };
}