ruvector 0.2.23 → 0.2.25

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (111) hide show
  1. package/bin/cli.js +211 -63
  2. package/dist/analysis/complexity.d.ts +52 -0
  3. package/dist/analysis/complexity.d.ts.map +1 -0
  4. package/dist/analysis/complexity.js +146 -0
  5. package/dist/analysis/index.d.ts +15 -0
  6. package/dist/analysis/index.d.ts.map +1 -0
  7. package/dist/analysis/index.js +38 -0
  8. package/dist/analysis/patterns.d.ts +71 -0
  9. package/dist/analysis/patterns.d.ts.map +1 -0
  10. package/dist/analysis/patterns.js +243 -0
  11. package/dist/analysis/security.d.ts +51 -0
  12. package/dist/analysis/security.d.ts.map +1 -0
  13. package/dist/analysis/security.js +139 -0
  14. package/dist/core/adaptive-embedder.d.ts +156 -0
  15. package/dist/core/adaptive-embedder.d.ts.map +1 -0
  16. package/dist/core/adaptive-embedder.js +838 -0
  17. package/dist/core/agentdb-fast.d.ts +149 -0
  18. package/dist/core/agentdb-fast.d.ts.map +1 -0
  19. package/dist/core/agentdb-fast.js +301 -0
  20. package/dist/core/ast-parser.d.ts +108 -0
  21. package/dist/core/ast-parser.d.ts.map +1 -0
  22. package/dist/core/ast-parser.js +602 -0
  23. package/dist/core/attention-fallbacks.d.ts +321 -0
  24. package/dist/core/attention-fallbacks.d.ts.map +1 -0
  25. package/dist/core/attention-fallbacks.js +552 -0
  26. package/dist/core/cluster-wrapper.d.ts +148 -0
  27. package/dist/core/cluster-wrapper.d.ts.map +1 -0
  28. package/dist/core/cluster-wrapper.js +271 -0
  29. package/dist/core/coverage-router.d.ts +88 -0
  30. package/dist/core/coverage-router.d.ts.map +1 -0
  31. package/dist/core/coverage-router.js +315 -0
  32. package/dist/core/diff-embeddings.d.ts +93 -0
  33. package/dist/core/diff-embeddings.d.ts.map +1 -0
  34. package/dist/core/diff-embeddings.js +334 -0
  35. package/dist/core/diskann-wrapper.d.ts +53 -0
  36. package/dist/core/diskann-wrapper.d.ts.map +1 -0
  37. package/dist/core/diskann-wrapper.js +105 -0
  38. package/dist/core/gnn-wrapper.d.ts +143 -0
  39. package/dist/core/gnn-wrapper.d.ts.map +1 -0
  40. package/dist/core/gnn-wrapper.js +213 -0
  41. package/dist/core/graph-algorithms.d.ts +83 -0
  42. package/dist/core/graph-algorithms.d.ts.map +1 -0
  43. package/dist/core/graph-algorithms.js +514 -0
  44. package/dist/core/graph-wrapper.d.ts +147 -0
  45. package/dist/core/graph-wrapper.d.ts.map +1 -0
  46. package/dist/core/graph-wrapper.js +299 -0
  47. package/dist/core/index.d.ts +50 -0
  48. package/dist/core/index.d.ts.map +1 -0
  49. package/dist/core/index.js +92 -0
  50. package/dist/core/intelligence-engine.d.ts +258 -0
  51. package/dist/core/intelligence-engine.d.ts.map +1 -0
  52. package/dist/core/intelligence-engine.js +1030 -0
  53. package/dist/core/learning-engine.d.ts +160 -0
  54. package/dist/core/learning-engine.d.ts.map +1 -0
  55. package/dist/core/learning-engine.js +589 -0
  56. package/dist/core/neural-embeddings.d.ts +393 -0
  57. package/dist/core/neural-embeddings.d.ts.map +1 -0
  58. package/dist/core/neural-embeddings.js +1091 -0
  59. package/dist/core/neural-perf.d.ts +331 -0
  60. package/dist/core/neural-perf.d.ts.map +1 -0
  61. package/dist/core/neural-perf.js +704 -0
  62. package/dist/core/onnx/pkg/package.json +3 -0
  63. package/dist/core/onnx-embedder.d.ts +105 -0
  64. package/dist/core/onnx-embedder.d.ts.map +1 -0
  65. package/dist/core/onnx-embedder.js +410 -0
  66. package/dist/core/onnx-optimized.d.ts +109 -0
  67. package/dist/core/onnx-optimized.d.ts.map +1 -0
  68. package/dist/core/onnx-optimized.js +419 -0
  69. package/dist/core/parallel-intelligence.d.ts +109 -0
  70. package/dist/core/parallel-intelligence.d.ts.map +1 -0
  71. package/dist/core/parallel-intelligence.js +340 -0
  72. package/dist/core/parallel-workers.d.ts +177 -0
  73. package/dist/core/parallel-workers.d.ts.map +1 -0
  74. package/dist/core/parallel-workers.js +783 -0
  75. package/dist/core/router-wrapper.d.ts +75 -0
  76. package/dist/core/router-wrapper.d.ts.map +1 -0
  77. package/dist/core/router-wrapper.js +243 -0
  78. package/dist/core/rvf-wrapper.d.ts +86 -0
  79. package/dist/core/rvf-wrapper.d.ts.map +1 -0
  80. package/dist/core/rvf-wrapper.js +102 -0
  81. package/dist/core/sona-wrapper.d.ts +226 -0
  82. package/dist/core/sona-wrapper.d.ts.map +1 -0
  83. package/dist/core/sona-wrapper.js +282 -0
  84. package/dist/core/tensor-compress.d.ts +134 -0
  85. package/dist/core/tensor-compress.d.ts.map +1 -0
  86. package/dist/core/tensor-compress.js +432 -0
  87. package/dist/index.d.ts +106 -0
  88. package/dist/index.d.ts.map +1 -0
  89. package/dist/index.js +258 -0
  90. package/dist/services/embedding-service.d.ts +136 -0
  91. package/dist/services/embedding-service.d.ts.map +1 -0
  92. package/dist/services/embedding-service.js +294 -0
  93. package/dist/services/index.d.ts +6 -0
  94. package/dist/services/index.d.ts.map +1 -0
  95. package/dist/services/index.js +26 -0
  96. package/dist/types.d.ts +145 -0
  97. package/dist/types.d.ts.map +1 -0
  98. package/dist/types.js +2 -0
  99. package/dist/workers/benchmark.d.ts +44 -0
  100. package/dist/workers/benchmark.d.ts.map +1 -0
  101. package/dist/workers/benchmark.js +230 -0
  102. package/dist/workers/index.d.ts +10 -0
  103. package/dist/workers/index.d.ts.map +1 -0
  104. package/dist/workers/index.js +25 -0
  105. package/dist/workers/native-worker.d.ts +76 -0
  106. package/dist/workers/native-worker.d.ts.map +1 -0
  107. package/dist/workers/native-worker.js +490 -0
  108. package/dist/workers/types.d.ts +69 -0
  109. package/dist/workers/types.d.ts.map +1 -0
  110. package/dist/workers/types.js +7 -0
  111. package/package.json +8 -7
package/dist/index.js ADDED
@@ -0,0 +1,258 @@
1
+ "use strict";
2
+ /**
3
+ * ruvector - High-performance vector database for Node.js
4
+ *
5
+ * This package automatically detects and uses the best available implementation:
6
+ * 1. Native (Rust-based, fastest) - if available for your platform
7
+ * 2. RVF (persistent store) - if @ruvector/rvf is installed
8
+ * 3. Stub (testing fallback) - limited functionality
9
+ *
10
+ * Also provides safe wrappers for GNN and Attention modules that handle
11
+ * array type conversions automatically.
12
+ */
13
+ var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
14
+ if (k2 === undefined) k2 = k;
15
+ var desc = Object.getOwnPropertyDescriptor(m, k);
16
+ if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
17
+ desc = { enumerable: true, get: function() { return m[k]; } };
18
+ }
19
+ Object.defineProperty(o, k2, desc);
20
+ }) : (function(o, m, k, k2) {
21
+ if (k2 === undefined) k2 = k;
22
+ o[k2] = m[k];
23
+ }));
24
+ var __exportStar = (this && this.__exportStar) || function(m, exports) {
25
+ for (var p in m) if (p !== "default" && !Object.prototype.hasOwnProperty.call(exports, p)) __createBinding(exports, m, p);
26
+ };
27
+ Object.defineProperty(exports, "__esModule", { value: true });
28
+ exports.NativeVectorDb = exports.VectorDB = exports.VectorDb = void 0;
29
+ exports.getImplementationType = getImplementationType;
30
+ exports.isNative = isNative;
31
+ exports.isRvf = isRvf;
32
+ exports.isWasm = isWasm;
33
+ exports.getVersion = getVersion;
34
+ __exportStar(require("./types"), exports);
35
+ // Export core wrappers (safe interfaces with automatic type conversion)
36
+ __exportStar(require("./core"), exports);
37
+ __exportStar(require("./services"), exports);
38
// Backend module chosen at load time, plus a tag naming which one it is
// ('native', 'rvf', or 'wasm' for the built-in stub fallback).
let implementation;
let implementationType = 'wasm';
// The RVF backend can be requested explicitly through RUVECTOR_BACKEND=rvf or
// through `--backend rvf` on the command line.
const backendFlagIndex = process.argv.indexOf('--backend');
const rvfRequested = process.env.RUVECTOR_BACKEND === 'rvf' ||
    (backendFlagIndex !== -1 && process.argv[backendFlagIndex + 1] === 'rvf');
if (rvfRequested) {
    // Explicit rvf backend requested - fail hard if it cannot be loaded.
    try {
        implementation = require('@ruvector/rvf');
        implementationType = 'rvf';
    }
    catch (e) {
        // Only claim "not installed" when resolution itself failed; any other
        // failure is reported with its own message so it is not misdiagnosed.
        const notFound = e != null && e.code === 'MODULE_NOT_FOUND';
        const headline = notFound
            ? '@ruvector/rvf is not installed.\n'
            : `@ruvector/rvf could not be loaded: ${e instanceof Error ? e.message : String(e)}\n`;
        const loadError = new Error(headline +
            ' Run: npm install @ruvector/rvf\n' +
            ' The --backend rvf flag requires this package.');
        // Keep the underlying failure reachable for callers and debuggers.
        loadError.cause = e;
        throw loadError;
    }
}
else {
    try {
        // Try to load native module first
        implementation = require('@ruvector/core');
        implementationType = 'native';
        // Verify it's actually working (native module exports VectorDb, not VectorDB)
        if (typeof implementation.VectorDb !== 'function') {
            throw new Error('Native module loaded but VectorDb class not found');
        }
    }
    catch (e) {
        // Try rvf (persistent store) as second fallback
        try {
            implementation = require('@ruvector/rvf');
            implementationType = 'rvf';
        }
        catch (rvfErr) {
            // Graceful fallback - don't crash, just warn
            console.warn('[RuVector] Native module not available:', e.message);
            console.warn('[RuVector] RVF module not available:', rvfErr.message);
            console.warn('[RuVector] Vector operations will be limited. Install @ruvector/core or @ruvector/rvf for full functionality.');
            // A sequence number keeps stub ids distinct even when several are
            // generated within the same millisecond (e.g. one insertBatch call).
            let stubIdSequence = 0;
            const nextStubId = () => `stub-id-${Date.now()}-${stubIdSequence++}`;
            // Stub implementation: accepts every call but stores nothing.
            implementation = {
                VectorDb: class StubVectorDb {
                    constructor() {
                        console.warn('[RuVector] Using stub VectorDb - install @ruvector/core for native performance');
                    }
                    async insert() { return nextStubId(); }
                    async insertBatch(entries) { return entries.map(() => nextStubId()); }
                    async search() { return []; }
                    async delete() { return true; }
                    async get() { return null; }
                    async len() { return 0; }
                    async isEmpty() { return true; }
                }
            };
            implementationType = 'wasm'; // Mark as fallback mode
        }
    }
}
95
/**
 * Report which backend this module selected when it was loaded.
 *
 * @returns {string} The current `implementationType` tag.
 */
function getImplementationType() {
    return implementationType;
}
/**
 * @returns {boolean} `true` when the backend tag is `'native'`.
 */
function isNative() {
    return getImplementationType() === 'native';
}
/**
 * @returns {boolean} `true` when the backend tag is `'rvf'`.
 */
function isRvf() {
    return getImplementationType() === 'rvf';
}
/**
 * @returns {boolean} `true` when the backend tag is `'wasm'`, the tag used
 *   for the stub/fallback implementation.
 */
function isWasm() {
    return getImplementationType() === 'wasm';
}
/**
 * Describe the running package.
 *
 * @returns {{version: string, implementation: string}} The `version` field
 *   read from `../package.json` together with the active backend tag.
 */
function getVersion() {
    const { version } = require('../package.json');
    return {
        version,
        implementation: getImplementationType(),
    };
}
129
// Separator-free, lower-case spellings mapped to the PascalCase names of the
// native `JsDistanceMetric` enum: { Euclidean, Cosine, DotProduct, Manhattan }.
const METRIC_ALIASES = new Map([
    ['cosine', 'Cosine'],
    ['euclidean', 'Euclidean'],
    ['l2', 'Euclidean'],
    ['dot', 'DotProduct'],
    ['dotproduct', 'DotProduct'],
    ['innerproduct', 'DotProduct'],
    ['manhattan', 'Manhattan'],
    ['l1', 'Manhattan'],
]);
/**
 * Normalize a user-friendly distance metric string (`"cosine"`, `"euclidean"`,
 * etc.) to the PascalCase variant the native `JsDistanceMetric` enum accepts.
 *
 * Matching ignores letter case and any `_`, `-` or whitespace characters, so
 * `"dot_product"`, `"Dot Product"` and `"DOTPRODUCT"` all yield `"DotProduct"`.
 *
 * @param {*} metric - Requested metric. Falsy values and values that are not
 *   strings are returned untouched instead of being string-processed.
 * @returns {*} The canonical metric name, or `metric` itself when it is not
 *   recognised (validation is then left to whatever consumes the value).
 */
function normalizeMetric(metric) {
    // Guard on the type, not just truthiness: a number or object has no
    // toLowerCase() and used to raise a TypeError here.
    if (typeof metric !== 'string' || metric === '') {
        return metric;
    }
    const key = metric.toLowerCase().replace(/[_\s-]/g, '');
    return METRIC_ALIASES.get(key) ?? metric;
}
155
/**
 * Return `values` unchanged when it already is a Float32Array, otherwise copy
 * it into a new Float32Array.
 */
function asFloat32Array(values) {
    if (values instanceof Float32Array) {
        return values;
    }
    return new Float32Array(values);
}
/**
 * Facade over the selected backend's `VectorDb` class.
 *
 * On the way in, vectors are converted to Float32Array and metadata / filter
 * objects are serialised with JSON.stringify. On the way out, metadata strings
 * are parsed back with JSON.parse.
 */
class VectorDBWrapper {
    /**
     * @param options - Reads `dimensions`, `storagePath`, `hnswConfig` and the
     *   metric, given either as `distanceMetric` or, when that is nullish, as
     *   `metric`. The metric is run through `normalizeMetric` and forwarded
     *   only when the result is not `undefined`.
     */
    constructor(options) {
        const requestedMetric = options.distanceMetric ?? options.metric;
        const canonicalMetric = normalizeMetric(requestedMetric);
        const backendOptions = {
            dimensions: options.dimensions,
            storagePath: options.storagePath,
            hnswConfig: options.hnswConfig,
        };
        if (canonicalMetric !== undefined) {
            backendOptions.distanceMetric = canonicalMetric;
        }
        this.db = new implementation.VectorDb(backendOptions);
    }
    /**
     * Insert one entry. A truthy `metadata` value is sent as a JSON string;
     * otherwise the `metadata` key is left off the payload entirely.
     */
    async insert(entry) {
        const payload = {
            id: entry.id,
            vector: asFloat32Array(entry.vector),
        };
        if (entry.metadata) {
            payload.metadata = JSON.stringify(entry.metadata);
        }
        return this.db.insert(payload);
    }
    /**
     * Insert several entries with one backend call. Each payload always has a
     * `metadata` key: a JSON string, or `undefined` when the entry has none.
     */
    async insertBatch(entries) {
        const payloads = entries.map((entry) => {
            const serialised = entry.metadata ? JSON.stringify(entry.metadata) : undefined;
            return {
                id: entry.id,
                vector: asFloat32Array(entry.vector),
                metadata: serialised,
            };
        });
        return this.db.insertBatch(payloads);
    }
    /**
     * Run a similarity search. `query.filter`, when truthy, is sent as a JSON
     * string. Each result is returned as `{ id, score, vector, metadata }`
     * with metadata parsed from JSON (or `undefined` when absent).
     */
    async search(query) {
        const backendQuery = {
            vector: asFloat32Array(query.vector),
            k: query.k,
            efSearch: query.efSearch,
        };
        if (query.filter) {
            backendQuery.filter = JSON.stringify(query.filter);
        }
        const hits = await this.db.search(backendQuery);
        return hits.map((hit) => {
            const parsed = hit.metadata ? JSON.parse(hit.metadata) : undefined;
            return {
                id: hit.id,
                score: hit.score,
                vector: hit.vector,
                metadata: parsed,
            };
        });
    }
    /**
     * Fetch one entry by id. Resolves to `null` when the backend returns a
     * falsy value, otherwise to `{ id, vector, metadata }` with metadata
     * parsed from JSON.
     */
    async get(id) {
        const found = await this.db.get(id);
        if (!found) {
            return null;
        }
        const parsed = found.metadata ? JSON.parse(found.metadata) : undefined;
        return {
            id: found.id,
            vector: found.vector,
            metadata: parsed,
        };
    }
    /**
     * Delete the entry with the given id; forwards the backend's result.
     */
    async delete(id) {
        return this.db.delete(id);
    }
    /**
     * Number of entries, as reported by the backend.
     */
    async len() {
        return this.db.len();
    }
    /**
     * Whether the backend reports the database as empty.
     */
    async isEmpty() {
        return this.db.isEmpty();
    }
}
252
+ // Export the wrapper class (aliased as VectorDB for backwards compatibility)
253
+ exports.VectorDb = VectorDBWrapper;
254
+ exports.VectorDB = VectorDBWrapper;
255
+ // Also export the raw native implementation for advanced users
256
+ exports.NativeVectorDb = implementation.VectorDb;
257
+ // Export everything from the implementation
258
+ exports.default = implementation;
@@ -0,0 +1,136 @@
1
+ /**
2
+ * Embedding Service - Unified embedding generation and management
3
+ *
4
+ * This service provides a unified interface for generating, caching, and
5
+ * managing embeddings from various sources (local models, APIs, etc.)
6
+ */
7
+ /**
8
+ * Embedding provider interface
9
+ */
10
+ export interface EmbeddingProvider {
11
+ /** Provider name */
12
+ name: string;
13
+ /** Generate embeddings for texts */
14
+ embed(texts: string[]): Promise<number[][]>;
15
+ /** Get embedding dimensions */
16
+ getDimensions(): number;
17
+ }
18
+ /**
19
+ * Embedding service configuration
20
+ */
21
+ export interface EmbeddingServiceConfig {
22
+ /** Default provider to use */
23
+ defaultProvider?: string;
24
+ /** Maximum cache size */
25
+ maxCacheSize?: number;
26
+ /** Cache TTL in milliseconds */
27
+ cacheTtl?: number;
28
+ /** Batch size for embedding generation */
29
+ batchSize?: number;
30
+ }
31
+ /**
32
+ * Mock embedding provider for testing
33
+ */
34
+ export declare class MockEmbeddingProvider implements EmbeddingProvider {
35
+ name: string;
36
+ private dimensions;
37
+ constructor(dimensions?: number);
38
+ embed(texts: string[]): Promise<number[][]>;
39
+ getDimensions(): number;
40
+ }
41
+ /**
42
+ * Simple local embedding using character n-grams
43
+ * This is a fallback when no external provider is available
44
+ */
45
+ export declare class LocalNGramProvider implements EmbeddingProvider {
46
+ name: string;
47
+ private dimensions;
48
+ private ngramSize;
49
+ constructor(dimensions?: number, ngramSize?: number);
50
+ embed(texts: string[]): Promise<number[][]>;
51
+ private embedSingle;
52
+ private hashNgram;
53
+ getDimensions(): number;
54
+ }
55
+ /**
56
+ * Embedding service with caching and batching
57
+ */
58
+ export declare class EmbeddingService {
59
+ private providers;
60
+ private cache;
61
+ private config;
62
+ constructor(config?: EmbeddingServiceConfig);
63
+ /**
64
+ * Register an embedding provider
65
+ */
66
+ registerProvider(provider: EmbeddingProvider): void;
67
+ /**
68
+ * Get a registered provider
69
+ */
70
+ getProvider(name?: string): EmbeddingProvider;
71
+ /**
72
+ * Generate embeddings for texts with caching
73
+ *
74
+ * @param texts - Texts to embed
75
+ * @param provider - Provider name (uses default if not specified)
76
+ * @returns Array of embeddings
77
+ */
78
+ embed(texts: string[], provider?: string): Promise<number[][]>;
79
+ /**
80
+ * Generate a single embedding
81
+ */
82
+ embedOne(text: string, provider?: string): Promise<number[]>;
83
+ /**
84
+ * Add entry to cache with LRU eviction
85
+ */
86
+ private addToCache;
87
+ /**
88
+ * Compute cosine similarity between two embeddings
89
+ */
90
+ cosineSimilarity(a: number[], b: number[]): number;
91
+ /**
92
+ * Find most similar texts from a corpus
93
+ */
94
+ findSimilar(query: string, corpus: string[], k?: number, provider?: string): Promise<{
95
+ text: string;
96
+ similarity: number;
97
+ index: number;
98
+ }[]>;
99
+ /**
100
+ * Get cache statistics
101
+ */
102
+ getCacheStats(): {
103
+ size: number;
104
+ maxSize: number;
105
+ hitRate: number;
106
+ };
107
+ /**
108
+ * Clear the cache
109
+ */
110
+ clearCache(): void;
111
+ /**
112
+ * Get embedding dimensions for a provider
113
+ */
114
+ getDimensions(provider?: string): number;
115
+ /**
116
+ * List available providers
117
+ */
118
+ listProviders(): string[];
119
+ }
120
+ /**
121
+ * Create an embedding service instance
122
+ */
123
+ export declare function createEmbeddingService(config?: EmbeddingServiceConfig): EmbeddingService;
124
+ /**
125
+ * Get the default embedding service instance
126
+ */
127
+ export declare function getDefaultEmbeddingService(): EmbeddingService;
128
+ declare const _default: {
129
+ EmbeddingService: typeof EmbeddingService;
130
+ LocalNGramProvider: typeof LocalNGramProvider;
131
+ MockEmbeddingProvider: typeof MockEmbeddingProvider;
132
+ createEmbeddingService: typeof createEmbeddingService;
133
+ getDefaultEmbeddingService: typeof getDefaultEmbeddingService;
134
+ };
135
+ export default _default;
136
+ //# sourceMappingURL=embedding-service.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"embedding-service.d.ts","sourceRoot":"","sources":["../../src/services/embedding-service.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AAEH;;GAEG;AACH,MAAM,WAAW,iBAAiB;IAChC,oBAAoB;IACpB,IAAI,EAAE,MAAM,CAAC;IACb,oCAAoC;IACpC,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;IAC5C,+BAA+B;IAC/B,aAAa,IAAI,MAAM,CAAC;CACzB;AAWD;;GAEG;AACH,MAAM,WAAW,sBAAsB;IACrC,8BAA8B;IAC9B,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,yBAAyB;IACzB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,gCAAgC;IAChC,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,0CAA0C;IAC1C,SAAS,CAAC,EAAE,MAAM,CAAC;CACpB;AAeD;;GAEG;AACH,qBAAa,qBAAsB,YAAW,iBAAiB;IAC7D,IAAI,SAAU;IACd,OAAO,CAAC,UAAU,CAAS;gBAEf,UAAU,GAAE,MAAY;IAI9B,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;IAoBjD,aAAa,IAAI,MAAM;CAGxB;AAED;;;GAGG;AACH,qBAAa,kBAAmB,YAAW,iBAAiB;IAC1D,IAAI,SAAiB;IACrB,OAAO,CAAC,UAAU,CAAS;IAC3B,OAAO,CAAC,SAAS,CAAS;gBAEd,UAAU,GAAE,MAAY,EAAE,SAAS,GAAE,MAAU;IAKrD,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;IAIjD,OAAO,CAAC,WAAW;IAiBnB,OAAO,CAAC,SAAS;IAQjB,aAAa,IAAI,MAAM;CAGxB;AAED;;GAEG;AACH,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,SAAS,CAA6C;IAC9D,OAAO,CAAC,KAAK,CAAsC;IACnD,OAAO,CAAC,MAAM,CAAmC;gBAErC,MAAM,GAAE,sBAA2B;IAa/C;;OAEG;IACH,gBAAgB,CAAC,QAAQ,EAAE,iBAAiB,GAAG,IAAI;IAInD;;OAEG;IACH,WAAW,CAAC,IAAI,CAAC,EAAE,MAAM,GAAG,iBAAiB;IAS7C;;;;;;OAMG;IACG,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,EAAE,QAAQ,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC;IAkDpE;;OAEG;IACG,QAAQ,CAAC,IAAI,EAAE,MAAM,EAAE,QAAQ,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC;IAKlE;;OAEG;IACH,OAAO,CAAC,UAAU;IAwBlB;;OAEG;IACH,gBAAgB,CAAC,CAAC,EAAE,MAAM,EAAE,EAAE,CAAC,EAAE,MAAM,EAAE,GAAG,MAAM;IAmBlD;;OAEG;IACG,WAAW,CACf,KAAK,EAAE,MAAM,EACb,MAAM,EAAE,MAAM,EAAE,EAChB,CAAC,GAAE,MAAU,EACb,QAAQ,CAAC,EAAE,MAAM,GAChB,OAAO,CAAC;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,UAAU,EAAE,MAAM,CAAC;QAAC,KAAK,EAAE,MAAM,CAAA;KAAE,EAAE,CAAC;IAcjE;;OAEG;IACH,aAAa,IAAI;QACf,IAAI,EAAE,MAAM,CAAC;QACb,OAAO,EAAE,MAAM,CAAC;QAChB,OAAO,EAAE,MAAM,CAAC;KACjB;IAaD;;OAEG;IACH,UAAU,IAAI,I
AAI;IAIlB;;OAEG;IACH,aAAa,CAAC,QAAQ,CAAC,EAAE,MAAM,GAAG,MAAM;IAIxC;;OAEG;IACH,aAAa,IAAI,MAAM,EAAE;CAG1B;AAED;;GAEG;AACH,wBAAgB,sBAAsB,CACpC,MAAM,CAAC,EAAE,sBAAsB,GAC9B,gBAAgB,CAElB;AAKD;;GAEG;AACH,wBAAgB,0BAA0B,IAAI,gBAAgB,CAK7D;;;;;;;;AAED,wBAME"}
@@ -0,0 +1,294 @@
1
+ "use strict";
2
+ /**
3
+ * Embedding Service - Unified embedding generation and management
4
+ *
5
+ * This service provides a unified interface for generating, caching, and
6
+ * managing embeddings from various sources (local models, APIs, etc.)
7
+ */
8
+ Object.defineProperty(exports, "__esModule", { value: true });
9
+ exports.EmbeddingService = exports.LocalNGramProvider = exports.MockEmbeddingProvider = void 0;
10
+ exports.createEmbeddingService = createEmbeddingService;
11
+ exports.getDefaultEmbeddingService = getDefaultEmbeddingService;
12
/**
 * Derive a short cache-key fragment from a string.
 *
 * Folds the UTF-16 code units of `text` into a signed 32-bit value
 * (`h = h * 31 + unit`, wrapped to 32 bits) and renders it in base 36 behind
 * an `h` prefix. The value is only 32 bits wide, so different strings can
 * produce the same result.
 *
 * @param {string} text - String to hash.
 * @returns {string} `h` followed by the base-36 hash (negative values carry a `-`).
 */
function hashText(text) {
    let acc = 0;
    for (let pos = 0; pos < text.length; pos += 1) {
        // Math.imul performs the 32-bit multiply; `| 0` wraps the sum again.
        acc = (Math.imul(acc, 31) + text.charCodeAt(pos)) | 0;
    }
    return 'h' + acc.toString(36);
}
24
/**
 * Test double for an embedding provider.
 *
 * Produces vectors that depend only on the input text and the configured
 * dimension count, so repeated calls with the same text give the same vector.
 */
class MockEmbeddingProvider {
    /**
     * @param {number} [dimensions=384] - Length of every generated vector.
     */
    constructor(dimensions = 384) {
        this.name = 'mock';
        this.dimensions = dimensions;
    }
    /**
     * @param {string[]} texts - Texts to embed.
     * @returns {Promise<number[][]>} One vector per text, scaled to unit
     *   length (left unscaled when its norm is 0).
     */
    async embed(texts) {
        const width = this.dimensions;
        const generate = (text) => {
            // Fold the text's UTF-16 code units into a 32-bit seed.
            let state = 0;
            for (let pos = 0; pos < text.length; pos += 1) {
                state = ((state << 5) - state + text.charCodeAt(pos)) | 0;
            }
            // Step a linear congruential generator once per component.
            const raw = [];
            while (raw.length < width) {
                state = (state * 1103515245 + 12345) | 0;
                raw.push((state % 1000) / 1000 - 0.5);
            }
            let sumOfSquares = 0;
            for (const component of raw) {
                sumOfSquares += component * component;
            }
            const scale = Math.sqrt(sumOfSquares) || 1;
            return raw.map((component) => component / scale);
        };
        return texts.map((text) => generate(text));
    }
    /**
     * @returns {number} The configured vector length.
     */
    getDimensions() {
        return this.dimensions;
    }
}
53
+ exports.MockEmbeddingProvider = MockEmbeddingProvider;
54
/**
 * Dependency-free embedding provider based on hashed character n-grams.
 *
 * Text is lower-cased and every character outside `a-z0-9` becomes a space.
 * Each window of `ngramSize` characters is then hashed to a vector slot,
 * which is incremented or decremented according to the sign of the hash.
 */
class LocalNGramProvider {
    /**
     * @param {number} [dimensions=256] - Length of every generated vector.
     * @param {number} [ngramSize=3] - Number of characters per n-gram.
     */
    constructor(dimensions = 256, ngramSize = 3) {
        this.name = 'local-ngram';
        this.dimensions = dimensions;
        this.ngramSize = ngramSize;
    }
    /**
     * @param {string[]} texts - Texts to embed.
     * @returns {Promise<number[][]>} One vector per text.
     */
    async embed(texts) {
        return texts.map((text) => this.embedSingle(text));
    }
    /**
     * Embed one text. Texts shorter than `ngramSize` contain no n-gram and
     * yield an all-zero vector.
     *
     * @param {string} text
     * @returns {number[]} Vector scaled to unit length (unscaled when its norm is 0).
     */
    embedSingle(text) {
        const { dimensions, ngramSize } = this;
        const buckets = new Array(dimensions).fill(0);
        const cleaned = text.toLowerCase().replace(/[^a-z0-9]/g, ' ');
        const lastStart = cleaned.length - ngramSize;
        for (let start = 0; start <= lastStart; start += 1) {
            const code = this.hashNgram(cleaned.slice(start, start + ngramSize));
            const slot = Math.abs(code) % dimensions;
            // A hash of exactly 0 counts as negative.
            buckets[slot] += code > 0 ? 1 : -1;
        }
        let sumOfSquares = 0;
        for (const value of buckets) {
            sumOfSquares += value * value;
        }
        const scale = Math.sqrt(sumOfSquares) || 1;
        return buckets.map((value) => value / scale);
    }
    /**
     * Hash a string to a signed 32-bit integer (`h = h * 31 + unit`, wrapped
     * to 32 bits after every UTF-16 code unit).
     *
     * @param {string} ngram
     * @returns {number}
     */
    hashNgram(ngram) {
        let acc = 0;
        for (let pos = 0; pos < ngram.length; pos += 1) {
            acc = ((acc << 5) - acc + ngram.charCodeAt(pos)) | 0;
        }
        return acc;
    }
    /**
     * @returns {number} The configured vector length.
     */
    getDimensions() {
        return this.dimensions;
    }
}
92
+ exports.LocalNGramProvider = LocalNGramProvider;
93
/**
 * Embedding service with caching and batching.
 *
 * Holds a registry of named providers and an in-memory cache of embeddings
 * keyed by provider name plus a hash of the text. Because the hash can
 * collide, each cache entry also records the text it was computed for and is
 * only served for that exact text.
 */
class EmbeddingService {
    /**
     * @param config - Optional settings: `defaultProvider` (default
     *   `'local-ngram'`), `maxCacheSize` (default 10000; 0 or less disables
     *   caching), `cacheTtl` in milliseconds (default one hour) and
     *   `batchSize` (default 32; values below 1 are treated as 1).
     */
    constructor(config = {}) {
        this.providers = new Map();
        this.cache = new Map();
        // Lookup counters behind getCacheStats().hitRate.
        this.cacheHits = 0;
        this.cacheMisses = 0;
        this.config = {
            defaultProvider: config.defaultProvider ?? 'local-ngram',
            maxCacheSize: config.maxCacheSize ?? 10000,
            cacheTtl: config.cacheTtl ?? 3600000, // 1 hour
            batchSize: config.batchSize ?? 32,
        };
        // Register default providers
        this.registerProvider(new LocalNGramProvider());
        this.registerProvider(new MockEmbeddingProvider());
    }
    /**
     * Register an embedding provider under `provider.name`, replacing any
     * provider previously registered with the same name.
     */
    registerProvider(provider) {
        this.providers.set(provider.name, provider);
    }
    /**
     * Get a registered provider.
     *
     * @param name - Provider name; the configured default is used when nullish.
     * @throws {Error} When no provider is registered under that name.
     */
    getProvider(name) {
        const providerName = name ?? this.config.defaultProvider;
        const provider = this.providers.get(providerName);
        if (!provider) {
            throw new Error(`Provider not found: ${providerName}`);
        }
        return provider;
    }
    /**
     * Generate embeddings for texts with caching
     *
     * @param texts - Texts to embed
     * @param provider - Provider name (uses default if not specified)
     * @returns Array of embeddings, in the same order as `texts`
     * @throws {Error} When the provider is unknown, or when it returns a
     *   different number of embeddings than the texts it was given.
     */
    async embed(texts, provider) {
        const providerInstance = this.getProvider(provider);
        const providerName = providerInstance.name;
        const now = Date.now();
        const results = new Array(texts.length).fill(null);
        // Texts that still need the provider: { index, text, cacheKey }.
        const pending = [];
        for (let i = 0; i < texts.length; i++) {
            const text = texts[i];
            const cacheKey = `${providerName}:${hashText(text)}`;
            const cached = this.cache.get(cacheKey);
            // The key only carries a hash, so confirm the entry really belongs
            // to this text. Entries stored without a text are accepted as-is.
            const usable = cached !== undefined &&
                (cached.text === undefined || cached.text === text) &&
                now - cached.timestamp < this.config.cacheTtl;
            if (usable) {
                results[i] = cached.embedding;
                cached.hits++;
                this.cacheHits++;
            }
            else {
                pending.push({ index: i, text, cacheKey });
                this.cacheMisses++;
            }
        }
        // A step below 1 would never advance the batching loop.
        const batchSize = Math.max(1, Math.floor(this.config.batchSize) || 1);
        for (let start = 0; start < pending.length; start += batchSize) {
            const batch = pending.slice(start, start + batchSize);
            const embeddings = await providerInstance.embed(batch.map((item) => item.text));
            if (!Array.isArray(embeddings) || embeddings.length !== batch.length) {
                const got = Array.isArray(embeddings) ? embeddings.length : 0;
                throw new Error(`Provider ${providerName} returned ${got} embeddings for ${batch.length} texts`);
            }
            batch.forEach((item, j) => {
                results[item.index] = embeddings[j];
                this.addToCache(item.cacheKey, embeddings[j], now, item.text);
            });
        }
        return results;
    }
    /**
     * Generate a single embedding
     */
    async embedOne(text, provider) {
        const results = await this.embed([text], provider);
        return results[0];
    }
    /**
     * Store an entry in the cache.
     *
     * When the cache is at capacity and `key` is new, the entry with the
     * fewest hits is evicted first; among entries with equally few hits the
     * one with the oldest timestamp goes. Overwriting an existing key does
     * not evict anything.
     *
     * @param key - Cache key.
     * @param embedding - Vector to store.
     * @param timestamp - Creation time in milliseconds, used for TTL checks.
     * @param text - Text the embedding was computed for (optional).
     */
    addToCache(key, embedding, timestamp, text) {
        const capacity = this.config.maxCacheSize;
        if (capacity <= 0) {
            return; // caching disabled
        }
        if (!this.cache.has(key) && this.cache.size >= capacity) {
            let victimKey;
            let victimTime = Infinity;
            let victimHits = Infinity;
            for (const [k, v] of this.cache.entries()) {
                if (v.hits < victimHits || (v.hits === victimHits && v.timestamp < victimTime)) {
                    victimKey = k;
                    victimTime = v.timestamp;
                    victimHits = v.hits;
                }
            }
            if (victimKey !== undefined) {
                this.cache.delete(victimKey);
            }
        }
        this.cache.set(key, { embedding, timestamp, hits: 0, text });
    }
    /**
     * Compute cosine similarity between two embeddings
     *
     * @returns Similarity value, or 0 when either vector has zero norm.
     * @throws {Error} When the vectors differ in length.
     */
    cosineSimilarity(a, b) {
        if (a.length !== b.length) {
            throw new Error('Embeddings must have same dimensions');
        }
        let dotProduct = 0;
        let normA = 0;
        let normB = 0;
        for (let i = 0; i < a.length; i++) {
            dotProduct += a[i] * b[i];
            normA += a[i] * a[i];
            normB += b[i] * b[i];
        }
        const denom = Math.sqrt(normA) * Math.sqrt(normB);
        return denom === 0 ? 0 : dotProduct / denom;
    }
    /**
     * Find most similar texts from a corpus
     *
     * @param query - Text to compare against.
     * @param corpus - Candidate texts.
     * @param k - Maximum number of results (default 5).
     * @param provider - Provider name (uses default if not specified)
     * @returns Up to `k` items `{ text, similarity, index }`, most similar
     *   first; `index` is the position within `corpus`.
     */
    async findSimilar(query, corpus, k = 5, provider) {
        // Embed the query and the corpus in a single call.
        const [queryEmbed, ...corpusEmbeds] = await this.embed([query, ...corpus], provider);
        const results = corpusEmbeds.map((embed, i) => ({
            text: corpus[i],
            similarity: this.cosineSimilarity(queryEmbed, embed),
            index: i,
        }));
        return results
            .sort((a, b) => b.similarity - a.similarity)
            .slice(0, k);
    }
    /**
     * Get cache statistics
     *
     * @returns `size` (entries held), `maxSize` (configured capacity) and
     *   `hitRate`: the fraction of cache lookups made by `embed` that were
     *   served from the cache since construction or the last `clearCache()`
     *   (0 when there have been no lookups).
     */
    getCacheStats() {
        const lookups = this.cacheHits + this.cacheMisses;
        return {
            size: this.cache.size,
            maxSize: this.config.maxCacheSize,
            hitRate: lookups > 0 ? this.cacheHits / lookups : 0,
        };
    }
    /**
     * Clear the cache and reset the hit/miss counters.
     */
    clearCache() {
        this.cache.clear();
        this.cacheHits = 0;
        this.cacheMisses = 0;
    }
    /**
     * Get embedding dimensions for a provider
     */
    getDimensions(provider) {
        return this.getProvider(provider).getDimensions();
    }
    /**
     * List the names of all registered providers
     */
    listProviders() {
        return Array.from(this.providers.keys());
    }
}
270
+ exports.EmbeddingService = EmbeddingService;
271
/**
 * Build a new, independent `EmbeddingService`.
 *
 * @param config - Optional settings, passed to the constructor unchanged.
 * @returns The newly constructed service.
 */
function createEmbeddingService(config) {
    const service = new EmbeddingService(config);
    return service;
}
277
// Shared instance, created on first request.
let defaultService = null;
/**
 * Return the shared `EmbeddingService`.
 *
 * The instance is constructed with no configuration on the first call and
 * the same object is returned on every later call.
 *
 * @returns The shared service instance.
 */
function getDefaultEmbeddingService() {
    if (defaultService) {
        return defaultService;
    }
    defaultService = new EmbeddingService();
    return defaultService;
}
288
+ exports.default = {
289
+ EmbeddingService,
290
+ LocalNGramProvider,
291
+ MockEmbeddingProvider,
292
+ createEmbeddingService,
293
+ getDefaultEmbeddingService,
294
+ };
@@ -0,0 +1,6 @@
1
+ /**
2
+ * Services module exports
3
+ */
4
+ export * from './embedding-service';
5
+ export { default as embeddingService } from './embedding-service';
6
+ //# sourceMappingURL=index.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/services/index.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,cAAc,qBAAqB,CAAC;AACpC,OAAO,EAAE,OAAO,IAAI,gBAAgB,EAAE,MAAM,qBAAqB,CAAC"}