@lov3kaizen/agentsea-embeddings 1.0.1 → 1.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/caching/index.js +7 -1
- package/dist/caching/index.mjs +1 -1
- package/dist/chunk-2TCNSTX3.mjs +12 -0
- package/dist/{chunk-NBHIRTJT.mjs → chunk-5GTQFVEI.mjs} +41 -1
- package/dist/chunk-JHWMXQ56.mjs +1650 -0
- package/dist/{chunk-VPSMDBHH.mjs → chunk-MNJPAUDC.mjs} +7 -1
- package/dist/{chunk-DJAURHAS.mjs → chunk-U6EYWYUD.mjs} +31 -1
- package/dist/chunking/index.js +33 -4
- package/dist/chunking/index.mjs +1 -1
- package/dist/{index-DmEEUzJg.d.mts → index-DGzfvyHY.d.mts} +3 -0
- package/dist/{index-G-KgyvZT.d.ts → index-_uJcyK8e.d.ts} +3 -0
- package/dist/index.d.mts +2 -2
- package/dist/index.d.ts +2 -2
- package/dist/index.js +848 -16
- package/dist/index.mjs +22 -22
- package/dist/providers/index.d.mts +1 -1
- package/dist/providers/index.d.ts +1 -1
- package/dist/providers/index.js +47 -1
- package/dist/providers/index.mjs +2 -1
- package/dist/stores/index.d.mts +255 -1
- package/dist/stores/index.d.ts +255 -1
- package/dist/stores/index.js +794 -7
- package/dist/stores/index.mjs +20 -3
- package/package.json +9 -6
- package/dist/chunk-TER262ST.mjs +0 -877
|
@@ -572,7 +572,13 @@ var SQLiteCache = class extends BaseCache {
|
|
|
572
572
|
`);
|
|
573
573
|
updateStmt.run(Date.now(), key);
|
|
574
574
|
const vectorBuffer = row.vector;
|
|
575
|
-
const vector = Array.from(
|
|
575
|
+
const vector = Array.from(
|
|
576
|
+
new Float32Array(
|
|
577
|
+
vectorBuffer.buffer,
|
|
578
|
+
vectorBuffer.byteOffset,
|
|
579
|
+
vectorBuffer.byteLength / Float32Array.BYTES_PER_ELEMENT
|
|
580
|
+
)
|
|
581
|
+
);
|
|
576
582
|
return {
|
|
577
583
|
key: row.key,
|
|
578
584
|
vector,
|
|
@@ -2,8 +2,37 @@ import {
|
|
|
2
2
|
EmbeddingModel
|
|
3
3
|
} from "./chunk-QAITLJ2E.mjs";
|
|
4
4
|
|
|
5
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/index.js
|
|
6
|
+
import { webcrypto as crypto } from "crypto";
|
|
7
|
+
|
|
8
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/url-alphabet/index.js
|
|
9
|
+
var urlAlphabet = "useandom-26T198340PX75pxJACKVERYMINDBUSHWOLF_GQZbfghjklqvwyzrict";
|
|
10
|
+
|
|
11
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/index.js
|
|
12
|
+
var POOL_SIZE_MULTIPLIER = 128;
|
|
13
|
+
var pool;
|
|
14
|
+
var poolOffset;
|
|
15
|
+
function fillPool(bytes) {
|
|
16
|
+
if (!pool || pool.length < bytes) {
|
|
17
|
+
pool = Buffer.allocUnsafe(bytes * POOL_SIZE_MULTIPLIER);
|
|
18
|
+
crypto.getRandomValues(pool);
|
|
19
|
+
poolOffset = 0;
|
|
20
|
+
} else if (poolOffset + bytes > pool.length) {
|
|
21
|
+
crypto.getRandomValues(pool);
|
|
22
|
+
poolOffset = 0;
|
|
23
|
+
}
|
|
24
|
+
poolOffset += bytes;
|
|
25
|
+
}
|
|
26
|
+
function nanoid(size = 21) {
|
|
27
|
+
fillPool(size |= 0);
|
|
28
|
+
let id = "";
|
|
29
|
+
for (let i = poolOffset - size; i < poolOffset; i++) {
|
|
30
|
+
id += urlAlphabet[pool[i] & 63];
|
|
31
|
+
}
|
|
32
|
+
return id;
|
|
33
|
+
}
|
|
34
|
+
|
|
5
35
|
// src/chunking/BaseChunker.ts
|
|
6
|
-
import { nanoid } from "nanoid";
|
|
7
36
|
var defaultTokenCounter = (text) => {
|
|
8
37
|
return Math.ceil(text.length / 4);
|
|
9
38
|
};
|
|
@@ -1098,6 +1127,7 @@ async function chunk(text, strategy = "recursive", options) {
|
|
|
1098
1127
|
}
|
|
1099
1128
|
|
|
1100
1129
|
export {
|
|
1130
|
+
nanoid,
|
|
1101
1131
|
defaultTokenCounter,
|
|
1102
1132
|
BaseChunker,
|
|
1103
1133
|
mergeSmallChunks,
|
package/dist/chunking/index.js
CHANGED
|
@@ -39,8 +39,37 @@ __export(chunking_exports, {
|
|
|
39
39
|
});
|
|
40
40
|
module.exports = __toCommonJS(chunking_exports);
|
|
41
41
|
|
|
42
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/index.js
|
|
43
|
+
var import_node_crypto = require("crypto");
|
|
44
|
+
|
|
45
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/url-alphabet/index.js
|
|
46
|
+
var urlAlphabet = "useandom-26T198340PX75pxJACKVERYMINDBUSHWOLF_GQZbfghjklqvwyzrict";
|
|
47
|
+
|
|
48
|
+
// ../../node_modules/.pnpm/nanoid@5.1.6/node_modules/nanoid/index.js
|
|
49
|
+
var POOL_SIZE_MULTIPLIER = 128;
|
|
50
|
+
var pool;
|
|
51
|
+
var poolOffset;
|
|
52
|
+
function fillPool(bytes) {
|
|
53
|
+
if (!pool || pool.length < bytes) {
|
|
54
|
+
pool = Buffer.allocUnsafe(bytes * POOL_SIZE_MULTIPLIER);
|
|
55
|
+
import_node_crypto.webcrypto.getRandomValues(pool);
|
|
56
|
+
poolOffset = 0;
|
|
57
|
+
} else if (poolOffset + bytes > pool.length) {
|
|
58
|
+
import_node_crypto.webcrypto.getRandomValues(pool);
|
|
59
|
+
poolOffset = 0;
|
|
60
|
+
}
|
|
61
|
+
poolOffset += bytes;
|
|
62
|
+
}
|
|
63
|
+
function nanoid(size = 21) {
|
|
64
|
+
fillPool(size |= 0);
|
|
65
|
+
let id = "";
|
|
66
|
+
for (let i = poolOffset - size; i < poolOffset; i++) {
|
|
67
|
+
id += urlAlphabet[pool[i] & 63];
|
|
68
|
+
}
|
|
69
|
+
return id;
|
|
70
|
+
}
|
|
71
|
+
|
|
42
72
|
// src/chunking/BaseChunker.ts
|
|
43
|
-
var import_nanoid = require("nanoid");
|
|
44
73
|
var defaultTokenCounter = (text) => {
|
|
45
74
|
return Math.ceil(text.length / 4);
|
|
46
75
|
};
|
|
@@ -82,7 +111,7 @@ var BaseChunker = class {
|
|
|
82
111
|
if (options.source) metadata.source = options.source;
|
|
83
112
|
if (options.type) metadata.type = options.type;
|
|
84
113
|
return {
|
|
85
|
-
id: (0, import_nanoid.nanoid)(),
|
|
114
|
+
id: nanoid(),
|
|
86
115
|
text,
|
|
87
116
|
index,
|
|
88
117
|
startPosition,
|
|
@@ -190,7 +219,7 @@ function splitLargeChunks(chunks, maxTokens, tokenCounter) {
|
|
|
190
219
|
if (testTokens > maxTokens && currentText) {
|
|
191
220
|
result.push({
|
|
192
221
|
...chunk2,
|
|
193
|
-
id: (0, import_nanoid.nanoid)(),
|
|
222
|
+
id: nanoid(),
|
|
194
223
|
text: currentText,
|
|
195
224
|
startPosition: currentStart,
|
|
196
225
|
endPosition: currentStart + currentText.length,
|
|
@@ -206,7 +235,7 @@ function splitLargeChunks(chunks, maxTokens, tokenCounter) {
|
|
|
206
235
|
if (currentText) {
|
|
207
236
|
result.push({
|
|
208
237
|
...chunk2,
|
|
209
|
-
id: (0, import_nanoid.nanoid)(),
|
|
238
|
+
id: nanoid(),
|
|
210
239
|
text: currentText,
|
|
211
240
|
startPosition: currentStart,
|
|
212
241
|
endPosition: currentStart + currentText.length,
|
package/dist/chunking/index.mjs
CHANGED
|
@@ -259,7 +259,10 @@ declare class LocalProvider extends BaseProvider {
|
|
|
259
259
|
private embedFn;
|
|
260
260
|
private normalize;
|
|
261
261
|
private batchSize;
|
|
262
|
+
private readonly modelPath?;
|
|
263
|
+
private extractorPromise?;
|
|
262
264
|
constructor(config: LocalProviderOptions);
|
|
265
|
+
private getOnnxEmbedFn;
|
|
263
266
|
get info(): EmbeddingModelInfo;
|
|
264
267
|
protected doEmbed(texts: string[], options?: EmbeddingOptions): Promise<{
|
|
265
268
|
vectors: number[][];
|
|
@@ -259,7 +259,10 @@ declare class LocalProvider extends BaseProvider {
|
|
|
259
259
|
private embedFn;
|
|
260
260
|
private normalize;
|
|
261
261
|
private batchSize;
|
|
262
|
+
private readonly modelPath?;
|
|
263
|
+
private extractorPromise?;
|
|
262
264
|
constructor(config: LocalProviderOptions);
|
|
265
|
+
private getOnnxEmbedFn;
|
|
263
266
|
get info(): EmbeddingModelInfo;
|
|
264
267
|
protected doEmbed(texts: string[], options?: EmbeddingOptions): Promise<{
|
|
265
268
|
vectors: number[][];
|
package/dist/index.d.mts
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { E as EmbeddingProviderType, M as ModelInfo, a as EmbeddingModel } from './index-DmEEUzJg.mjs';
|
|
2
|
-
export { B as BaseProvider, b as BatchEmbeddingRequest, C as CohereProvider, c as CohereProviderConfig, d as CustomProviderConfig, e as EmbeddingRequest, H as HuggingFaceProvider, f as HuggingFaceProviderConfig, L as LocalEmbeddingFn, g as LocalProvider, h as LocalProviderConfig, i as LocalProviderOptions, j as ModelRegistry, O as OpenAIProvider, k as OpenAIProviderConfig, P as ProviderCapabilities, l as ProviderConfig, m as ProviderError, n as ProviderFactoryOptions, o as ProviderHealth, p as ProviderMetrics, q as ProviderResponse, R as RateLimitInfo, T as TokenUsage, V as VoyageProvider, r as VoyageProviderConfig, s as createCohereProvider, t as createHuggingFaceProvider, u as createLocalProvider, v as createMockProvider, w as createOpenAIProvider, x as createRandomProvider, y as createVoyageProvider, z as modelRegistry } from './index-DmEEUzJg.mjs';
|
|
1
|
+
import { E as EmbeddingProviderType, M as ModelInfo, a as EmbeddingModel } from './index-DGzfvyHY.mjs';
|
|
2
|
+
export { B as BaseProvider, b as BatchEmbeddingRequest, C as CohereProvider, c as CohereProviderConfig, d as CustomProviderConfig, e as EmbeddingRequest, H as HuggingFaceProvider, f as HuggingFaceProviderConfig, L as LocalEmbeddingFn, g as LocalProvider, h as LocalProviderConfig, i as LocalProviderOptions, j as ModelRegistry, O as OpenAIProvider, k as OpenAIProviderConfig, P as ProviderCapabilities, l as ProviderConfig, m as ProviderError, n as ProviderFactoryOptions, o as ProviderHealth, p as ProviderMetrics, q as ProviderResponse, R as RateLimitInfo, T as TokenUsage, V as VoyageProvider, r as VoyageProviderConfig, s as createCohereProvider, t as createHuggingFaceProvider, u as createLocalProvider, v as createMockProvider, w as createOpenAIProvider, x as createRandomProvider, y as createVoyageProvider, z as modelRegistry } from './index-DGzfvyHY.mjs';
|
|
3
3
|
import EventEmitter from 'eventemitter3';
|
|
4
4
|
import { E as EmbeddingVector, a as EmbeddingOptions, b as EmbeddingResult, B as BatchEmbeddingOptions, c as BatchEmbeddingResult, d as EmbeddedChunk, S as SearchOptions, e as SearchResult, D as DocumentEmbeddingOptions, f as EmbeddingStats } from './embedding.types-6Qr8Mgij.mjs';
|
|
5
5
|
export { g as BatchProgress, C as ChunkMetadata, h as EmbeddingModelInfo, i as SimilarityMetric } from './embedding.types-6Qr8Mgij.mjs';
|
package/dist/index.d.ts
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { E as EmbeddingProviderType, M as ModelInfo, a as EmbeddingModel } from './index-G-KgyvZT.js';
|
|
2
|
-
export { B as BaseProvider, b as BatchEmbeddingRequest, C as CohereProvider, c as CohereProviderConfig, d as CustomProviderConfig, e as EmbeddingRequest, H as HuggingFaceProvider, f as HuggingFaceProviderConfig, L as LocalEmbeddingFn, g as LocalProvider, h as LocalProviderConfig, i as LocalProviderOptions, j as ModelRegistry, O as OpenAIProvider, k as OpenAIProviderConfig, P as ProviderCapabilities, l as ProviderConfig, m as ProviderError, n as ProviderFactoryOptions, o as ProviderHealth, p as ProviderMetrics, q as ProviderResponse, R as RateLimitInfo, T as TokenUsage, V as VoyageProvider, r as VoyageProviderConfig, s as createCohereProvider, t as createHuggingFaceProvider, u as createLocalProvider, v as createMockProvider, w as createOpenAIProvider, x as createRandomProvider, y as createVoyageProvider, z as modelRegistry } from './index-G-KgyvZT.js';
|
|
1
|
+
import { E as EmbeddingProviderType, M as ModelInfo, a as EmbeddingModel } from './index-_uJcyK8e.js';
|
|
2
|
+
export { B as BaseProvider, b as BatchEmbeddingRequest, C as CohereProvider, c as CohereProviderConfig, d as CustomProviderConfig, e as EmbeddingRequest, H as HuggingFaceProvider, f as HuggingFaceProviderConfig, L as LocalEmbeddingFn, g as LocalProvider, h as LocalProviderConfig, i as LocalProviderOptions, j as ModelRegistry, O as OpenAIProvider, k as OpenAIProviderConfig, P as ProviderCapabilities, l as ProviderConfig, m as ProviderError, n as ProviderFactoryOptions, o as ProviderHealth, p as ProviderMetrics, q as ProviderResponse, R as RateLimitInfo, T as TokenUsage, V as VoyageProvider, r as VoyageProviderConfig, s as createCohereProvider, t as createHuggingFaceProvider, u as createLocalProvider, v as createMockProvider, w as createOpenAIProvider, x as createRandomProvider, y as createVoyageProvider, z as modelRegistry } from './index-_uJcyK8e.js';
|
|
3
3
|
import EventEmitter from 'eventemitter3';
|
|
4
4
|
import { E as EmbeddingVector, a as EmbeddingOptions, b as EmbeddingResult, B as BatchEmbeddingOptions, c as BatchEmbeddingResult, d as EmbeddedChunk, S as SearchOptions, e as SearchResult, D as DocumentEmbeddingOptions, f as EmbeddingStats } from './embedding.types-6Qr8Mgij.js';
|
|
5
5
|
export { g as BatchProgress, C as ChunkMetadata, h as EmbeddingModelInfo, i as SimilarityMetric } from './embedding.types-6Qr8Mgij.js';
|