@smythos/sre 1.5.46 → 1.5.50
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG +98 -90
- package/LICENSE +18 -18
- package/README.md +135 -135
- package/dist/bundle-analysis-lazy.html +4949 -0
- package/dist/bundle-analysis.html +4949 -0
- package/dist/index.js +3 -3
- package/dist/index.js.map +1 -1
- package/dist/types/Components/MCPClient.class.d.ts +1 -0
- package/dist/types/subsystems/LLMManager/LLM.service/connectors/openai/OpenAIConnector.class.d.ts +1 -6
- package/dist/types/utils/package-manager.utils.d.ts +26 -0
- package/package.json +1 -1
- package/src/Components/APICall/APICall.class.ts +156 -156
- package/src/Components/APICall/AccessTokenManager.ts +130 -130
- package/src/Components/APICall/ArrayBufferResponse.helper.ts +58 -58
- package/src/Components/APICall/OAuth.helper.ts +294 -294
- package/src/Components/APICall/mimeTypeCategories.ts +46 -46
- package/src/Components/APICall/parseData.ts +167 -167
- package/src/Components/APICall/parseHeaders.ts +41 -41
- package/src/Components/APICall/parseProxy.ts +68 -68
- package/src/Components/APICall/parseUrl.ts +91 -91
- package/src/Components/APIEndpoint.class.ts +234 -234
- package/src/Components/APIOutput.class.ts +58 -58
- package/src/Components/AgentPlugin.class.ts +102 -102
- package/src/Components/Async.class.ts +155 -155
- package/src/Components/Await.class.ts +90 -90
- package/src/Components/Classifier.class.ts +158 -158
- package/src/Components/Component.class.ts +132 -132
- package/src/Components/ComponentHost.class.ts +38 -38
- package/src/Components/DataSourceCleaner.class.ts +92 -92
- package/src/Components/DataSourceIndexer.class.ts +181 -181
- package/src/Components/DataSourceLookup.class.ts +161 -161
- package/src/Components/ECMASandbox.class.ts +71 -71
- package/src/Components/FEncDec.class.ts +29 -29
- package/src/Components/FHash.class.ts +33 -33
- package/src/Components/FSign.class.ts +80 -80
- package/src/Components/FSleep.class.ts +25 -25
- package/src/Components/FTimestamp.class.ts +25 -25
- package/src/Components/FileStore.class.ts +78 -78
- package/src/Components/ForEach.class.ts +97 -97
- package/src/Components/GPTPlugin.class.ts +70 -70
- package/src/Components/GenAILLM.class.ts +586 -586
- package/src/Components/HuggingFace.class.ts +314 -314
- package/src/Components/Image/imageSettings.config.ts +70 -70
- package/src/Components/ImageGenerator.class.ts +502 -502
- package/src/Components/JSONFilter.class.ts +54 -54
- package/src/Components/LLMAssistant.class.ts +213 -213
- package/src/Components/LogicAND.class.ts +28 -28
- package/src/Components/LogicAtLeast.class.ts +85 -85
- package/src/Components/LogicAtMost.class.ts +86 -86
- package/src/Components/LogicOR.class.ts +29 -29
- package/src/Components/LogicXOR.class.ts +34 -34
- package/src/Components/MCPClient.class.ts +138 -112
- package/src/Components/MemoryDeleteKeyVal.class.ts +70 -70
- package/src/Components/MemoryReadKeyVal.class.ts +66 -66
- package/src/Components/MemoryWriteKeyVal.class.ts +62 -62
- package/src/Components/MemoryWriteObject.class.ts +97 -97
- package/src/Components/MultimodalLLM.class.ts +128 -128
- package/src/Components/OpenAPI.class.ts +72 -72
- package/src/Components/PromptGenerator.class.ts +122 -122
- package/src/Components/ScrapflyWebScrape.class.ts +159 -159
- package/src/Components/ServerlessCode.class.ts +123 -123
- package/src/Components/TavilyWebSearch.class.ts +98 -98
- package/src/Components/VisionLLM.class.ts +104 -104
- package/src/Components/ZapierAction.class.ts +127 -127
- package/src/Components/index.ts +97 -97
- package/src/Core/AgentProcess.helper.ts +240 -240
- package/src/Core/Connector.class.ts +123 -123
- package/src/Core/ConnectorsService.ts +197 -197
- package/src/Core/DummyConnector.ts +49 -49
- package/src/Core/HookService.ts +105 -105
- package/src/Core/SmythRuntime.class.ts +235 -235
- package/src/Core/SystemEvents.ts +16 -16
- package/src/Core/boot.ts +56 -56
- package/src/config.ts +15 -15
- package/src/constants.ts +126 -126
- package/src/data/hugging-face.params.json +579 -579
- package/src/helpers/AWSLambdaCode.helper.ts +587 -587
- package/src/helpers/BinaryInput.helper.ts +331 -331
- package/src/helpers/Conversation.helper.ts +1119 -1119
- package/src/helpers/ECMASandbox.helper.ts +54 -54
- package/src/helpers/JsonContent.helper.ts +97 -97
- package/src/helpers/LocalCache.helper.ts +97 -97
- package/src/helpers/Log.helper.ts +274 -274
- package/src/helpers/OpenApiParser.helper.ts +150 -150
- package/src/helpers/S3Cache.helper.ts +147 -147
- package/src/helpers/SmythURI.helper.ts +5 -5
- package/src/helpers/Sysconfig.helper.ts +77 -77
- package/src/helpers/TemplateString.helper.ts +243 -243
- package/src/helpers/TypeChecker.helper.ts +329 -329
- package/src/index.ts +3 -3
- package/src/index.ts.bak +3 -3
- package/src/subsystems/AgentManager/Agent.class.ts +1114 -1114
- package/src/subsystems/AgentManager/Agent.helper.ts +3 -3
- package/src/subsystems/AgentManager/AgentData.service/AgentDataConnector.ts +230 -230
- package/src/subsystems/AgentManager/AgentData.service/connectors/CLIAgentDataConnector.class.ts +66 -66
- package/src/subsystems/AgentManager/AgentData.service/connectors/LocalAgentDataConnector.class.ts +142 -142
- package/src/subsystems/AgentManager/AgentData.service/connectors/NullAgentData.class.ts +39 -39
- package/src/subsystems/AgentManager/AgentData.service/index.ts +18 -18
- package/src/subsystems/AgentManager/AgentLogger.class.ts +297 -297
- package/src/subsystems/AgentManager/AgentRequest.class.ts +51 -51
- package/src/subsystems/AgentManager/AgentRuntime.class.ts +559 -559
- package/src/subsystems/AgentManager/AgentSSE.class.ts +101 -101
- package/src/subsystems/AgentManager/AgentSettings.class.ts +52 -52
- package/src/subsystems/AgentManager/Component.service/ComponentConnector.ts +32 -32
- package/src/subsystems/AgentManager/Component.service/connectors/LocalComponentConnector.class.ts +60 -60
- package/src/subsystems/AgentManager/Component.service/index.ts +11 -11
- package/src/subsystems/AgentManager/EmbodimentSettings.class.ts +47 -47
- package/src/subsystems/AgentManager/ForkedAgent.class.ts +154 -154
- package/src/subsystems/AgentManager/OSResourceMonitor.ts +77 -77
- package/src/subsystems/ComputeManager/Code.service/CodeConnector.ts +98 -98
- package/src/subsystems/ComputeManager/Code.service/connectors/AWSLambdaCode.class.ts +172 -172
- package/src/subsystems/ComputeManager/Code.service/connectors/ECMASandbox.class.ts +131 -131
- package/src/subsystems/ComputeManager/Code.service/index.ts +13 -13
- package/src/subsystems/IO/CLI.service/CLIConnector.ts +47 -47
- package/src/subsystems/IO/CLI.service/index.ts +9 -9
- package/src/subsystems/IO/Log.service/LogConnector.ts +32 -32
- package/src/subsystems/IO/Log.service/connectors/ConsoleLog.class.ts +28 -28
- package/src/subsystems/IO/Log.service/index.ts +13 -13
- package/src/subsystems/IO/NKV.service/NKVConnector.ts +43 -43
- package/src/subsystems/IO/NKV.service/connectors/NKVLocalStorage.class.ts +234 -234
- package/src/subsystems/IO/NKV.service/connectors/NKVRAM.class.ts +204 -204
- package/src/subsystems/IO/NKV.service/connectors/NKVRedis.class.ts +182 -182
- package/src/subsystems/IO/NKV.service/index.ts +14 -14
- package/src/subsystems/IO/Router.service/RouterConnector.ts +21 -21
- package/src/subsystems/IO/Router.service/connectors/ExpressRouter.class.ts +48 -48
- package/src/subsystems/IO/Router.service/connectors/NullRouter.class.ts +40 -40
- package/src/subsystems/IO/Router.service/index.ts +11 -11
- package/src/subsystems/IO/Storage.service/SmythFS.class.ts +489 -489
- package/src/subsystems/IO/Storage.service/StorageConnector.ts +66 -66
- package/src/subsystems/IO/Storage.service/connectors/LocalStorage.class.ts +327 -327
- package/src/subsystems/IO/Storage.service/connectors/S3Storage.class.ts +482 -482
- package/src/subsystems/IO/Storage.service/index.ts +13 -13
- package/src/subsystems/IO/VectorDB.service/VectorDBConnector.ts +108 -108
- package/src/subsystems/IO/VectorDB.service/connectors/MilvusVectorDB.class.ts +454 -454
- package/src/subsystems/IO/VectorDB.service/connectors/PineconeVectorDB.class.ts +384 -384
- package/src/subsystems/IO/VectorDB.service/connectors/RAMVecrtorDB.class.ts +421 -421
- package/src/subsystems/IO/VectorDB.service/embed/BaseEmbedding.ts +107 -107
- package/src/subsystems/IO/VectorDB.service/embed/OpenAIEmbedding.ts +109 -109
- package/src/subsystems/IO/VectorDB.service/embed/index.ts +21 -21
- package/src/subsystems/IO/VectorDB.service/index.ts +14 -14
- package/src/subsystems/LLMManager/LLM.helper.ts +251 -251
- package/src/subsystems/LLMManager/LLM.inference.ts +339 -339
- package/src/subsystems/LLMManager/LLM.service/LLMConnector.ts +489 -489
- package/src/subsystems/LLMManager/LLM.service/LLMCredentials.helper.ts +171 -171
- package/src/subsystems/LLMManager/LLM.service/connectors/Anthropic.class.ts +659 -659
- package/src/subsystems/LLMManager/LLM.service/connectors/Bedrock.class.ts +400 -400
- package/src/subsystems/LLMManager/LLM.service/connectors/Echo.class.ts +77 -77
- package/src/subsystems/LLMManager/LLM.service/connectors/GoogleAI.class.ts +757 -757
- package/src/subsystems/LLMManager/LLM.service/connectors/Groq.class.ts +304 -304
- package/src/subsystems/LLMManager/LLM.service/connectors/Perplexity.class.ts +250 -250
- package/src/subsystems/LLMManager/LLM.service/connectors/VertexAI.class.ts +423 -423
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/OpenAIConnector.class.ts +488 -488
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/ChatCompletionsApiInterface.ts +524 -524
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/OpenAIApiInterface.ts +100 -100
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/OpenAIApiInterfaceFactory.ts +81 -81
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/ResponsesApiInterface.ts +1145 -1145
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/constants.ts +13 -13
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/index.ts +4 -4
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/apiInterfaces/utils.ts +11 -11
- package/src/subsystems/LLMManager/LLM.service/connectors/openai/types.ts +32 -32
- package/src/subsystems/LLMManager/LLM.service/connectors/xAI.class.ts +471 -471
- package/src/subsystems/LLMManager/LLM.service/index.ts +44 -44
- package/src/subsystems/LLMManager/ModelsProvider.service/ModelsProviderConnector.ts +300 -300
- package/src/subsystems/LLMManager/ModelsProvider.service/connectors/JSONModelsProvider.class.ts +252 -252
- package/src/subsystems/LLMManager/ModelsProvider.service/index.ts +11 -11
- package/src/subsystems/LLMManager/custom-models.ts +854 -854
- package/src/subsystems/LLMManager/models.ts +2540 -2540
- package/src/subsystems/LLMManager/paramMappings.ts +69 -69
- package/src/subsystems/MemoryManager/Cache.service/CacheConnector.ts +86 -86
- package/src/subsystems/MemoryManager/Cache.service/connectors/LocalStorageCache.class.ts +297 -297
- package/src/subsystems/MemoryManager/Cache.service/connectors/RAMCache.class.ts +201 -201
- package/src/subsystems/MemoryManager/Cache.service/connectors/RedisCache.class.ts +252 -252
- package/src/subsystems/MemoryManager/Cache.service/connectors/S3Cache.class.ts +373 -373
- package/src/subsystems/MemoryManager/Cache.service/index.ts +15 -15
- package/src/subsystems/MemoryManager/LLMCache.ts +72 -72
- package/src/subsystems/MemoryManager/LLMContext.ts +124 -124
- package/src/subsystems/MemoryManager/LLMMemory.service/LLMMemoryConnector.ts +26 -26
- package/src/subsystems/MemoryManager/RuntimeContext.ts +266 -266
- package/src/subsystems/Security/AccessControl/ACL.class.ts +208 -208
- package/src/subsystems/Security/AccessControl/AccessCandidate.class.ts +82 -82
- package/src/subsystems/Security/AccessControl/AccessRequest.class.ts +52 -52
- package/src/subsystems/Security/Account.service/AccountConnector.ts +44 -44
- package/src/subsystems/Security/Account.service/connectors/AWSAccount.class.ts +76 -76
- package/src/subsystems/Security/Account.service/connectors/DummyAccount.class.ts +130 -130
- package/src/subsystems/Security/Account.service/connectors/JSONFileAccount.class.ts +159 -159
- package/src/subsystems/Security/Account.service/index.ts +14 -14
- package/src/subsystems/Security/Credentials.helper.ts +62 -62
- package/src/subsystems/Security/ManagedVault.service/ManagedVaultConnector.ts +38 -38
- package/src/subsystems/Security/ManagedVault.service/connectors/NullManagedVault.class.ts +53 -53
- package/src/subsystems/Security/ManagedVault.service/connectors/SecretManagerManagedVault.ts +154 -154
- package/src/subsystems/Security/ManagedVault.service/index.ts +12 -12
- package/src/subsystems/Security/SecureConnector.class.ts +110 -110
- package/src/subsystems/Security/Vault.service/Vault.helper.ts +30 -30
- package/src/subsystems/Security/Vault.service/VaultConnector.ts +29 -29
- package/src/subsystems/Security/Vault.service/connectors/HashicorpVault.class.ts +46 -46
- package/src/subsystems/Security/Vault.service/connectors/JSONFileVault.class.ts +221 -221
- package/src/subsystems/Security/Vault.service/connectors/NullVault.class.ts +54 -54
- package/src/subsystems/Security/Vault.service/connectors/SecretsManager.class.ts +140 -140
- package/src/subsystems/Security/Vault.service/index.ts +12 -12
- package/src/types/ACL.types.ts +104 -104
- package/src/types/AWS.types.ts +10 -10
- package/src/types/Agent.types.ts +61 -61
- package/src/types/AgentLogger.types.ts +17 -17
- package/src/types/Cache.types.ts +1 -1
- package/src/types/Common.types.ts +2 -2
- package/src/types/LLM.types.ts +496 -496
- package/src/types/Redis.types.ts +8 -8
- package/src/types/SRE.types.ts +64 -64
- package/src/types/Security.types.ts +14 -14
- package/src/types/Storage.types.ts +5 -5
- package/src/types/VectorDB.types.ts +86 -86
- package/src/utils/base64.utils.ts +275 -275
- package/src/utils/cli.utils.ts +68 -68
- package/src/utils/data.utils.ts +322 -322
- package/src/utils/date-time.utils.ts +22 -22
- package/src/utils/general.utils.ts +238 -238
- package/src/utils/index.ts +12 -12
- package/src/utils/lazy-client.ts +261 -261
- package/src/utils/numbers.utils.ts +13 -13
- package/src/utils/oauth.utils.ts +35 -35
- package/src/utils/string.utils.ts +414 -414
- package/src/utils/url.utils.ts +19 -19
- package/src/utils/validation.utils.ts +74 -74
- package/dist/types/subsystems/LLMManager/ModelsProvider.service/connectors/SmythModelsProvider.class.d.ts +0 -39
|
@@ -1,384 +1,384 @@
|
|
|
1
|
-
//==[ SRE: S3Storage ]======================
|
|
2
|
-
import { ACL } from '@sre/Security/AccessControl/ACL.class';
|
|
3
|
-
import { IAccessCandidate, IACL, TAccessLevel, TAccessRole } from '@sre/types/ACL.types';
|
|
4
|
-
import { AccessRequest } from '@sre/Security/AccessControl/AccessRequest.class';
|
|
5
|
-
import { AccessCandidate } from '@sre/Security/AccessControl/AccessCandidate.class';
|
|
6
|
-
import { SecureConnector } from '@sre/Security/SecureConnector.class';
|
|
7
|
-
import { VectorDBConnector, DeleteTarget } from '../VectorDBConnector';
|
|
8
|
-
import {
|
|
9
|
-
DatasourceDto,
|
|
10
|
-
IStorageVectorDataSource,
|
|
11
|
-
IStorageVectorNamespace,
|
|
12
|
-
IVectorDataSourceDto,
|
|
13
|
-
QueryOptions,
|
|
14
|
-
VectorsResultData,
|
|
15
|
-
} from '@sre/types/VectorDB.types';
|
|
16
|
-
import { Pinecone } from '@pinecone-database/pinecone';
|
|
17
|
-
import { ConnectorService } from '@sre/Core/ConnectorsService';
|
|
18
|
-
import { Logger } from '@sre/helpers/Log.helper';
|
|
19
|
-
import { NKVConnector } from '@sre/IO/NKV.service/NKVConnector';
|
|
20
|
-
import { AccountConnector } from '@sre/Security/Account.service/AccountConnector';
|
|
21
|
-
import { JSONContentHelper } from '@sre/helpers/JsonContent.helper';
|
|
22
|
-
import { CacheConnector } from '@sre/MemoryManager/Cache.service/CacheConnector';
|
|
23
|
-
import crypto from 'crypto';
|
|
24
|
-
import { BaseEmbedding, TEmbeddings } from '../embed/BaseEmbedding';
|
|
25
|
-
import { EmbeddingsFactory, SupportedProviders, SupportedModels } from '../embed';
|
|
26
|
-
import { chunkText } from '@sre/utils/string.utils';
|
|
27
|
-
import { jsonrepair } from 'jsonrepair';
|
|
28
|
-
|
|
29
|
-
const console = Logger('Pinecone VectorDB');
|
|
30
|
-
|
|
31
|
-
export type PineconeConfig = {
|
|
32
|
-
/**
|
|
33
|
-
* The Pinecone API key
|
|
34
|
-
*/
|
|
35
|
-
apiKey: string;
|
|
36
|
-
/**
|
|
37
|
-
* The Pinecone index name
|
|
38
|
-
*/
|
|
39
|
-
indexName: string;
|
|
40
|
-
/**
|
|
41
|
-
* The embeddings model to use
|
|
42
|
-
*/
|
|
43
|
-
embeddings: TEmbeddings;
|
|
44
|
-
};
|
|
45
|
-
export class PineconeVectorDB extends VectorDBConnector {
|
|
46
|
-
public name = 'PineconeVectorDB';
|
|
47
|
-
public id = 'pinecone';
|
|
48
|
-
private client: Pinecone;
|
|
49
|
-
private indexName: string;
|
|
50
|
-
private cache: CacheConnector;
|
|
51
|
-
private accountConnector: AccountConnector;
|
|
52
|
-
private nkvConnector: NKVConnector;
|
|
53
|
-
public embedder: BaseEmbedding;
|
|
54
|
-
|
|
55
|
-
constructor(protected _settings: PineconeConfig) {
|
|
56
|
-
super(_settings);
|
|
57
|
-
if (!_settings.apiKey) {
|
|
58
|
-
console.warn('Missing Pinecone API key : returning empty Pinecone connector');
|
|
59
|
-
return;
|
|
60
|
-
}
|
|
61
|
-
if (!_settings.indexName) {
|
|
62
|
-
console.warn('Missing Pinecone index name : returning empty Pinecone connector');
|
|
63
|
-
return;
|
|
64
|
-
}
|
|
65
|
-
|
|
66
|
-
this.client = new Pinecone({
|
|
67
|
-
apiKey: _settings.apiKey,
|
|
68
|
-
});
|
|
69
|
-
console.info('Pinecone client initialized');
|
|
70
|
-
console.info('Pinecone index name:', _settings.indexName);
|
|
71
|
-
this.indexName = _settings.indexName;
|
|
72
|
-
this.accountConnector = ConnectorService.getAccountConnector();
|
|
73
|
-
this.cache = ConnectorService.getCacheConnector();
|
|
74
|
-
this.nkvConnector = ConnectorService.getNKVConnector();
|
|
75
|
-
if (!_settings.embeddings.params) _settings.embeddings.params = { dimensions: 1024 };
|
|
76
|
-
if (!_settings.embeddings.params?.dimensions) _settings.embeddings.params.dimensions = 1024;
|
|
77
|
-
|
|
78
|
-
this.embedder = EmbeddingsFactory.create(_settings.embeddings.provider, _settings.embeddings);
|
|
79
|
-
}
|
|
80
|
-
|
|
81
|
-
public async getResourceACL(resourceId: string, candidate: IAccessCandidate): Promise<ACL> {
|
|
82
|
-
//const teamId = await this.accountConnector.getCandidateTeam(AccessCandidate.clone(candidate));
|
|
83
|
-
const preparedNs = this.constructNsName(candidate as AccessCandidate, resourceId);
|
|
84
|
-
const acl = await this.getACL(AccessCandidate.clone(candidate), preparedNs);
|
|
85
|
-
const exists = !!acl;
|
|
86
|
-
|
|
87
|
-
if (!exists) {
|
|
88
|
-
//the resource does not exist yet, we grant write access to the candidate in order to allow the resource creation
|
|
89
|
-
return new ACL().addAccess(candidate.role, candidate.id, TAccessLevel.Owner);
|
|
90
|
-
}
|
|
91
|
-
return ACL.from(acl);
|
|
92
|
-
}
|
|
93
|
-
|
|
94
|
-
@SecureConnector.AccessControl
|
|
95
|
-
protected async createNamespace(acRequest: AccessRequest, namespace: string, metadata?: { [key: string]: any }): Promise<void> {
|
|
96
|
-
//* Since Pinecone does not create explicit namespaces,
|
|
97
|
-
//* we create a zero or dummy vector in the namespace to trigger the namespace creation and filter it out
|
|
98
|
-
|
|
99
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
100
|
-
const preparedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
|
|
101
|
-
|
|
102
|
-
const acl = new ACL().addAccess(acRequest.candidate.role, acRequest.candidate.id, TAccessLevel.Owner);
|
|
103
|
-
|
|
104
|
-
const nsData = {
|
|
105
|
-
acl: acl.serializedACL,
|
|
106
|
-
displayName: namespace,
|
|
107
|
-
...metadata,
|
|
108
|
-
};
|
|
109
|
-
await this.client
|
|
110
|
-
.Index(this.indexName)
|
|
111
|
-
.namespace(preparedNs)
|
|
112
|
-
.upsert([
|
|
113
|
-
{
|
|
114
|
-
id: `_reserved_${preparedNs}`,
|
|
115
|
-
values: this.embedder.dummyVector,
|
|
116
|
-
metadata: {
|
|
117
|
-
isSkeletonVector: true,
|
|
118
|
-
...nsData,
|
|
119
|
-
},
|
|
120
|
-
},
|
|
121
|
-
]);
|
|
122
|
-
|
|
123
|
-
await this.setACL(acRequest, preparedNs, acl.ACL);
|
|
124
|
-
|
|
125
|
-
return new Promise<void>((resolve) => resolve());
|
|
126
|
-
}
|
|
127
|
-
|
|
128
|
-
@SecureConnector.AccessControl
|
|
129
|
-
protected async namespaceExists(acRequest: AccessRequest, namespace: string): Promise<boolean> {
|
|
130
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
131
|
-
const stats = await this.client.Index(this.indexName).describeIndexStats();
|
|
132
|
-
return Object.keys(stats.namespaces).includes(this.constructNsName(acRequest.candidate as AccessCandidate, namespace));
|
|
133
|
-
}
|
|
134
|
-
|
|
135
|
-
@SecureConnector.AccessControl
|
|
136
|
-
protected async deleteNamespace(acRequest: AccessRequest, namespace: string): Promise<void> {
|
|
137
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
138
|
-
//const candidate = AccessCandidate.team(teamId);
|
|
139
|
-
const preparedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
|
|
140
|
-
|
|
141
|
-
await this.client
|
|
142
|
-
.Index(this.indexName)
|
|
143
|
-
.namespace(this.constructNsName(acRequest.candidate as AccessCandidate, namespace))
|
|
144
|
-
.deleteAll()
|
|
145
|
-
.catch((e) => {
|
|
146
|
-
if (e?.name == 'PineconeNotFoundError') {
|
|
147
|
-
console.warn(`Namespace ${namespace} does not exist and was requested to be deleted`);
|
|
148
|
-
return;
|
|
149
|
-
}
|
|
150
|
-
throw e;
|
|
151
|
-
});
|
|
152
|
-
|
|
153
|
-
await this.deleteACL(AccessCandidate.clone(acRequest.candidate), namespace);
|
|
154
|
-
}
|
|
155
|
-
|
|
156
|
-
@SecureConnector.AccessControl
|
|
157
|
-
protected async search(
|
|
158
|
-
acRequest: AccessRequest,
|
|
159
|
-
namespace: string,
|
|
160
|
-
query: string | number[],
|
|
161
|
-
options: QueryOptions = {}
|
|
162
|
-
): Promise<VectorsResultData> {
|
|
163
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
164
|
-
|
|
165
|
-
const pineconeIndex = this.client.Index(this.indexName).namespace(this.constructNsName(acRequest.candidate as AccessCandidate, namespace));
|
|
166
|
-
let _vector = query;
|
|
167
|
-
if (typeof query === 'string') {
|
|
168
|
-
_vector = await this.embedder.embedText(query, acRequest.candidate as AccessCandidate);
|
|
169
|
-
}
|
|
170
|
-
|
|
171
|
-
const topK = (options.topK || 10) + 1; //* we increment one in case it included the skeleton vector
|
|
172
|
-
|
|
173
|
-
const results = await pineconeIndex.query({
|
|
174
|
-
topK,
|
|
175
|
-
vector: _vector as number[],
|
|
176
|
-
includeMetadata: true,
|
|
177
|
-
includeValues: true,
|
|
178
|
-
});
|
|
179
|
-
|
|
180
|
-
let matches = [];
|
|
181
|
-
|
|
182
|
-
for (const match of results.matches) {
|
|
183
|
-
if (match.metadata?.isSkeletonVector) continue;
|
|
184
|
-
|
|
185
|
-
if (match.metadata?.[this.USER_METADATA_KEY]) {
|
|
186
|
-
match.metadata[this.USER_METADATA_KEY] = JSONContentHelper.create(match.metadata[this.USER_METADATA_KEY].toString()).tryParse();
|
|
187
|
-
}
|
|
188
|
-
|
|
189
|
-
matches.push({
|
|
190
|
-
id: match.id,
|
|
191
|
-
values: match.values,
|
|
192
|
-
text: match.metadata?.text as string | undefined,
|
|
193
|
-
metadata: match.metadata?.[this.USER_METADATA_KEY] as Record<string, any> | undefined,
|
|
194
|
-
score: match.score,
|
|
195
|
-
});
|
|
196
|
-
}
|
|
197
|
-
|
|
198
|
-
// in the case where we did not filter out the skeleton vector, we need to remove the extra match from the results
|
|
199
|
-
return matches.slice(0, options.topK);
|
|
200
|
-
}
|
|
201
|
-
|
|
202
|
-
@SecureConnector.AccessControl
|
|
203
|
-
protected async insert(
|
|
204
|
-
acRequest: AccessRequest,
|
|
205
|
-
namespace: string,
|
|
206
|
-
sourceWrapper: IVectorDataSourceDto | IVectorDataSourceDto[]
|
|
207
|
-
): Promise<string[]> {
|
|
208
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
209
|
-
sourceWrapper = Array.isArray(sourceWrapper) ? sourceWrapper : [sourceWrapper];
|
|
210
|
-
|
|
211
|
-
// make sure that all sources are of the same type (source.source)
|
|
212
|
-
if (sourceWrapper.some((s) => this.embedder.detectSourceType(s.source) !== this.embedder.detectSourceType(sourceWrapper[0].source))) {
|
|
213
|
-
throw new Error('All sources must be of the same type');
|
|
214
|
-
}
|
|
215
|
-
|
|
216
|
-
const sourceType = this.embedder.detectSourceType(sourceWrapper[0].source);
|
|
217
|
-
if (sourceType === 'unknown' || sourceType === 'url') throw new Error('Invalid source type');
|
|
218
|
-
const transformedSource = await this.embedder.transformSource(sourceWrapper, sourceType, acRequest.candidate as AccessCandidate);
|
|
219
|
-
const preparedSource = transformedSource.map((s) => ({
|
|
220
|
-
id: s.id,
|
|
221
|
-
values: s.source as number[],
|
|
222
|
-
metadata: s.metadata,
|
|
223
|
-
}));
|
|
224
|
-
|
|
225
|
-
// await pineconeStore.addDocuments(chunks, ids);
|
|
226
|
-
await this.client
|
|
227
|
-
.Index(this.indexName)
|
|
228
|
-
.namespace(this.constructNsName(acRequest.candidate as AccessCandidate, namespace))
|
|
229
|
-
.upsert(preparedSource);
|
|
230
|
-
|
|
231
|
-
const accessCandidate = acRequest.candidate;
|
|
232
|
-
|
|
233
|
-
const isNewNs = !(await this.requester(AccessCandidate.clone(accessCandidate)).namespaceExists(namespace));
|
|
234
|
-
if (isNewNs) {
|
|
235
|
-
let acl = new ACL().addAccess(accessCandidate.role, accessCandidate.id, TAccessLevel.Owner).ACL;
|
|
236
|
-
await this.setACL(acRequest, namespace, acl);
|
|
237
|
-
}
|
|
238
|
-
|
|
239
|
-
return preparedSource.map((s) => s.id);
|
|
240
|
-
}
|
|
241
|
-
|
|
242
|
-
@SecureConnector.AccessControl
|
|
243
|
-
protected async delete(acRequest: AccessRequest, namespace: string, deleteTarget: DeleteTarget): Promise<void> {
|
|
244
|
-
const isDeleteByFilter = typeof deleteTarget === 'object';
|
|
245
|
-
|
|
246
|
-
if (isDeleteByFilter) {
|
|
247
|
-
// TODO: handle delete by filter logic
|
|
248
|
-
} else {
|
|
249
|
-
const _ids = Array.isArray(deleteTarget) ? deleteTarget : [deleteTarget];
|
|
250
|
-
|
|
251
|
-
const res = await this.client
|
|
252
|
-
.Index(this.indexName)
|
|
253
|
-
.namespace(this.constructNsName(acRequest.candidate as AccessCandidate, namespace))
|
|
254
|
-
.deleteMany(_ids);
|
|
255
|
-
}
|
|
256
|
-
}
|
|
257
|
-
|
|
258
|
-
@SecureConnector.AccessControl
|
|
259
|
-
protected async createDatasource(acRequest: AccessRequest, namespace: string, datasource: DatasourceDto): Promise<IStorageVectorDataSource> {
|
|
260
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
261
|
-
const acl = new ACL().addAccess(acRequest.candidate.role, acRequest.candidate.id, TAccessLevel.Owner);
|
|
262
|
-
const dsId = datasource.id || crypto.randomUUID();
|
|
263
|
-
|
|
264
|
-
const formattedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
|
|
265
|
-
const chunkedText = chunkText(datasource.text, {
|
|
266
|
-
chunkSize: datasource.chunkSize,
|
|
267
|
-
chunkOverlap: datasource.chunkOverlap,
|
|
268
|
-
});
|
|
269
|
-
const label = datasource.label || 'Untitled';
|
|
270
|
-
const ids = Array.from({ length: chunkedText.length }, (_, i) => `${dsId}_${crypto.randomUUID()}`);
|
|
271
|
-
const source: IVectorDataSourceDto[] = chunkedText.map((doc, i) => {
|
|
272
|
-
return {
|
|
273
|
-
id: ids[i],
|
|
274
|
-
source: doc,
|
|
275
|
-
metadata: {
|
|
276
|
-
acl: acl.serializedACL,
|
|
277
|
-
namespaceId: formattedNs,
|
|
278
|
-
datasourceId: dsId,
|
|
279
|
-
datasourceLabel: label,
|
|
280
|
-
user_metadata: datasource.metadata ? jsonrepair(JSON.stringify(datasource.metadata)) : undefined,
|
|
281
|
-
},
|
|
282
|
-
};
|
|
283
|
-
});
|
|
284
|
-
|
|
285
|
-
const _vIds = await this.insert(acRequest, namespace, source);
|
|
286
|
-
|
|
287
|
-
const dsData: IStorageVectorDataSource = {
|
|
288
|
-
namespaceId: formattedNs,
|
|
289
|
-
candidateId: acRequest.candidate.id,
|
|
290
|
-
candidateRole: acRequest.candidate.role,
|
|
291
|
-
name: datasource.label || 'Untitled',
|
|
292
|
-
metadata: datasource.metadata ? jsonrepair(JSON.stringify(datasource.metadata)) : undefined,
|
|
293
|
-
text: datasource.text,
|
|
294
|
-
vectorIds: _vIds,
|
|
295
|
-
id: dsId,
|
|
296
|
-
};
|
|
297
|
-
// const url = `smythfs://${teamId}.team/_datasources/${dsId}.json`;
|
|
298
|
-
// await SmythFS.Instance.write(url, JSON.stringify(dsData), AccessCandidate.team(teamId));
|
|
299
|
-
await this.nkvConnector
|
|
300
|
-
.requester(acRequest.candidate as AccessCandidate)
|
|
301
|
-
.set(`vectorDB:${this.id}:namespaces:${formattedNs}:datasources`, dsId, JSON.stringify(dsData));
|
|
302
|
-
// return { id: dsId, vectorIds: _vIds };
|
|
303
|
-
return dsData;
|
|
304
|
-
}
|
|
305
|
-
|
|
306
|
-
@SecureConnector.AccessControl
|
|
307
|
-
protected async deleteDatasource(acRequest: AccessRequest, namespace: string, datasourceId: string): Promise<void> {
|
|
308
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
309
|
-
const formattedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
|
|
310
|
-
// const url = `smythfs://${teamId}.team/_datasources/${dsId}.json`;
|
|
311
|
-
// await SmythFS.Instance.delete(url, AccessCandidate.team(teamId));
|
|
312
|
-
let ds: IStorageVectorDataSource = JSONContentHelper.create(
|
|
313
|
-
(
|
|
314
|
-
await this.nkvConnector
|
|
315
|
-
.requester(acRequest.candidate as AccessCandidate)
|
|
316
|
-
.get(`vectorDB:${this.id}:namespaces:${formattedNs}:datasources`, datasourceId)
|
|
317
|
-
)?.toString()
|
|
318
|
-
).tryParse();
|
|
319
|
-
|
|
320
|
-
if (!ds || typeof ds !== 'object') {
|
|
321
|
-
throw new Error(`Data source not found with id: ${datasourceId}`);
|
|
322
|
-
}
|
|
323
|
-
|
|
324
|
-
await this.delete(acRequest, namespace, ds.vectorIds || []);
|
|
325
|
-
|
|
326
|
-
await this.nkvConnector
|
|
327
|
-
.requester(acRequest.candidate as AccessCandidate)
|
|
328
|
-
.delete(`vectorDB:${this.id}:namespaces:${formattedNs}:datasources`, datasourceId);
|
|
329
|
-
}
|
|
330
|
-
|
|
331
|
-
@SecureConnector.AccessControl
|
|
332
|
-
protected async listDatasources(acRequest: AccessRequest, namespace: string): Promise<IStorageVectorDataSource[]> {
|
|
333
|
-
//const teamId = await this.accountConnector.getCandidateTeam(acRequest.candidate);
|
|
334
|
-
const formattedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
|
|
335
|
-
return (
|
|
336
|
-
await this.nkvConnector
|
|
337
|
-
.requester(acRequest.candidate as AccessCandidate)
|
|
338
|
-
.list(`vectorDB:${this.id}:namespaces:${formattedNs}:datasources`)
|
|
339
|
-
).map((ds) => {
|
|
340
|
-
return JSONContentHelper.create(ds.data?.toString()).tryParse() as IStorageVectorDataSource;
|
|
341
|
-
});
|
|
342
|
-
}
|
|
343
|
-
|
|
344
|
-
/**
 * Loads a single datasource record from the NKV store.
 *
 * @param acRequest - access request; its candidate scopes both the namespace name and the NKV requester
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param datasourceId - id the record was stored under
 * @returns the stored value after it has been run through `JSONContentHelper.tryParse`
 */
@SecureConnector.AccessControl
protected async getDatasource(acRequest: AccessRequest, namespace: string, datasourceId: string): Promise<IStorageVectorDataSource> {
    const candidate = acRequest.candidate as AccessCandidate;
    const storeKey = `vectorDB:${this.id}:namespaces:${this.constructNsName(candidate, namespace)}:datasources`;
    const rawRecord = await this.nkvConnector.requester(candidate).get(storeKey, datasourceId);

    return JSONContentHelper.create(rawRecord?.toString()).tryParse() as IStorageVectorDataSource;
}
|
|
356
|
-
|
|
357
|
-
/**
 * Stores a namespace ACL in the cache as a JSON string.
 *
 * @param acRequest - access request whose candidate (cloned) is used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 * @param acl - ACL object to serialize and store
 */
private async setACL(acRequest: AccessRequest, preparedNs: string, acl: IACL): Promise<void> {
    const cacheRequester = this.cache.requester(AccessCandidate.clone(acRequest.candidate));
    const aclKey = `vectorDB:pinecone:namespace:${preparedNs}:acl`;

    await cacheRequester.set(aclKey, JSON.stringify(acl));
}
|
|
362
|
-
|
|
363
|
-
/**
 * Reads a namespace ACL from the cache.
 *
 * @param ac - candidate used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 * @returns the cached value after `JSONContentHelper.tryParse`
 */
private async getACL(ac: AccessCandidate, preparedNs: string): Promise<ACL | null | undefined> {
    const aclKey = `vectorDB:pinecone:namespace:${preparedNs}:acl`;
    const cachedValue = await this.cache.requester(ac).get(aclKey);

    return JSONContentHelper.create(cachedValue?.toString?.()).tryParse();
}
|
|
368
|
-
|
|
369
|
-
/**
 * Removes a namespace ACL entry from the cache.
 *
 * The cache call is awaited so that the returned promise settles only once
 * the deletion has finished, and so that a failure reaches the caller instead
 * of surfacing as an unhandled rejection.
 *
 * @param ac - candidate (cloned) used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 */
private async deleteACL(ac: AccessCandidate, preparedNs: string): Promise<void> {
    await this.cache.requester(AccessCandidate.clone(ac)).delete(`vectorDB:pinecone:namespace:${preparedNs}:acl`);
}
|
|
372
|
-
|
|
373
|
-
/**
 * Builds the namespace name used for a candidate.
 *
 * The name is trimmed, each whitespace character is replaced with `_`, and
 * the result is lower-cased. It is then prefixed with the candidate id; for
 * non-team candidates the id is itself prefixed with the first character of
 * the role.
 *
 * @param candidate - owner of the namespace
 * @param name - user-facing namespace name
 * @returns `<prefix>_<normalized name>`
 */
public constructNsName(candidate: AccessCandidate, name: string) {
    const normalizedName = name.trim().replace(/\s/g, '_').toLowerCase();

    // DO NOT add the role prefix for teams, to preserve backward compatibility
    const ownerPrefix = candidate.role === TAccessRole.Team ? candidate.id : candidate.role[0] + '_' + candidate.id;

    return `${ownerPrefix}_${normalizedName}`;
}
|
|
384
|
-
}
|
|
1
|
+
//==[ SRE: PineconeVectorDB ]======================
|
|
2
|
+
import { ACL } from '@sre/Security/AccessControl/ACL.class';
|
|
3
|
+
import { IAccessCandidate, IACL, TAccessLevel, TAccessRole } from '@sre/types/ACL.types';
|
|
4
|
+
import { AccessRequest } from '@sre/Security/AccessControl/AccessRequest.class';
|
|
5
|
+
import { AccessCandidate } from '@sre/Security/AccessControl/AccessCandidate.class';
|
|
6
|
+
import { SecureConnector } from '@sre/Security/SecureConnector.class';
|
|
7
|
+
import { VectorDBConnector, DeleteTarget } from '../VectorDBConnector';
|
|
8
|
+
import {
|
|
9
|
+
DatasourceDto,
|
|
10
|
+
IStorageVectorDataSource,
|
|
11
|
+
IStorageVectorNamespace,
|
|
12
|
+
IVectorDataSourceDto,
|
|
13
|
+
QueryOptions,
|
|
14
|
+
VectorsResultData,
|
|
15
|
+
} from '@sre/types/VectorDB.types';
|
|
16
|
+
import { Pinecone } from '@pinecone-database/pinecone';
|
|
17
|
+
import { ConnectorService } from '@sre/Core/ConnectorsService';
|
|
18
|
+
import { Logger } from '@sre/helpers/Log.helper';
|
|
19
|
+
import { NKVConnector } from '@sre/IO/NKV.service/NKVConnector';
|
|
20
|
+
import { AccountConnector } from '@sre/Security/Account.service/AccountConnector';
|
|
21
|
+
import { JSONContentHelper } from '@sre/helpers/JsonContent.helper';
|
|
22
|
+
import { CacheConnector } from '@sre/MemoryManager/Cache.service/CacheConnector';
|
|
23
|
+
import crypto from 'crypto';
|
|
24
|
+
import { BaseEmbedding, TEmbeddings } from '../embed/BaseEmbedding';
|
|
25
|
+
import { EmbeddingsFactory, SupportedProviders, SupportedModels } from '../embed';
|
|
26
|
+
import { chunkText } from '@sre/utils/string.utils';
|
|
27
|
+
import { jsonrepair } from 'jsonrepair';
|
|
28
|
+
|
|
29
|
+
const console = Logger('Pinecone VectorDB');
|
|
30
|
+
|
|
31
|
+
/** Settings consumed by the {@link PineconeVectorDB} constructor. */
export type PineconeConfig = {
    /** API key handed to the Pinecone client. */
    apiKey: string;
    /** Name of the Pinecone index the connector operates on. */
    indexName: string;
    /** Embeddings configuration (provider and params) used to create the embedder. */
    embeddings: TEmbeddings;
};
|
|
45
|
+
export class PineconeVectorDB extends VectorDBConnector {
|
|
46
|
+
public name = 'PineconeVectorDB';
|
|
47
|
+
public id = 'pinecone';
|
|
48
|
+
private client: Pinecone;
|
|
49
|
+
private indexName: string;
|
|
50
|
+
private cache: CacheConnector;
|
|
51
|
+
private accountConnector: AccountConnector;
|
|
52
|
+
private nkvConnector: NKVConnector;
|
|
53
|
+
public embedder: BaseEmbedding;
|
|
54
|
+
|
|
55
|
+
/**
 * Builds the connector from its settings.
 *
 * When `apiKey` or `indexName` is missing, a warning is logged and
 * construction stops early: the Pinecone client, the service connectors and
 * the embedder are left unset.
 *
 * Note: `_settings.embeddings` is updated in place so that
 * `params.dimensions` falls back to 1024 when it is absent.
 *
 * @param _settings - Pinecone API key, index name and embeddings configuration
 */
constructor(protected _settings: PineconeConfig) {
    super(_settings);

    const { apiKey, indexName } = _settings;
    if (!apiKey) {
        console.warn('Missing Pinecone API key : returning empty Pinecone connector');
        return;
    }
    if (!indexName) {
        console.warn('Missing Pinecone index name : returning empty Pinecone connector');
        return;
    }

    this.client = new Pinecone({ apiKey });
    console.info('Pinecone client initialized');
    console.info('Pinecone index name:', indexName);
    this.indexName = indexName;

    this.accountConnector = ConnectorService.getAccountConnector();
    this.cache = ConnectorService.getCacheConnector();
    this.nkvConnector = ConnectorService.getNKVConnector();

    // Default the embedding dimensions to 1024 when none are configured
    const embeddings = _settings.embeddings;
    if (!embeddings.params) {
        embeddings.params = { dimensions: 1024 };
    } else if (!embeddings.params.dimensions) {
        embeddings.params.dimensions = 1024;
    }

    this.embedder = EmbeddingsFactory.create(embeddings.provider, embeddings);
}
|
|
80
|
+
|
|
81
|
+
/**
 * Resolves the ACL that applies to a namespace.
 *
 * @param resourceId - user-facing namespace name
 * @param candidate - candidate requesting access; also scopes the namespace name
 * @returns the ACL stored in the cache for the namespace, or, when none is
 *          stored, a fresh ACL that makes the candidate the owner
 */
public async getResourceACL(resourceId: string, candidate: IAccessCandidate): Promise<ACL> {
    const preparedNs = this.constructNsName(candidate as AccessCandidate, resourceId);
    const storedAcl = await this.getACL(AccessCandidate.clone(candidate), preparedNs);

    // No stored ACL: the resource does not exist yet, so the candidate is
    // granted owner access in order to allow the resource creation.
    return storedAcl ? ACL.from(storedAcl) : new ACL().addAccess(candidate.role, candidate.id, TAccessLevel.Owner);
}
|
|
93
|
+
|
|
94
|
+
/**
 * Creates a namespace owned by the requesting candidate.
 *
 * Pinecone does not create explicit namespaces, so a reserved "skeleton"
 * vector is upserted to make the namespace come into existence. The vector
 * is flagged with `isSkeletonVector` so that it can be filtered out of query
 * results. The owner ACL is then stored in the cache under the prepared
 * namespace name.
 *
 * @param acRequest - access request; its candidate becomes the namespace owner
 * @param namespace - user-facing namespace name (also stored as `displayName`)
 * @param metadata - optional extra fields merged into the skeleton vector's
 *                   metadata; they may override `acl` and `displayName` but
 *                   never `isSkeletonVector`
 */
@SecureConnector.AccessControl
protected async createNamespace(acRequest: AccessRequest, namespace: string, metadata?: { [key: string]: any }): Promise<void> {
    const preparedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);
    const acl = new ACL().addAccess(acRequest.candidate.role, acRequest.candidate.id, TAccessLevel.Owner);

    await this.client
        .Index(this.indexName)
        .namespace(preparedNs)
        .upsert([
            {
                id: `_reserved_${preparedNs}`,
                values: this.embedder.dummyVector,
                metadata: {
                    acl: acl.serializedACL,
                    displayName: namespace,
                    ...metadata,
                    // Written last so caller-supplied metadata cannot clear the skeleton marker
                    isSkeletonVector: true,
                },
            },
        ]);

    await this.setACL(acRequest, preparedNs, acl.ACL);
}
|
|
127
|
+
|
|
128
|
+
/**
 * Tells whether the namespace is listed in the index statistics.
 *
 * @param acRequest - access request; its candidate scopes the namespace name
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @returns `true` when the prepared namespace name is a key of the `namespaces`
 *          map reported by `describeIndexStats`
 */
@SecureConnector.AccessControl
protected async namespaceExists(acRequest: AccessRequest, namespace: string): Promise<boolean> {
    const stats = await this.client.Index(this.indexName).describeIndexStats();
    const preparedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);

    // `namespaces` can be missing from the stats payload; treat that as "no namespaces"
    return Object.keys(stats.namespaces ?? {}).includes(preparedNs);
}
|
|
134
|
+
|
|
135
|
+
/**
 * Deletes every vector of a namespace and removes the namespace ACL.
 *
 * A `PineconeNotFoundError` raised by the bulk delete is logged as a warning
 * and otherwise ignored; any other error is rethrown.
 *
 * The ACL is removed using the prepared namespace name, which is the name it
 * is stored under when the namespace is created.
 *
 * @param acRequest - access request; its candidate scopes the namespace name
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 */
@SecureConnector.AccessControl
protected async deleteNamespace(acRequest: AccessRequest, namespace: string): Promise<void> {
    const preparedNs = this.constructNsName(acRequest.candidate as AccessCandidate, namespace);

    try {
        await this.client.Index(this.indexName).namespace(preparedNs).deleteAll();
    } catch (e) {
        const errorName = (e as { name?: unknown } | null | undefined)?.name;
        if (errorName !== 'PineconeNotFoundError') throw e;
        console.warn(`Namespace ${namespace} does not exist and was requested to be deleted`);
    }

    await this.deleteACL(AccessCandidate.clone(acRequest.candidate), preparedNs);
}
|
|
155
|
+
|
|
156
|
+
/**
 * Runs a similarity query against a namespace.
 *
 * A string query is embedded first; a numeric array is used as the query
 * vector as-is. One extra match is requested from Pinecone because the
 * namespace's skeleton vector may be among the results; skeleton vectors are
 * dropped and the list is then cut back to the requested size.
 *
 * @param acRequest - access request; its candidate scopes the namespace name and the embedding call
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param query - text to embed, or a ready-made query vector
 * @param options - query options; `topK` falls back to 10 when unset
 * @returns matches with id, values, text, parsed user metadata and score
 */
@SecureConnector.AccessControl
protected async search(
    acRequest: AccessRequest,
    namespace: string,
    query: string | number[],
    options: QueryOptions = {}
): Promise<VectorsResultData> {
    const candidate = acRequest.candidate as AccessCandidate;
    const pineconeIndex = this.client.Index(this.indexName).namespace(this.constructNsName(candidate, namespace));

    const vector = typeof query === 'string' ? await this.embedder.embedText(query, candidate) : query;

    const requestedTopK = options.topK || 10;

    const results = await pineconeIndex.query({
        topK: requestedTopK + 1, //* one extra in case the skeleton vector is included
        vector: vector as number[],
        includeMetadata: true,
        includeValues: true,
    });

    const matches = [];

    for (const match of results.matches) {
        if (match.metadata?.isSkeletonVector) continue;

        // User metadata is stored as a serialized string; parse it back when present
        const storedUserMetadata = match.metadata?.[this.USER_METADATA_KEY];
        const userMetadata = storedUserMetadata ? JSONContentHelper.create(storedUserMetadata.toString()).tryParse() : storedUserMetadata;

        matches.push({
            id: match.id,
            values: match.values,
            text: match.metadata?.text as string | undefined,
            metadata: userMetadata as Record<string, any> | undefined,
            score: match.score,
        });
    }

    // When no skeleton vector was filtered out, the extra match has to be removed.
    // The limit falls back to the default when `topK` is unset, so the extra
    // match is trimmed in that case too.
    return matches.slice(0, options.topK ?? requestedTopK);
}
|
|
201
|
+
|
|
202
|
+
/**
 * Embeds one or more sources and upserts them into a namespace.
 *
 * All sources must be detected as the same source type, and that type must
 * be neither `'unknown'` nor `'url'`. When the namespace is not yet listed
 * for the index, an owner ACL for the requesting candidate is stored under
 * the prepared namespace name, the same name `getResourceACL` looks it up by.
 *
 * @param acRequest - access request; its candidate scopes the namespace name and the embedding call
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param sourceWrapper - a single source or an array of sources
 * @returns ids of the upserted vectors; an empty array when no source is given
 * @throws Error when the sources have mixed types or an unsupported type
 */
@SecureConnector.AccessControl
protected async insert(
    acRequest: AccessRequest,
    namespace: string,
    sourceWrapper: IVectorDataSourceDto | IVectorDataSourceDto[]
): Promise<string[]> {
    const sources = Array.isArray(sourceWrapper) ? sourceWrapper : [sourceWrapper];
    // Nothing to insert: avoids dereferencing a missing first element below
    if (sources.length === 0) return [];

    // make sure that all sources are of the same type (source.source)
    const sourceType = this.embedder.detectSourceType(sources[0].source);
    if (sources.some((s) => this.embedder.detectSourceType(s.source) !== sourceType)) {
        throw new Error('All sources must be of the same type');
    }
    if (sourceType === 'unknown' || sourceType === 'url') throw new Error('Invalid source type');

    const accessCandidate = acRequest.candidate;
    const preparedNs = this.constructNsName(accessCandidate as AccessCandidate, namespace);

    const transformedSource = await this.embedder.transformSource(sources, sourceType, accessCandidate as AccessCandidate);
    const preparedSource = transformedSource.map((s) => ({
        id: s.id,
        values: s.source as number[],
        metadata: s.metadata,
    }));

    // Must be checked before the upsert: the upsert itself makes the namespace exist
    const isNewNs = !(await this.requester(AccessCandidate.clone(accessCandidate)).namespaceExists(namespace));

    await this.client.Index(this.indexName).namespace(preparedNs).upsert(preparedSource);

    if (isNewNs) {
        const acl = new ACL().addAccess(accessCandidate.role, accessCandidate.id, TAccessLevel.Owner).ACL;
        await this.setACL(acRequest, preparedNs, acl);
    }

    return preparedSource.map((s) => s.id);
}
|
|
241
|
+
|
|
242
|
+
/**
 * Deletes vectors from a namespace by id.
 *
 * `deleteTarget` may be a single id or an array of ids. Arrays are objects in
 * JavaScript, so they are told apart explicitly from a filter object.
 * Deleting by filter is not implemented yet: a warning is logged and nothing
 * is deleted.
 *
 * @param acRequest - access request; its candidate scopes the namespace name
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param deleteTarget - vector id, array of vector ids, or a filter object
 */
@SecureConnector.AccessControl
protected async delete(acRequest: AccessRequest, namespace: string, deleteTarget: DeleteTarget): Promise<void> {
    if (typeof deleteTarget === 'object' && !Array.isArray(deleteTarget)) {
        // TODO: handle delete by filter logic
        console.warn('Delete by filter is not implemented for Pinecone, no vectors were deleted');
        return;
    }

    const ids = Array.isArray(deleteTarget) ? deleteTarget : [deleteTarget];
    // Nothing to delete: skip the remote call
    if (ids.length === 0) return;

    await this.client
        .Index(this.indexName)
        .namespace(this.constructNsName(acRequest.candidate as AccessCandidate, namespace))
        .deleteMany(ids);
}
|
|
257
|
+
|
|
258
|
+
/**
 * Splits a datasource's text into chunks, inserts the chunks as vectors and
 * records the datasource in the NKV store.
 *
 * Each chunk gets a vector id of the form `<datasourceId>_<uuid>`. When the
 * datasource has no id a random UUID is used, and when it has no label it is
 * named `'Untitled'`.
 *
 * @param acRequest - access request; its candidate owns the datasource
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param datasource - text plus optional id, label, metadata and chunking settings
 * @returns the datasource record that was written to the NKV store
 */
@SecureConnector.AccessControl
protected async createDatasource(acRequest: AccessRequest, namespace: string, datasource: DatasourceDto): Promise<IStorageVectorDataSource> {
    const { candidate } = acRequest;
    const ownerAcl = new ACL().addAccess(candidate.role, candidate.id, TAccessLevel.Owner);
    const dsId = datasource.id || crypto.randomUUID();
    const formattedNs = this.constructNsName(candidate as AccessCandidate, namespace);

    const chunks = chunkText(datasource.text, {
        chunkSize: datasource.chunkSize,
        chunkOverlap: datasource.chunkOverlap,
    });
    const label = datasource.label || 'Untitled';

    // One vector id per chunk, all sharing the datasource id as prefix
    const chunkIds = Array.from({ length: chunks.length }, () => `${dsId}_${crypto.randomUUID()}`);

    const vectorSources: IVectorDataSourceDto[] = chunks.map((chunk, idx) => ({
        id: chunkIds[idx],
        source: chunk,
        metadata: {
            acl: ownerAcl.serializedACL,
            namespaceId: formattedNs,
            datasourceId: dsId,
            datasourceLabel: label,
            user_metadata: datasource.metadata ? jsonrepair(JSON.stringify(datasource.metadata)) : undefined,
        },
    }));

    const vectorIds = await this.insert(acRequest, namespace, vectorSources);

    const record: IStorageVectorDataSource = {
        namespaceId: formattedNs,
        candidateId: candidate.id,
        candidateRole: candidate.role,
        name: datasource.label || 'Untitled',
        metadata: datasource.metadata ? jsonrepair(JSON.stringify(datasource.metadata)) : undefined,
        text: datasource.text,
        vectorIds,
        id: dsId,
    };

    const storeKey = `vectorDB:${this.id}:namespaces:${formattedNs}:datasources`;
    await this.nkvConnector.requester(candidate as AccessCandidate).set(storeKey, dsId, JSON.stringify(record));

    return record;
}
|
|
305
|
+
|
|
306
|
+
/**
 * Deletes a datasource: its vectors first, then its record in the NKV store.
 *
 * The stored record is loaded to obtain the vector ids, which are passed to
 * `delete`; the record itself is removed afterwards.
 *
 * @param acRequest - access request; its candidate scopes the namespace name and the NKV requester
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param datasourceId - id the record was stored under
 * @throws Error when the stored value does not parse to an object
 */
@SecureConnector.AccessControl
protected async deleteDatasource(acRequest: AccessRequest, namespace: string, datasourceId: string): Promise<void> {
    const candidate = acRequest.candidate as AccessCandidate;
    const storeKey = `vectorDB:${this.id}:namespaces:${this.constructNsName(candidate, namespace)}:datasources`;

    const rawRecord = await this.nkvConnector.requester(candidate).get(storeKey, datasourceId);
    const record: IStorageVectorDataSource = JSONContentHelper.create(rawRecord?.toString()).tryParse();

    const isUsableRecord = Boolean(record) && typeof record === 'object';
    if (!isUsableRecord) {
        throw new Error(`Data source not found with id: ${datasourceId}`);
    }

    await this.delete(acRequest, namespace, record.vectorIds || []);

    await this.nkvConnector.requester(candidate).delete(storeKey, datasourceId);
}
|
|
330
|
+
|
|
331
|
+
/**
 * Lists the datasource records stored for a namespace.
 *
 * Reads every entry under the namespace's datasource key in the NKV store and
 * runs each entry's `data` payload through `JSONContentHelper`.
 *
 * @param acRequest - access request; its candidate scopes both the namespace name and the NKV requester
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @returns one parsed record per entry returned by the NKV store
 */
@SecureConnector.AccessControl
protected async listDatasources(acRequest: AccessRequest, namespace: string): Promise<IStorageVectorDataSource[]> {
    const candidate = acRequest.candidate as AccessCandidate;
    const storeKey = `vectorDB:${this.id}:namespaces:${this.constructNsName(candidate, namespace)}:datasources`;
    const entries = await this.nkvConnector.requester(candidate).list(storeKey);

    return entries.map((entry) => JSONContentHelper.create(entry.data?.toString()).tryParse() as IStorageVectorDataSource);
}
|
|
343
|
+
|
|
344
|
+
/**
 * Loads a single datasource record from the NKV store.
 *
 * @param acRequest - access request; its candidate scopes both the namespace name and the NKV requester
 * @param namespace - user-facing namespace name (normalized through `constructNsName`)
 * @param datasourceId - id the record was stored under
 * @returns the stored value after it has been run through `JSONContentHelper.tryParse`
 */
@SecureConnector.AccessControl
protected async getDatasource(acRequest: AccessRequest, namespace: string, datasourceId: string): Promise<IStorageVectorDataSource> {
    const candidate = acRequest.candidate as AccessCandidate;
    const storeKey = `vectorDB:${this.id}:namespaces:${this.constructNsName(candidate, namespace)}:datasources`;
    const rawRecord = await this.nkvConnector.requester(candidate).get(storeKey, datasourceId);

    return JSONContentHelper.create(rawRecord?.toString()).tryParse() as IStorageVectorDataSource;
}
|
|
356
|
+
|
|
357
|
+
/**
 * Stores a namespace ACL in the cache as a JSON string.
 *
 * @param acRequest - access request whose candidate (cloned) is used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 * @param acl - ACL object to serialize and store
 */
private async setACL(acRequest: AccessRequest, preparedNs: string, acl: IACL): Promise<void> {
    const cacheRequester = this.cache.requester(AccessCandidate.clone(acRequest.candidate));
    const aclKey = `vectorDB:pinecone:namespace:${preparedNs}:acl`;

    await cacheRequester.set(aclKey, JSON.stringify(acl));
}
|
|
362
|
+
|
|
363
|
+
/**
 * Reads a namespace ACL from the cache.
 *
 * @param ac - candidate used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 * @returns the cached value after `JSONContentHelper.tryParse`
 */
private async getACL(ac: AccessCandidate, preparedNs: string): Promise<ACL | null | undefined> {
    const aclKey = `vectorDB:pinecone:namespace:${preparedNs}:acl`;
    const cachedValue = await this.cache.requester(ac).get(aclKey);

    return JSONContentHelper.create(cachedValue?.toString?.()).tryParse();
}
|
|
368
|
+
|
|
369
|
+
/**
 * Removes a namespace ACL entry from the cache.
 *
 * The cache call is awaited so that the returned promise settles only once
 * the deletion has finished, and so that a failure reaches the caller instead
 * of surfacing as an unhandled rejection.
 *
 * @param ac - candidate (cloned) used as the cache requester
 * @param preparedNs - namespace name used to build the cache key
 */
private async deleteACL(ac: AccessCandidate, preparedNs: string): Promise<void> {
    await this.cache.requester(AccessCandidate.clone(ac)).delete(`vectorDB:pinecone:namespace:${preparedNs}:acl`);
}
|
|
372
|
+
|
|
373
|
+
/**
 * Builds the namespace name used for a candidate.
 *
 * The name is trimmed, each whitespace character is replaced with `_`, and
 * the result is lower-cased. It is then prefixed with the candidate id; for
 * non-team candidates the id is itself prefixed with the first character of
 * the role.
 *
 * @param candidate - owner of the namespace
 * @param name - user-facing namespace name
 * @returns `<prefix>_<normalized name>`
 */
public constructNsName(candidate: AccessCandidate, name: string) {
    const normalizedName = name.trim().replace(/\s/g, '_').toLowerCase();

    // DO NOT add the role prefix for teams, to preserve backward compatibility
    const ownerPrefix = candidate.role === TAccessRole.Team ? candidate.id : candidate.role[0] + '_' + candidate.id;

    return `${ownerPrefix}_${normalizedName}`;
}
|
|
384
|
+
}
|