veadk-python 0.2.8__py3-none-any.whl → 0.2.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of veadk-python might be problematic. Click here for more details.
- veadk/agent.py +3 -0
- veadk/cli/cli_prompt.py +9 -2
- veadk/cli/cli_web.py +3 -0
- veadk/configs/database_configs.py +9 -0
- veadk/consts.py +7 -0
- veadk/evaluation/adk_evaluator/adk_evaluator.py +5 -2
- veadk/evaluation/base_evaluator.py +36 -25
- veadk/evaluation/deepeval_evaluator/deepeval_evaluator.py +5 -3
- veadk/integrations/ve_prompt_pilot/ve_prompt_pilot.py +9 -3
- veadk/integrations/ve_tls/utils.py +1 -2
- veadk/integrations/ve_tls/ve_tls.py +9 -5
- veadk/integrations/ve_tos/ve_tos.py +538 -67
- veadk/knowledgebase/backends/base_backend.py +4 -4
- veadk/knowledgebase/backends/vikingdb_knowledge_backend.py +162 -50
- veadk/knowledgebase/entry.py +25 -0
- veadk/knowledgebase/knowledgebase.py +19 -4
- veadk/memory/long_term_memory.py +20 -7
- veadk/memory/long_term_memory_backends/mem0_backend.py +129 -0
- veadk/runner.py +12 -19
- veadk/tools/builtin_tools/generate_image.py +355 -0
- veadk/tools/builtin_tools/image_edit.py +56 -16
- veadk/tools/builtin_tools/image_generate.py +51 -15
- veadk/tools/builtin_tools/video_generate.py +41 -41
- veadk/tools/load_knowledgebase_tool.py +2 -8
- veadk/tracing/telemetry/attributes/extractors/llm_attributes_extractors.py +1 -1
- veadk/tracing/telemetry/opentelemetry_tracer.py +8 -2
- veadk/version.py +1 -1
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/METADATA +13 -2
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/RECORD +33 -30
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/WHEEL +0 -0
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/entry_points.txt +0 -0
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/licenses/LICENSE +0 -0
- {veadk_python-0.2.8.dist-info → veadk_python-0.2.9.dist-info}/top_level.txt +0 -0
|
@@ -29,19 +29,19 @@ class BaseKnowledgebaseBackend(ABC, BaseModel):
|
|
|
29
29
|
"""
|
|
30
30
|
|
|
31
31
|
@abstractmethod
|
|
32
|
-
def add_from_directory(self, directory: str, **kwargs) -> bool:
|
|
32
|
+
def add_from_directory(self, directory: str, *args, **kwargs) -> bool:
|
|
33
33
|
"""Add knowledge from file path to knowledgebase"""
|
|
34
34
|
|
|
35
35
|
@abstractmethod
|
|
36
|
-
def add_from_files(self, files: list[str], **kwargs) -> bool:
|
|
36
|
+
def add_from_files(self, files: list[str], *args, **kwargs) -> bool:
|
|
37
37
|
"""Add knowledge (e.g, documents, strings, ...) to knowledgebase"""
|
|
38
38
|
|
|
39
39
|
@abstractmethod
|
|
40
|
-
def add_from_text(self, text: str | list[str], **kwargs) -> bool:
|
|
40
|
+
def add_from_text(self, text: str | list[str], *args, **kwargs) -> bool:
|
|
41
41
|
"""Add knowledge from text to knowledgebase"""
|
|
42
42
|
|
|
43
43
|
@abstractmethod
|
|
44
|
-
def search(self, **kwargs) -> list:
|
|
44
|
+
def search(self, *args, **kwargs) -> list:
|
|
45
45
|
"""Search knowledge from knowledgebase"""
|
|
46
46
|
|
|
47
47
|
# Optional methods for future use:
|
|
@@ -13,6 +13,7 @@
|
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
15
|
import asyncio
|
|
16
|
+
import json
|
|
16
17
|
import re
|
|
17
18
|
from pathlib import Path
|
|
18
19
|
from typing import Any, Literal
|
|
@@ -24,9 +25,9 @@ from typing_extensions import override
|
|
|
24
25
|
import veadk.config # noqa E401
|
|
25
26
|
from veadk.config import getenv
|
|
26
27
|
from veadk.configs.database_configs import NormalTOSConfig, TOSConfig
|
|
27
|
-
from veadk.consts import DEFAULT_TOS_BUCKET_NAME
|
|
28
28
|
from veadk.knowledgebase.backends.base_backend import BaseKnowledgebaseBackend
|
|
29
29
|
from veadk.knowledgebase.backends.utils import build_vikingdb_knowledgebase_request
|
|
30
|
+
from veadk.knowledgebase.entry import KnowledgebaseEntry
|
|
30
31
|
from veadk.utils.logger import get_logger
|
|
31
32
|
from veadk.utils.misc import formatted_timestamp
|
|
32
33
|
|
|
@@ -48,13 +49,6 @@ def _read_file_to_bytes(file_path: str) -> tuple[bytes, str]:
|
|
|
48
49
|
return file_content, file_name
|
|
49
50
|
|
|
50
51
|
|
|
51
|
-
def _extract_tos_attributes(**kwargs) -> tuple[str, str]:
|
|
52
|
-
"""Extract TOS attributes from kwargs"""
|
|
53
|
-
tos_bucket_name = kwargs.get("tos_bucket_name", DEFAULT_TOS_BUCKET_NAME)
|
|
54
|
-
tos_bucket_path = kwargs.get("tos_bucket_path", "knowledgebase")
|
|
55
|
-
return tos_bucket_name, tos_bucket_path
|
|
56
|
-
|
|
57
|
-
|
|
58
52
|
def get_files_in_directory(directory: str):
|
|
59
53
|
dir_path = Path(directory)
|
|
60
54
|
if not dir_path.is_dir():
|
|
@@ -109,15 +103,27 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
109
103
|
)
|
|
110
104
|
|
|
111
105
|
@override
|
|
112
|
-
def add_from_directory(
|
|
113
|
-
|
|
106
|
+
def add_from_directory(
|
|
107
|
+
self,
|
|
108
|
+
directory: str,
|
|
109
|
+
tos_bucket_name: str | None = None,
|
|
110
|
+
tos_bucket_path: str = "knowledgebase",
|
|
111
|
+
metadata: dict | None = None,
|
|
112
|
+
**kwargs,
|
|
113
|
+
) -> bool:
|
|
114
|
+
"""Add knowledge from a directory to the knowledgebase.
|
|
115
|
+
|
|
114
116
|
Args:
|
|
115
|
-
directory
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
117
|
+
directory (str): The directory to add to knowledgebase.
|
|
118
|
+
tos_bucket_name (str | None, optional): The bucket name of TOS. Defaults to None.
|
|
119
|
+
tos_bucket_path (str, optional): The path of TOS bucket. Defaults to "knowledgebase".
|
|
120
|
+
metadata (dict | None, optional): The metadata of the files. Defaults to None.
|
|
121
|
+
**kwargs: Additional keyword arguments.
|
|
122
|
+
|
|
123
|
+
Returns:
|
|
124
|
+
bool: True if successful, False otherwise.
|
|
119
125
|
"""
|
|
120
|
-
tos_bucket_name
|
|
126
|
+
tos_bucket_name = tos_bucket_name or self.tos_config.bucket
|
|
121
127
|
files = get_files_in_directory(directory=directory)
|
|
122
128
|
for _file in files:
|
|
123
129
|
content, file_name = _read_file_to_bytes(_file)
|
|
@@ -125,40 +131,64 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
125
131
|
content,
|
|
126
132
|
tos_bucket_name=tos_bucket_name,
|
|
127
133
|
object_key=f"{tos_bucket_path}/{file_name}",
|
|
134
|
+
metadata=metadata,
|
|
128
135
|
)
|
|
129
136
|
self._add_doc(tos_url=tos_url)
|
|
130
137
|
return True
|
|
131
138
|
|
|
132
139
|
@override
|
|
133
|
-
def add_from_files(
|
|
134
|
-
|
|
140
|
+
def add_from_files(
|
|
141
|
+
self,
|
|
142
|
+
files: list[str],
|
|
143
|
+
tos_bucket_name: str | None = None,
|
|
144
|
+
tos_bucket_path: str = "knowledgebase",
|
|
145
|
+
metadata: dict | None = None,
|
|
146
|
+
**kwargs,
|
|
147
|
+
) -> bool:
|
|
148
|
+
"""Add knowledge from a directory to the knowledgebase.
|
|
149
|
+
|
|
135
150
|
Args:
|
|
136
|
-
files
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
151
|
+
files (list[str]): The files to add to knowledgebase.
|
|
152
|
+
tos_bucket_name (str | None, optional): The bucket name of TOS. Defaults to None.
|
|
153
|
+
tos_bucket_path (str, optional): The path of TOS bucket. Defaults to "knowledgebase".
|
|
154
|
+
metadata (dict | None, optional): The metadata of the files. Defaults to None.
|
|
155
|
+
**kwargs: Additional keyword arguments.
|
|
156
|
+
|
|
157
|
+
Returns:
|
|
158
|
+
bool: True if successful, False otherwise.
|
|
140
159
|
"""
|
|
141
|
-
tos_bucket_name
|
|
160
|
+
tos_bucket_name = tos_bucket_name or self.tos_config.bucket
|
|
142
161
|
for _file in files:
|
|
143
162
|
content, file_name = _read_file_to_bytes(_file)
|
|
144
163
|
tos_url = self._upload_bytes_to_tos(
|
|
145
164
|
content,
|
|
146
165
|
tos_bucket_name=tos_bucket_name,
|
|
147
166
|
object_key=f"{tos_bucket_path}/{file_name}",
|
|
167
|
+
metadata=metadata,
|
|
148
168
|
)
|
|
149
169
|
self._add_doc(tos_url=tos_url)
|
|
150
170
|
return True
|
|
151
171
|
|
|
152
172
|
@override
|
|
153
|
-
def add_from_text(
|
|
154
|
-
|
|
173
|
+
def add_from_text(
|
|
174
|
+
self,
|
|
175
|
+
text: str | list[str],
|
|
176
|
+
tos_bucket_name: str | None = None,
|
|
177
|
+
tos_bucket_path: str = "knowledgebase",
|
|
178
|
+
metadata: dict | None = None,
|
|
179
|
+
**kwargs,
|
|
180
|
+
) -> bool:
|
|
181
|
+
"""Add knowledge from text to the knowledgebase.
|
|
182
|
+
|
|
155
183
|
Args:
|
|
156
|
-
text
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
184
|
+
text (str | list[str]): The text to add to knowledgebase.
|
|
185
|
+
tos_bucket_name (str | None, optional): The bucket name of TOS. Defaults to None.
|
|
186
|
+
tos_bucket_path (str, optional): The path of TOS bucket. Defaults to "knowledgebase".
|
|
187
|
+
|
|
188
|
+
Returns:
|
|
189
|
+
bool: True if successful, False otherwise.
|
|
160
190
|
"""
|
|
161
|
-
tos_bucket_name
|
|
191
|
+
tos_bucket_name = tos_bucket_name or self.tos_config.bucket
|
|
162
192
|
if isinstance(text, list):
|
|
163
193
|
object_keys = kwargs.get(
|
|
164
194
|
"tos_object_keys",
|
|
@@ -170,7 +200,7 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
170
200
|
for _text, _object_key in zip(text, object_keys):
|
|
171
201
|
_content = _text.encode("utf-8")
|
|
172
202
|
tos_url = self._upload_bytes_to_tos(
|
|
173
|
-
_content, tos_bucket_name, _object_key
|
|
203
|
+
_content, tos_bucket_name, _object_key, metadata=metadata
|
|
174
204
|
)
|
|
175
205
|
self._add_doc(tos_url=tos_url)
|
|
176
206
|
return True
|
|
@@ -179,26 +209,42 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
179
209
|
object_key = kwargs.get(
|
|
180
210
|
"object_key", f"veadk/knowledgebase/{formatted_timestamp()}.txt"
|
|
181
211
|
)
|
|
182
|
-
tos_url = self._upload_bytes_to_tos(
|
|
212
|
+
tos_url = self._upload_bytes_to_tos(
|
|
213
|
+
content, tos_bucket_name, object_key, metadata=metadata
|
|
214
|
+
)
|
|
183
215
|
self._add_doc(tos_url=tos_url)
|
|
184
216
|
else:
|
|
185
217
|
raise ValueError("text must be str or list[str]")
|
|
186
218
|
return True
|
|
187
219
|
|
|
188
|
-
def add_from_bytes(
|
|
189
|
-
|
|
220
|
+
def add_from_bytes(
|
|
221
|
+
self,
|
|
222
|
+
content: bytes,
|
|
223
|
+
file_name: str,
|
|
224
|
+
tos_bucket_name: str | None = None,
|
|
225
|
+
tos_bucket_path: str = "knowledgebase",
|
|
226
|
+
metadata: dict | None = None,
|
|
227
|
+
**kwargs,
|
|
228
|
+
) -> bool:
|
|
229
|
+
"""Add knowledge from bytes to the knowledgebase.
|
|
230
|
+
|
|
190
231
|
Args:
|
|
191
|
-
content
|
|
192
|
-
file_name
|
|
193
|
-
|
|
194
|
-
|
|
195
|
-
|
|
232
|
+
content (bytes): The content to add to knowledgebase.
|
|
233
|
+
file_name (str): The file name of the content.
|
|
234
|
+
tos_bucket_name (str | None, optional): The bucket name of TOS. Defaults to None.
|
|
235
|
+
tos_bucket_path (str, optional): The path of TOS bucket. Defaults to "knowledgebase".
|
|
236
|
+
metadata (dict | None, optional): The metadata of the files. Defaults to None.
|
|
237
|
+
**kwargs: Additional keyword arguments.
|
|
238
|
+
|
|
239
|
+
Returns:
|
|
240
|
+
bool: True if successful, False otherwise.
|
|
196
241
|
"""
|
|
197
|
-
tos_bucket_name
|
|
242
|
+
tos_bucket_name = tos_bucket_name or self.tos_config.bucket
|
|
198
243
|
tos_url = self._upload_bytes_to_tos(
|
|
199
244
|
content,
|
|
200
245
|
tos_bucket_name=tos_bucket_name,
|
|
201
246
|
object_key=f"{tos_bucket_path}/{file_name}",
|
|
247
|
+
metadata=metadata,
|
|
202
248
|
)
|
|
203
249
|
response = self._add_doc(tos_url=tos_url)
|
|
204
250
|
if response["code"] == 0:
|
|
@@ -206,8 +252,16 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
206
252
|
return False
|
|
207
253
|
|
|
208
254
|
@override
|
|
209
|
-
def search(
|
|
210
|
-
|
|
255
|
+
def search(
|
|
256
|
+
self,
|
|
257
|
+
query: str,
|
|
258
|
+
top_k: int = 5,
|
|
259
|
+
metadata: dict | None = None,
|
|
260
|
+
rerank: bool = True,
|
|
261
|
+
) -> list:
|
|
262
|
+
return self._search_knowledge(
|
|
263
|
+
query=query, top_k=top_k, metadata=metadata, rerank=rerank
|
|
264
|
+
)
|
|
211
265
|
|
|
212
266
|
def delete_collection(self) -> bool:
|
|
213
267
|
DELETE_COLLECTION_PATH = "/api/knowledge/collection/delete"
|
|
@@ -330,7 +384,7 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
330
384
|
response = self._do_request(
|
|
331
385
|
body={
|
|
332
386
|
"name": self.index,
|
|
333
|
-
"project":
|
|
387
|
+
"project": self.volcengine_project,
|
|
334
388
|
"description": "Created by Volcengine Agent Development Kit (VeADK).",
|
|
335
389
|
},
|
|
336
390
|
path=CREATE_COLLECTION_PATH,
|
|
@@ -343,10 +397,27 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
343
397
|
)
|
|
344
398
|
|
|
345
399
|
def _upload_bytes_to_tos(
|
|
346
|
-
self,
|
|
400
|
+
self,
|
|
401
|
+
content: bytes,
|
|
402
|
+
tos_bucket_name: str,
|
|
403
|
+
object_key: str,
|
|
404
|
+
metadata: dict | None = None,
|
|
347
405
|
) -> str:
|
|
406
|
+
# Here, we set the metadata via the TOS object, ref: https://www.volcengine.com/docs/84313/1254624
|
|
348
407
|
self._tos_client.bucket_name = tos_bucket_name
|
|
349
|
-
|
|
408
|
+
coro = self._tos_client.upload(
|
|
409
|
+
object_key=object_key,
|
|
410
|
+
bucket_name=tos_bucket_name,
|
|
411
|
+
data=content,
|
|
412
|
+
metadata=metadata,
|
|
413
|
+
)
|
|
414
|
+
try:
|
|
415
|
+
loop = asyncio.get_running_loop()
|
|
416
|
+
loop.run_until_complete(
|
|
417
|
+
coro
|
|
418
|
+
) if not loop.is_running() else asyncio.ensure_future(coro)
|
|
419
|
+
except RuntimeError:
|
|
420
|
+
asyncio.run(coro)
|
|
350
421
|
return f"{self._tos_client.bucket_name}/{object_key}"
|
|
351
422
|
|
|
352
423
|
def _add_doc(self, tos_url: str) -> Any:
|
|
@@ -355,7 +426,7 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
355
426
|
response = self._do_request(
|
|
356
427
|
body={
|
|
357
428
|
"collection_name": self.index,
|
|
358
|
-
"project":
|
|
429
|
+
"project": self.volcengine_project,
|
|
359
430
|
"add_type": "tos",
|
|
360
431
|
"tos_path": tos_url,
|
|
361
432
|
},
|
|
@@ -364,14 +435,43 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
364
435
|
)
|
|
365
436
|
return response
|
|
366
437
|
|
|
367
|
-
def _search_knowledge(
|
|
438
|
+
def _search_knowledge(
|
|
439
|
+
self,
|
|
440
|
+
query: str,
|
|
441
|
+
top_k: int = 5,
|
|
442
|
+
metadata: dict | None = None,
|
|
443
|
+
rerank: bool = True,
|
|
444
|
+
chunk_diffusion_count: int | None = 3,
|
|
445
|
+
) -> list[KnowledgebaseEntry]:
|
|
368
446
|
SEARCH_KNOWLEDGE_PATH = "/api/knowledge/collection/search_knowledge"
|
|
369
447
|
|
|
448
|
+
query_param = (
|
|
449
|
+
{
|
|
450
|
+
"doc_filter": {
|
|
451
|
+
"op": "and",
|
|
452
|
+
"conds": [
|
|
453
|
+
{"op": "must", "field": str(k), "conds": [str(v)]}
|
|
454
|
+
for k, v in metadata.items()
|
|
455
|
+
],
|
|
456
|
+
}
|
|
457
|
+
}
|
|
458
|
+
if metadata
|
|
459
|
+
else None
|
|
460
|
+
)
|
|
461
|
+
|
|
462
|
+
post_precessing = {
|
|
463
|
+
"rerank_swich": rerank,
|
|
464
|
+
"chunk_diffusion_count": chunk_diffusion_count,
|
|
465
|
+
}
|
|
466
|
+
|
|
370
467
|
response = self._do_request(
|
|
371
468
|
body={
|
|
372
469
|
"name": self.index,
|
|
470
|
+
"project": self.volcengine_project,
|
|
373
471
|
"query": query,
|
|
374
472
|
"limit": top_k,
|
|
473
|
+
"query_param": query_param,
|
|
474
|
+
"post_processing": post_precessing,
|
|
375
475
|
},
|
|
376
476
|
path=SEARCH_KNOWLEDGE_PATH,
|
|
377
477
|
method="POST",
|
|
@@ -382,11 +482,19 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
382
482
|
f"Error during knowledge search: {response.get('code')}, message: {response.get('message')}"
|
|
383
483
|
)
|
|
384
484
|
|
|
385
|
-
|
|
485
|
+
entries = []
|
|
486
|
+
for result in response.get("data", {}).get("result_list", []):
|
|
487
|
+
doc_meta_raw_str = result.get("doc_info", {}).get("doc_meta")
|
|
488
|
+
doc_meta_list = json.loads(doc_meta_raw_str) if doc_meta_raw_str else []
|
|
489
|
+
metadata = {}
|
|
490
|
+
for meta in doc_meta_list:
|
|
491
|
+
metadata[meta["field_name"]] = meta["field_value"]
|
|
386
492
|
|
|
387
|
-
|
|
388
|
-
|
|
389
|
-
|
|
493
|
+
entries.append(
|
|
494
|
+
KnowledgebaseEntry(content=result.get("content", ""), metadata=metadata)
|
|
495
|
+
)
|
|
496
|
+
|
|
497
|
+
return entries
|
|
390
498
|
|
|
391
499
|
def _do_request(
|
|
392
500
|
self,
|
|
@@ -409,4 +517,8 @@ class VikingDBKnowledgeBackend(BaseKnowledgebaseBackend):
|
|
|
409
517
|
headers=request.headers,
|
|
410
518
|
data=request.body,
|
|
411
519
|
)
|
|
520
|
+
if not response.ok:
|
|
521
|
+
logger.error(
|
|
522
|
+
f"VikingDBKnowledgeBackend error during request: {response.json()}"
|
|
523
|
+
)
|
|
412
524
|
return response.json()
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
# Copyright (c) 2025 Beijing Volcano Engine Technology Co., Ltd. and/or its affiliates.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
|
|
15
|
+
from pydantic import BaseModel
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
class KnowledgebaseEntry(BaseModel):
|
|
19
|
+
"""Represents a single entry in the knowledgebase."""
|
|
20
|
+
|
|
21
|
+
# The main content of the knowledgebase entry.
|
|
22
|
+
content: str
|
|
23
|
+
|
|
24
|
+
# Optional metadata associated with the entry.
|
|
25
|
+
metadata: dict | None = None
|
|
@@ -18,6 +18,7 @@ from pydantic import BaseModel, Field
|
|
|
18
18
|
from typing_extensions import Union
|
|
19
19
|
|
|
20
20
|
from veadk.knowledgebase.backends.base_backend import BaseKnowledgebaseBackend
|
|
21
|
+
from veadk.knowledgebase.entry import KnowledgebaseEntry
|
|
21
22
|
from veadk.utils.logger import get_logger
|
|
22
23
|
|
|
23
24
|
logger = get_logger(__name__)
|
|
@@ -72,8 +73,8 @@ class KnowledgeBase(BaseModel):
|
|
|
72
73
|
"""Configuration for the backend"""
|
|
73
74
|
|
|
74
75
|
top_k: int = 10
|
|
75
|
-
"""Number of top similar documents to retrieve during search.
|
|
76
|
-
|
|
76
|
+
"""Number of top similar documents to retrieve during search.
|
|
77
|
+
|
|
77
78
|
Default is 10."""
|
|
78
79
|
|
|
79
80
|
app_name: str = ""
|
|
@@ -130,11 +131,25 @@ class KnowledgeBase(BaseModel):
|
|
|
130
131
|
"""Add knowledge from text to knowledgebase"""
|
|
131
132
|
return self._backend.add_from_text(text=text, **kwargs)
|
|
132
133
|
|
|
133
|
-
def search(self, query: str, top_k: int = 0, **kwargs) -> list[
|
|
134
|
+
def search(self, query: str, top_k: int = 0, **kwargs) -> list[KnowledgebaseEntry]:
|
|
134
135
|
"""Search knowledge from knowledgebase"""
|
|
135
136
|
if top_k == 0:
|
|
136
137
|
top_k = self.top_k
|
|
137
|
-
|
|
138
|
+
|
|
139
|
+
_entries = self._backend.search(query=query, top_k=top_k, **kwargs)
|
|
140
|
+
|
|
141
|
+
entries = []
|
|
142
|
+
for entry in _entries:
|
|
143
|
+
if isinstance(entry, KnowledgebaseEntry):
|
|
144
|
+
entries.append(entry)
|
|
145
|
+
elif isinstance(entry, str):
|
|
146
|
+
entries.append(KnowledgebaseEntry(content=entry))
|
|
147
|
+
else:
|
|
148
|
+
logger.error(
|
|
149
|
+
f"Unsupported entry type from backend search method: {type(entry)} with {entry}. Expected `KnowledgebaseEntry` or `str`. Skip for this entry."
|
|
150
|
+
)
|
|
151
|
+
|
|
152
|
+
return entries
|
|
138
153
|
|
|
139
154
|
def __getattr__(self, name) -> Callable:
|
|
140
155
|
"""In case of knowledgebase have no backends' methods (`delete`, `list_chunks`, etc)
|
veadk/memory/long_term_memory.py
CHANGED
|
@@ -62,6 +62,12 @@ def _get_backend_cls(backend: str) -> type[BaseLongTermMemoryBackend]:
|
|
|
62
62
|
)
|
|
63
63
|
|
|
64
64
|
return RedisLTMBackend
|
|
65
|
+
case "mem0":
|
|
66
|
+
from veadk.memory.long_term_memory_backends.mem0_backend import (
|
|
67
|
+
Mem0LTMBackend,
|
|
68
|
+
)
|
|
69
|
+
|
|
70
|
+
return Mem0LTMBackend
|
|
65
71
|
|
|
66
72
|
raise ValueError(f"Unsupported long term memory backend: {backend}")
|
|
67
73
|
|
|
@@ -72,7 +78,7 @@ def build_long_term_memory_index(app_name: str, user_id: str):
|
|
|
72
78
|
|
|
73
79
|
class LongTermMemory(BaseMemoryService, BaseModel):
|
|
74
80
|
backend: Union[
|
|
75
|
-
Literal["local", "opensearch", "redis", "viking", "viking_mem"],
|
|
81
|
+
Literal["local", "opensearch", "redis", "viking", "viking_mem", "mem0"],
|
|
76
82
|
BaseLongTermMemoryBackend,
|
|
77
83
|
] = "opensearch"
|
|
78
84
|
"""Long term memory backend type"""
|
|
@@ -88,6 +94,12 @@ class LongTermMemory(BaseMemoryService, BaseModel):
|
|
|
88
94
|
user_id: str = ""
|
|
89
95
|
|
|
90
96
|
def model_post_init(self, __context: Any) -> None:
|
|
97
|
+
if self.backend == "viking_mem":
|
|
98
|
+
logger.warning(
|
|
99
|
+
"The `viking_mem` backend is deprecated, please use `viking` instead."
|
|
100
|
+
)
|
|
101
|
+
self.backend = "viking"
|
|
102
|
+
|
|
91
103
|
self._backend = None
|
|
92
104
|
|
|
93
105
|
# Once user define a backend instance, use it directly
|
|
@@ -147,12 +159,6 @@ class LongTermMemory(BaseMemoryService, BaseModel):
|
|
|
147
159
|
app_name = session.app_name
|
|
148
160
|
user_id = session.user_id
|
|
149
161
|
|
|
150
|
-
if self._index != build_long_term_memory_index(app_name, user_id):
|
|
151
|
-
logger.warning(
|
|
152
|
-
f"The `app_name` or `user_id` is different from the initialized one, skip add session to memory. Initialized index: {self._index}, current built index: {build_long_term_memory_index(app_name, user_id)}"
|
|
153
|
-
)
|
|
154
|
-
return
|
|
155
|
-
|
|
156
162
|
if not self._backend and isinstance(self.backend, str):
|
|
157
163
|
self._index = build_long_term_memory_index(app_name, user_id)
|
|
158
164
|
self._backend = _get_backend_cls(self.backend)(
|
|
@@ -162,6 +168,13 @@ class LongTermMemory(BaseMemoryService, BaseModel):
|
|
|
162
168
|
f"Initialize long term memory backend now, index is {self._index}"
|
|
163
169
|
)
|
|
164
170
|
|
|
171
|
+
if not self._index and self._index != build_long_term_memory_index(
|
|
172
|
+
app_name, user_id
|
|
173
|
+
):
|
|
174
|
+
logger.warning(
|
|
175
|
+
f"The `app_name` or `user_id` is different from the initialized one, skip add session to memory. Initialized index: {self._index}, current built index: {build_long_term_memory_index(app_name, user_id)}"
|
|
176
|
+
)
|
|
177
|
+
return
|
|
165
178
|
event_strings = self._filter_and_convert_events(session.events)
|
|
166
179
|
|
|
167
180
|
logger.info(
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
# Copyright (c) 2025 Beijing Volcano Engine Technology Co., Ltd. and/or its affiliates.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
|
|
15
|
+
from typing import Any
|
|
16
|
+
from typing_extensions import override
|
|
17
|
+
from pydantic import Field
|
|
18
|
+
|
|
19
|
+
from veadk.configs.database_configs import Mem0Config
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
from veadk.memory.long_term_memory_backends.base_backend import (
|
|
23
|
+
BaseLongTermMemoryBackend,
|
|
24
|
+
)
|
|
25
|
+
from veadk.utils.logger import get_logger
|
|
26
|
+
|
|
27
|
+
logger = get_logger(__name__)
|
|
28
|
+
|
|
29
|
+
try:
|
|
30
|
+
from mem0 import MemoryClient
|
|
31
|
+
|
|
32
|
+
except ImportError:
|
|
33
|
+
logger.error(
|
|
34
|
+
"Failed to import mem0 or dotenv. Please install them with 'pip install mem0 '"
|
|
35
|
+
)
|
|
36
|
+
raise ImportError("Required packages not installed: mem0")
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
class Mem0LTMBackend(BaseLongTermMemoryBackend):
|
|
40
|
+
"""Mem0 long term memory backend implementation"""
|
|
41
|
+
|
|
42
|
+
mem0_config: Mem0Config = Field(default_factory=Mem0Config)
|
|
43
|
+
|
|
44
|
+
def model_post_init(self, __context: Any) -> None:
|
|
45
|
+
"""Initialize Mem0 client"""
|
|
46
|
+
|
|
47
|
+
try:
|
|
48
|
+
self._mem0_client = MemoryClient(
|
|
49
|
+
# base_url=self.mem0_config.base_url, # mem0 endpoint
|
|
50
|
+
api_key=self.mem0_config.api_key, # mem0 API key
|
|
51
|
+
)
|
|
52
|
+
logger.info(f"Initialized Mem0 client for index: {self.index}")
|
|
53
|
+
except Exception as e:
|
|
54
|
+
logger.error(f"Failed to initialize Mem0 client: {str(e)}")
|
|
55
|
+
raise
|
|
56
|
+
|
|
57
|
+
def precheck_index_naming(self):
|
|
58
|
+
"""Check if the index name is valid
|
|
59
|
+
For Mem0, there are no specific naming constraints
|
|
60
|
+
"""
|
|
61
|
+
pass
|
|
62
|
+
|
|
63
|
+
@override
|
|
64
|
+
def save_memory(self, event_strings: list[str], **kwargs) -> bool:
|
|
65
|
+
"""Save memory to Mem0
|
|
66
|
+
|
|
67
|
+
Args:
|
|
68
|
+
event_strings: List of event strings to save
|
|
69
|
+
**kwargs: Additional parameters, including 'user_id' for Mem0
|
|
70
|
+
|
|
71
|
+
Returns:
|
|
72
|
+
bool: True if saved successfully, False otherwise
|
|
73
|
+
"""
|
|
74
|
+
user_id = kwargs.get("user_id", "default_user")
|
|
75
|
+
|
|
76
|
+
try:
|
|
77
|
+
logger.info(
|
|
78
|
+
f"Saving {len(event_strings)} events to Mem0 for user: {user_id}"
|
|
79
|
+
)
|
|
80
|
+
|
|
81
|
+
for event_string in event_strings:
|
|
82
|
+
# Save event string to Mem0
|
|
83
|
+
result = self._mem0_client.add(
|
|
84
|
+
[{"role": "user", "content": event_string}],
|
|
85
|
+
user_id=user_id,
|
|
86
|
+
output_format="v1.1",
|
|
87
|
+
)
|
|
88
|
+
logger.debug(f"Saved memory result: {result}")
|
|
89
|
+
|
|
90
|
+
logger.info(f"Successfully saved {len(event_strings)} events to Mem0")
|
|
91
|
+
return True
|
|
92
|
+
except Exception as e:
|
|
93
|
+
logger.error(f"Failed to save memory to Mem0: {str(e)}")
|
|
94
|
+
return False
|
|
95
|
+
|
|
96
|
+
@override
|
|
97
|
+
def search_memory(self, query: str, top_k: int, **kwargs) -> list[str]:
|
|
98
|
+
"""Search memory from Mem0
|
|
99
|
+
|
|
100
|
+
Args:
|
|
101
|
+
query: Search query
|
|
102
|
+
top_k: Number of results to return
|
|
103
|
+
**kwargs: Additional parameters, including 'user_id' for Mem0
|
|
104
|
+
|
|
105
|
+
Returns:
|
|
106
|
+
list[str]: List of memory strings
|
|
107
|
+
"""
|
|
108
|
+
user_id = kwargs.get("user_id", "default_user")
|
|
109
|
+
|
|
110
|
+
try:
|
|
111
|
+
logger.info(
|
|
112
|
+
f"Searching Mem0 for query: {query}, user: {user_id}, top_k: {top_k}"
|
|
113
|
+
)
|
|
114
|
+
|
|
115
|
+
memories = self._mem0_client.search(
|
|
116
|
+
query, user_id=user_id, output_format="v1.1", top_k=top_k
|
|
117
|
+
)
|
|
118
|
+
|
|
119
|
+
memory_list = []
|
|
120
|
+
if memories.get("results", []):
|
|
121
|
+
for mem in memories["results"]:
|
|
122
|
+
if "memory" in mem:
|
|
123
|
+
memory_list.append(mem["memory"])
|
|
124
|
+
|
|
125
|
+
logger.info(f"Found {len(memory_list)} memories matching query: {query}")
|
|
126
|
+
return memory_list
|
|
127
|
+
except Exception as e:
|
|
128
|
+
logger.error(f"Failed to search memory from Mem0: {str(e)}")
|
|
129
|
+
return []
|