praisonaiagents 0.0.36__tar.gz → 0.0.38__tar.gz

Sign up to get free protection for your applications and to get access to all the features.
Files changed (46) hide show
  1. praisonaiagents-0.0.38/PKG-INFO +18 -0
  2. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/__init__.py +4 -0
  3. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/agent/agent.py +51 -3
  4. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/agents/agents.py +10 -2
  5. praisonaiagents-0.0.38/praisonaiagents/knowledge/__init__.py +8 -0
  6. praisonaiagents-0.0.38/praisonaiagents/knowledge/chunking.py +182 -0
  7. praisonaiagents-0.0.38/praisonaiagents/knowledge/knowledge.py +290 -0
  8. praisonaiagents-0.0.38/praisonaiagents.egg-info/PKG-INFO +18 -0
  9. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents.egg-info/SOURCES.txt +3 -0
  10. praisonaiagents-0.0.38/praisonaiagents.egg-info/requires.txt +16 -0
  11. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/pyproject.toml +16 -3
  12. praisonaiagents-0.0.36/PKG-INFO +0 -10
  13. praisonaiagents-0.0.36/praisonaiagents.egg-info/PKG-INFO +0 -10
  14. praisonaiagents-0.0.36/praisonaiagents.egg-info/requires.txt +0 -6
  15. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/agent/__init__.py +0 -0
  16. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/agents/__init__.py +0 -0
  17. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/agents/autoagents.py +0 -0
  18. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/main.py +0 -0
  19. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/memory/memory.py +0 -0
  20. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/process/__init__.py +0 -0
  21. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/process/process.py +0 -0
  22. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/task/__init__.py +0 -0
  23. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/task/task.py +0 -0
  24. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/__init__.py +0 -0
  25. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/arxiv_tools.py +0 -0
  26. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/calculator_tools.py +0 -0
  27. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/csv_tools.py +0 -0
  28. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/duckdb_tools.py +0 -0
  29. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/duckduckgo_tools.py +0 -0
  30. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/excel_tools.py +0 -0
  31. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/file_tools.py +0 -0
  32. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/json_tools.py +0 -0
  33. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/newspaper_tools.py +0 -0
  34. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/pandas_tools.py +0 -0
  35. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/python_tools.py +0 -0
  36. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/shell_tools.py +0 -0
  37. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/spider_tools.py +0 -0
  38. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/test.py +0 -0
  39. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/tools.py +0 -0
  40. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/wikipedia_tools.py +0 -0
  41. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/xml_tools.py +0 -0
  42. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/yaml_tools.py +0 -0
  43. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents/tools/yfinance_tools.py +0 -0
  44. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents.egg-info/dependency_links.txt +0 -0
  45. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/praisonaiagents.egg-info/top_level.txt +0 -0
  46. {praisonaiagents-0.0.36 → praisonaiagents-0.0.38}/setup.cfg +0 -0
@@ -0,0 +1,18 @@
1
+ Metadata-Version: 2.2
2
+ Name: praisonaiagents
3
+ Version: 0.0.38
4
+ Summary: Praison AI agents for completing complex tasks with Self Reflection Agents
5
+ Author: Mervin Praison
6
+ Requires-Dist: pydantic
7
+ Requires-Dist: rich
8
+ Requires-Dist: openai
9
+ Provides-Extra: memory
10
+ Requires-Dist: chromadb>=0.5.23; extra == "memory"
11
+ Provides-Extra: knowledge
12
+ Requires-Dist: mem0ai>=0.1.0; extra == "knowledge"
13
+ Requires-Dist: chromadb==0.5.23; extra == "knowledge"
14
+ Requires-Dist: markitdown; extra == "knowledge"
15
+ Requires-Dist: chonkie; extra == "knowledge"
16
+ Provides-Extra: all
17
+ Requires-Dist: praisonaiagents[memory]; extra == "all"
18
+ Requires-Dist: praisonaiagents[knowledge]; extra == "all"
@@ -7,6 +7,8 @@ from .agents.agents import PraisonAIAgents
7
7
  from .task.task import Task
8
8
  from .tools.tools import Tools
9
9
  from .agents.autoagents import AutoAgents
10
+ from .knowledge.knowledge import Knowledge
11
+ from .knowledge.chunking import Chunking
10
12
  from .memory.memory import Memory
11
13
  from .main import (
12
14
  TaskOutput,
@@ -48,4 +50,6 @@ __all__ = [
48
50
  'register_display_callback',
49
51
  'sync_display_callbacks',
50
52
  'async_display_callbacks',
53
+ 'Knowledge',
54
+ 'Chunking'
51
55
  ]
@@ -20,6 +20,7 @@ from ..main import (
20
20
  adisplay_instruction
21
21
  )
22
22
  import inspect
23
+ import uuid
23
24
 
24
25
  if TYPE_CHECKING:
25
26
  from ..task.task import Task
@@ -176,13 +177,15 @@ class Agent:
176
177
  respect_context_window: bool = True,
177
178
  code_execution_mode: Literal["safe", "unsafe"] = "safe",
178
179
  embedder_config: Optional[Dict[str, Any]] = None,
179
- knowledge_sources: Optional[List[Any]] = None,
180
+ knowledge: Optional[List[str]] = None,
181
+ knowledge_config: Optional[Dict[str, Any]] = None,
180
182
  use_system_prompt: Optional[bool] = True,
181
183
  markdown: bool = True,
182
184
  self_reflect: bool = False,
183
185
  max_reflect: int = 3,
184
186
  min_reflect: int = 1,
185
- reflect_llm: Optional[str] = None
187
+ reflect_llm: Optional[str] = None,
188
+ user_id: Optional[str] = None
186
189
  ):
187
190
  # Handle backward compatibility for required fields
188
191
  if all(x is None for x in [name, role, goal, backstory, instructions]):
@@ -226,7 +229,7 @@ class Agent:
226
229
  self.respect_context_window = respect_context_window
227
230
  self.code_execution_mode = code_execution_mode
228
231
  self.embedder_config = embedder_config
229
- self.knowledge_sources = knowledge_sources
232
+ self.knowledge = knowledge
230
233
  self.use_system_prompt = use_system_prompt
231
234
  self.chat_history = []
232
235
  self.markdown = markdown
@@ -242,6 +245,36 @@ Your Role: {self.role}\n
242
245
  Your Goal: {self.goal}
243
246
  """
244
247
 
248
+ # Generate unique IDs
249
+ self.agent_id = str(uuid.uuid4())
250
+
251
+ # Store user_id
252
+ self.user_id = user_id
253
+
254
+ # Initialize Knowledge with provided or default config
255
+ from praisonaiagents.knowledge import Knowledge
256
+ self.knowledge = Knowledge(knowledge_config or None)
257
+
258
+ # Handle knowledge
259
+ if knowledge:
260
+ for source in knowledge:
261
+ self._process_knowledge(source)
262
+
263
+ def _process_knowledge(self, knowledge_item):
264
+ """Process and store knowledge from a file path, URL, or string."""
265
+ try:
266
+ if os.path.exists(knowledge_item):
267
+ # It's a file path
268
+ self.knowledge.add(knowledge_item, user_id=self.user_id, agent_id=self.agent_id)
269
+ elif knowledge_item.startswith("http://") or knowledge_item.startswith("https://"):
270
+ # It's a URL
271
+ pass
272
+ else:
273
+ # It's a string content
274
+ self.knowledge.store(knowledge_item, user_id=self.user_id, agent_id=self.agent_id)
275
+ except Exception as e:
276
+ logging.error(f"Error processing knowledge item: {knowledge_item}, error: {e}")
277
+
245
278
  def generate_task(self) -> 'Task':
246
279
  """Generate a Task object from the agent's instructions"""
247
280
  from ..task.task import Task
@@ -418,6 +451,21 @@ Your Goal: {self.goal}
418
451
  return None
419
452
 
420
453
  def chat(self, prompt, temperature=0.2, tools=None, output_json=None, output_pydantic=None):
454
+ # Search for existing knowledge if any knowledge is provided
455
+ if self.knowledge:
456
+ search_results = self.knowledge.search(prompt, agent_id=self.agent_id)
457
+ if search_results:
458
+ # Check if search_results is a list of dictionaries or strings
459
+ if isinstance(search_results, dict) and 'results' in search_results:
460
+ # Extract memory content from the results
461
+ knowledge_content = "\n".join([result['memory'] for result in search_results['results']])
462
+ else:
463
+ # If search_results is a list of strings, join them directly
464
+ knowledge_content = "\n".join(search_results)
465
+
466
+ # Append found knowledge to the prompt
467
+ prompt = f"{prompt}\n\nKnowledge: {knowledge_content}"
468
+
421
469
  if self.use_system_prompt:
422
470
  system_prompt = f"""{self.backstory}\n
423
471
  Your Role: {self.role}\n
@@ -12,6 +12,7 @@ from ..agent.agent import Agent
12
12
  from ..task.task import Task
13
13
  from ..process.process import Process, LoopItems
14
14
  import asyncio
15
+ import uuid
15
16
 
16
17
  # Set up logger
17
18
  logger = logging.getLogger(__name__)
@@ -44,10 +45,17 @@ def process_video(video_path: str, seconds_per_frame=2):
44
45
  return base64_frames
45
46
 
46
47
  class PraisonAIAgents:
47
- def __init__(self, agents, tasks=None, verbose=0, completion_checker=None, max_retries=5, process="sequential", manager_llm=None, memory=False, memory_config=None, embedder=None):
48
+ def __init__(self, agents, tasks=None, verbose=0, completion_checker=None, max_retries=5, process="sequential", manager_llm=None, memory=False, memory_config=None, embedder=None, user_id=None):
48
49
  if not agents:
49
50
  raise ValueError("At least one agent must be provided")
50
-
51
+
52
+ self.run_id = str(uuid.uuid4()) # Auto-generate run_id
53
+ self.user_id = user_id # Optional user_id
54
+
55
+ # Pass user_id to each agent
56
+ for agent in agents:
57
+ agent.user_id = self.user_id
58
+
51
59
  self.agents = agents
52
60
  self.tasks = {}
53
61
  if max_retries < 3:
@@ -0,0 +1,8 @@
1
+ """
2
+ PraisonAI Knowledge - Advanced knowledge management system with configurable features
3
+ """
4
+
5
+ from praisonaiagents.knowledge.knowledge import Knowledge
6
+ from praisonaiagents.knowledge.chunking import Chunking
7
+
8
+ __all__ = ["Knowledge", "Chunking"]
@@ -0,0 +1,182 @@
1
+ from typing import List, Union, Optional, Dict, Any
2
+ from functools import cached_property
3
+ import importlib
4
+
5
+ class Chunking:
6
+ """A unified class for text chunking with various chunking strategies."""
7
+
8
+ CHUNKER_PARAMS = {
9
+ 'token': ['chunk_size', 'chunk_overlap', 'tokenizer'],
10
+ 'word': ['chunk_size', 'chunk_overlap', 'tokenizer'],
11
+ 'sentence': ['chunk_size', 'chunk_overlap', 'tokenizer'],
12
+ 'semantic': ['chunk_size', 'embedding_model', 'tokenizer'],
13
+ 'sdpm': ['chunk_size', 'embedding_model', 'tokenizer'],
14
+ 'late': ['chunk_size', 'embedding_model', 'tokenizer'],
15
+ 'recursive': ['chunk_size', 'tokenizer']
16
+ }
17
+
18
+ @cached_property
19
+ def SUPPORTED_CHUNKERS(self) -> Dict[str, Any]:
20
+ """Lazy load chunker classes."""
21
+ try:
22
+ from chonkie.chunker import (
23
+ TokenChunker,
24
+ WordChunker,
25
+ SentenceChunker,
26
+ SemanticChunker,
27
+ SDPMChunker,
28
+ LateChunker,
29
+ RecursiveChunker
30
+ )
31
+ except ImportError:
32
+ raise ImportError(
33
+ "chonkie package not found. Please install it using: pip install 'praisonaiagents[knowledge]'"
34
+ )
35
+
36
+ return {
37
+ 'token': TokenChunker,
38
+ 'word': WordChunker,
39
+ 'sentence': SentenceChunker,
40
+ 'semantic': SemanticChunker,
41
+ 'sdpm': SDPMChunker,
42
+ 'late': LateChunker,
43
+ 'recursive': RecursiveChunker
44
+ }
45
+
46
+ def __init__(
47
+ self,
48
+ chunker_type: str = 'token',
49
+ chunk_size: int = 512,
50
+ chunk_overlap: int = 128,
51
+ tokenizer: str = "gpt2",
52
+ embedding_model: Optional[Union[str, Any]] = None,
53
+ **kwargs
54
+ ):
55
+ """Initialize the Chunking class."""
56
+ if chunker_type not in self.CHUNKER_PARAMS:
57
+ raise ValueError(
58
+ f"Unsupported chunker type: {chunker_type}. "
59
+ f"Must be one of: {list(self.CHUNKER_PARAMS.keys())}"
60
+ )
61
+
62
+ self.chunker_type = chunker_type
63
+ self.chunk_size = chunk_size
64
+ self.chunk_overlap = chunk_overlap
65
+ self.tokenizer = tokenizer
66
+ self._embedding_model = embedding_model
67
+ self.kwargs = kwargs
68
+
69
+ # Initialize these as None for lazy loading
70
+ self._chunker = None
71
+ self._embeddings = None
72
+
73
+ @cached_property
74
+ def embedding_model(self):
75
+ """Lazy load the embedding model."""
76
+ if self._embedding_model is None and self.chunker_type in ['semantic', 'sdpm', 'late']:
77
+ from chonkie.embeddings import AutoEmbeddings
78
+ return AutoEmbeddings.get_embeddings("all-MiniLM-L6-v2")
79
+ elif isinstance(self._embedding_model, str):
80
+ from chonkie.embeddings import AutoEmbeddings
81
+ return AutoEmbeddings.get_embeddings(self._embedding_model)
82
+ return self._embedding_model
83
+
84
+ def _get_chunker_params(self) -> Dict[str, Any]:
85
+ """Get the appropriate parameters for the current chunker type."""
86
+ allowed_params = self.CHUNKER_PARAMS[self.chunker_type]
87
+ params = {'chunk_size': self.chunk_size}
88
+
89
+ if 'chunk_overlap' in allowed_params:
90
+ params['chunk_overlap'] = self.chunk_overlap
91
+
92
+ if 'tokenizer' in allowed_params:
93
+ if self.chunker_type in ['semantic', 'sdpm', 'late']:
94
+ params['tokenizer'] = self.embedding_model.get_tokenizer_or_token_counter()
95
+ else:
96
+ params['tokenizer'] = self.tokenizer
97
+
98
+ if 'embedding_model' in allowed_params:
99
+ params['embedding_model'] = self.embedding_model
100
+
101
+ # Add any additional kwargs that are in allowed_params
102
+ for key, value in self.kwargs.items():
103
+ if key in allowed_params:
104
+ params[key] = value
105
+
106
+ return params
107
+
108
+ @cached_property
109
+ def chunker(self):
110
+ """Lazy load the chunker instance."""
111
+ if self._chunker is None:
112
+ chunker_cls = self.SUPPORTED_CHUNKERS[self.chunker_type]
113
+ common_params = self._get_chunker_params()
114
+ self._chunker = chunker_cls(**common_params)
115
+
116
+ return self._chunker
117
+
118
+ def _get_overlap_refinery(self, context_size: Optional[int] = None, **kwargs):
119
+ """Lazy load the overlap refinery."""
120
+ try:
121
+ from chonkie.refinery import OverlapRefinery
122
+ except ImportError:
123
+ raise ImportError("Failed to import OverlapRefinery from chonkie.refinery")
124
+
125
+ if context_size is None:
126
+ context_size = self.chunk_overlap
127
+
128
+ return OverlapRefinery(
129
+ context_size=context_size,
130
+ tokenizer=self.chunker.tokenizer,
131
+ **kwargs
132
+ )
133
+
134
+ def add_overlap_context(
135
+ self,
136
+ chunks: List[Any],
137
+ context_size: int = None,
138
+ mode: str = "suffix",
139
+ merge_context: bool = True
140
+ ) -> List[Any]:
141
+ """Add overlap context to chunks using OverlapRefinery."""
142
+ refinery = self._get_overlap_refinery(
143
+ context_size=context_size,
144
+ mode=mode,
145
+ merge_context=merge_context
146
+ )
147
+ return refinery.refine(chunks)
148
+
149
+ def chunk(
150
+ self,
151
+ text: Union[str, List[str]],
152
+ add_context: bool = False,
153
+ context_params: Optional[Dict[str, Any]] = None
154
+ ) -> Union[List[Any], List[List[Any]]]:
155
+ """Chunk text using the configured chunking strategy."""
156
+ chunks = self.chunker(text)
157
+
158
+ if add_context:
159
+ context_params = context_params or {}
160
+ if isinstance(text, str):
161
+ chunks = self.add_overlap_context(chunks, **context_params)
162
+ else:
163
+ chunks = [self.add_overlap_context(c, **context_params) for c in chunks]
164
+
165
+ return chunks
166
+
167
+ def __call__(
168
+ self,
169
+ text: Union[str, List[str]],
170
+ add_context: bool = False,
171
+ context_params: Optional[Dict[str, Any]] = None
172
+ ) -> Union[List[Any], List[List[Any]]]:
173
+ """Make the Chunking instance callable."""
174
+ return self.chunk(text, add_context, context_params)
175
+
176
+ def __repr__(self) -> str:
177
+ """String representation of the Chunking instance."""
178
+ return (
179
+ f"Chunking(chunker_type='{self.chunker_type}', "
180
+ f"chunk_size={self.chunk_size}, "
181
+ f"chunk_overlap={self.chunk_overlap})"
182
+ )
@@ -0,0 +1,290 @@
1
+ import os
2
+ import logging
3
+ import uuid
4
+ import time
5
+ from .chunking import Chunking
6
+ from functools import cached_property
7
+
8
+ logger = logging.getLogger(__name__)
9
+
10
+ class CustomMemory:
11
+ @classmethod
12
+ def from_config(cls, config):
13
+ from mem0 import Memory
14
+ return type('CustomMemory', (Memory,), {
15
+ '_add_to_vector_store': cls._add_to_vector_store
16
+ }).from_config(config)
17
+
18
+ @staticmethod
19
+ def _add_to_vector_store(self, messages, metadata, filters):
20
+ # Custom implementation that doesn't use LLM
21
+ parsed_messages = "\n".join([msg["content"] for msg in messages])
22
+
23
+ # Create a simple fact without using LLM
24
+ new_retrieved_facts = [parsed_messages]
25
+
26
+ # Process embeddings and continue with vector store operations
27
+ new_message_embeddings = {}
28
+ for new_mem in new_retrieved_facts:
29
+ messages_embeddings = self.embedding_model.embed(new_mem)
30
+ new_message_embeddings[new_mem] = messages_embeddings
31
+
32
+ # Create the memory
33
+ memory_id = self._create_memory(
34
+ data=parsed_messages,
35
+ existing_embeddings=new_message_embeddings,
36
+ metadata=metadata
37
+ )
38
+
39
+ return [{
40
+ "id": memory_id,
41
+ "memory": parsed_messages,
42
+ "event": "ADD"
43
+ }]
44
+
45
+ class Knowledge:
46
+ def __init__(self, config=None, verbose=None):
47
+ self._config = config
48
+ self._verbose = verbose or 0
49
+ os.environ['ANONYMIZED_TELEMETRY'] = 'False' # Chromadb
50
+
51
+ # Configure logging levels based on verbose setting
52
+ if not self._verbose:
53
+ # Suppress logs from all relevant dependencies
54
+ for logger_name in [
55
+ 'mem0',
56
+ 'chromadb',
57
+ 'local_persistent_hnsw',
58
+ '_client',
59
+ 'main'
60
+ ]:
61
+ logging.getLogger(logger_name).setLevel(logging.WARNING)
62
+
63
+ # Disable OpenAI API request logging
64
+ logging.getLogger('openai').setLevel(logging.WARNING)
65
+
66
+ # Set root logger to warning to catch any uncategorized logs
67
+ logging.getLogger().setLevel(logging.WARNING)
68
+
69
+ @cached_property
70
+ def _deps(self):
71
+ try:
72
+ from markitdown import MarkItDown
73
+ import chromadb
74
+ return {
75
+ 'chromadb': chromadb,
76
+ 'markdown': MarkItDown()
77
+ }
78
+ except ImportError:
79
+ raise ImportError(
80
+ "Required packages not installed. Please install using: "
81
+ 'pip install "praisonaiagents[knowledge]"'
82
+ )
83
+
84
+ @cached_property
85
+ def config(self):
86
+ # Generate unique collection name for each instance
87
+ collection_name = f"test_{int(time.time())}_{str(uuid.uuid4())[:8]}"
88
+ persist_dir = ".praison"
89
+
90
+ # Create persistent client config
91
+ base_config = {
92
+ "vector_store": {
93
+ "provider": "chroma",
94
+ "config": {
95
+ "collection_name": collection_name,
96
+ "path": persist_dir,
97
+ "client": self._deps['chromadb'].PersistentClient(path=persist_dir)
98
+ }
99
+ },
100
+ "version": "v1.1",
101
+ "custom_prompt": "Return {{\"facts\": [text]}} where text is the exact input provided and json response"
102
+ }
103
+
104
+ # If config is provided, merge it with base config
105
+ if self._config:
106
+ if "vector_store" in self._config and "config" in self._config["vector_store"]:
107
+ config_copy = self._config["vector_store"]["config"].copy()
108
+ for key in ["collection_name", "client"]:
109
+ if key in config_copy:
110
+ del config_copy[key]
111
+ base_config["vector_store"]["config"].update(config_copy)
112
+
113
+ return base_config
114
+
115
+ @cached_property
116
+ def memory(self):
117
+ try:
118
+ return CustomMemory.from_config(self.config)
119
+ except (NotImplementedError, ValueError) as e:
120
+ if "list_collections" in str(e) or "Extra fields not allowed" in str(e):
121
+ # Keep only allowed fields
122
+ vector_store_config = {
123
+ "collection_name": self.config["vector_store"]["config"]["collection_name"],
124
+ "path": self.config["vector_store"]["config"]["path"]
125
+ }
126
+ self.config["vector_store"]["config"] = vector_store_config
127
+ from mem0 import Memory
128
+ return Memory.from_config(self.config)
129
+ raise
130
+
131
+ @cached_property
132
+ def markdown(self):
133
+ return self._deps['markdown']
134
+
135
+ @cached_property
136
+ def chunker(self):
137
+ return Chunking(
138
+ chunker_type='recursive',
139
+ chunk_size=512,
140
+ chunk_overlap=50
141
+ )
142
+
143
+ def _log(self, message, level=2):
144
+ """Internal logging helper"""
145
+ if self._verbose and self._verbose >= level:
146
+ logger.info(message)
147
+
148
+ def store(self, content, user_id=None, agent_id=None, run_id=None, metadata=None):
149
+ """Store a memory."""
150
+ try:
151
+ if isinstance(content, str):
152
+ if any(content.lower().endswith(ext) for ext in ['.pdf', '.doc', '.docx', '.txt']):
153
+ self._log(f"Content appears to be a file path, processing file: {content}")
154
+ return self.add(content, user_id=user_id, agent_id=agent_id, run_id=run_id, metadata=metadata)
155
+
156
+ content = content.strip()
157
+ if not content:
158
+ return []
159
+
160
+ result = self.memory.add(content, user_id=user_id, agent_id=agent_id, run_id=run_id, metadata=metadata)
161
+ self._log(f"Store operation result: {result}")
162
+ return result
163
+ except Exception as e:
164
+ logger.error(f"Error storing content: {str(e)}")
165
+ return []
166
+
167
+ def get_all(self, user_id=None, agent_id=None, run_id=None):
168
+ """Retrieve all memories."""
169
+ return self.memory.get_all(user_id=user_id, agent_id=agent_id, run_id=run_id)
170
+
171
+ def get(self, memory_id):
172
+ """Retrieve a specific memory by ID."""
173
+ return self.memory.get(memory_id)
174
+
175
+ def search(self, query, user_id=None, agent_id=None, run_id=None):
176
+ """Search for memories related to a query."""
177
+ return self.memory.search(query, user_id=user_id, agent_id=agent_id, run_id=run_id)
178
+
179
+ def update(self, memory_id, data):
180
+ """Update a memory."""
181
+ return self.memory.update(memory_id, data)
182
+
183
+ def history(self, memory_id):
184
+ """Get the history of changes for a memory."""
185
+ return self.memory.history(memory_id)
186
+
187
+ def delete(self, memory_id):
188
+ """Delete a memory."""
189
+ self.memory.delete(memory_id)
190
+
191
+ def delete_all(self, user_id=None, agent_id=None, run_id=None):
192
+ """Delete all memories."""
193
+ self.memory.delete_all(user_id=user_id, agent_id=agent_id, run_id=run_id)
194
+
195
+ def reset(self):
196
+ """Reset all memories."""
197
+ self.memory.reset()
198
+
199
+ def normalize_content(self, content):
200
+ """Normalize content for consistent storage."""
201
+ # Example normalization: strip whitespace, convert to lowercase
202
+ return content.strip().lower()
203
+
204
+ def add(self, file_path, user_id=None, agent_id=None, run_id=None, metadata=None):
205
+ """Read file content and store it in memory.
206
+
207
+ Args:
208
+ file_path: Can be:
209
+ - A string path to local file
210
+ - A URL string
211
+ - A list containing file paths and/or URLs
212
+ """
213
+ if isinstance(file_path, (list, tuple)):
214
+ results = []
215
+ for path in file_path:
216
+ result = self._process_single_input(path, user_id, agent_id, run_id, metadata)
217
+ results.extend(result.get('results', []))
218
+ return {'results': results, 'relations': []}
219
+
220
+ return self._process_single_input(file_path, user_id, agent_id, run_id, metadata)
221
+
222
+ def _process_single_input(self, input_path, user_id=None, agent_id=None, run_id=None, metadata=None):
223
+ """Process a single input which can be a file path or URL."""
224
+ try:
225
+ # Define supported file extensions
226
+ DOCUMENT_EXTENSIONS = {
227
+ 'document': ('.pdf', '.ppt', '.pptx', '.doc', '.docx', '.xls', '.xlsx'),
228
+ 'media': ('.jpg', '.jpeg', '.png', '.gif', '.bmp', '.tiff', '.mp3', '.wav', '.ogg', '.m4a'),
229
+ 'text': ('.txt', '.csv', '.json', '.xml', '.md', '.html', '.htm'),
230
+ 'archive': '.zip'
231
+ }
232
+
233
+ # Check if input is URL
234
+ if isinstance(input_path, str) and (input_path.startswith('http://') or input_path.startswith('https://')):
235
+ self._log(f"Processing URL: {input_path}")
236
+ raise NotImplementedError("URL processing not yet implemented")
237
+
238
+ # Check if input ends with any supported extension
239
+ is_supported_file = any(input_path.lower().endswith(ext)
240
+ for exts in DOCUMENT_EXTENSIONS.values()
241
+ for ext in (exts if isinstance(exts, tuple) else (exts,)))
242
+
243
+ if is_supported_file:
244
+ self._log(f"Processing as file path: {input_path}")
245
+ if not os.path.exists(input_path):
246
+ logger.error(f"File not found: {input_path}")
247
+ raise FileNotFoundError(f"File not found: {input_path}")
248
+
249
+ file_ext = '.' + input_path.lower().split('.')[-1] # Get extension reliably
250
+
251
+ # Process file based on type
252
+ if file_ext in DOCUMENT_EXTENSIONS['text']:
253
+ with open(input_path, 'r', encoding='utf-8') as file:
254
+ content = file.read().strip()
255
+ if not content:
256
+ raise ValueError("Empty text file")
257
+ memories = [self.normalize_content(content)]
258
+ else:
259
+ # Use MarkItDown for documents and media
260
+ result = self.markdown.convert(input_path)
261
+ content = result.text_content
262
+ if not content:
263
+ raise ValueError("No content could be extracted from file")
264
+ chunks = self.chunker.chunk(content)
265
+ memories = [chunk.text.strip() if hasattr(chunk, 'text') else str(chunk).strip()
266
+ for chunk in chunks if chunk]
267
+
268
+ # Set metadata for file
269
+ if not metadata:
270
+ metadata = {}
271
+ metadata['file_type'] = file_ext.lstrip('.')
272
+ metadata['filename'] = os.path.basename(input_path)
273
+ else:
274
+ # Treat as raw text content only if no file extension
275
+ memories = [self.normalize_content(input_path)]
276
+
277
+ # Store memories
278
+ all_results = []
279
+ for memory in memories:
280
+ if memory:
281
+ memory_result = self.store(memory, user_id=user_id, agent_id=agent_id,
282
+ run_id=run_id, metadata=metadata)
283
+ if memory_result:
284
+ all_results.extend(memory_result.get('results', []))
285
+
286
+ return {'results': all_results, 'relations': []}
287
+
288
+ except Exception as e:
289
+ logger.error(f"Error processing input {input_path}: {str(e)}", exc_info=True)
290
+ raise
@@ -0,0 +1,18 @@
1
+ Metadata-Version: 2.2
2
+ Name: praisonaiagents
3
+ Version: 0.0.38
4
+ Summary: Praison AI agents for completing complex tasks with Self Reflection Agents
5
+ Author: Mervin Praison
6
+ Requires-Dist: pydantic
7
+ Requires-Dist: rich
8
+ Requires-Dist: openai
9
+ Provides-Extra: memory
10
+ Requires-Dist: chromadb>=0.5.23; extra == "memory"
11
+ Provides-Extra: knowledge
12
+ Requires-Dist: mem0ai>=0.1.0; extra == "knowledge"
13
+ Requires-Dist: chromadb==0.5.23; extra == "knowledge"
14
+ Requires-Dist: markitdown; extra == "knowledge"
15
+ Requires-Dist: chonkie; extra == "knowledge"
16
+ Provides-Extra: all
17
+ Requires-Dist: praisonaiagents[memory]; extra == "all"
18
+ Requires-Dist: praisonaiagents[knowledge]; extra == "all"
@@ -11,6 +11,9 @@ praisonaiagents/agent/agent.py
11
11
  praisonaiagents/agents/__init__.py
12
12
  praisonaiagents/agents/agents.py
13
13
  praisonaiagents/agents/autoagents.py
14
+ praisonaiagents/knowledge/__init__.py
15
+ praisonaiagents/knowledge/chunking.py
16
+ praisonaiagents/knowledge/knowledge.py
14
17
  praisonaiagents/memory/memory.py
15
18
  praisonaiagents/process/__init__.py
16
19
  praisonaiagents/process/process.py
@@ -0,0 +1,16 @@
1
+ pydantic
2
+ rich
3
+ openai
4
+
5
+ [all]
6
+ praisonaiagents[memory]
7
+ praisonaiagents[knowledge]
8
+
9
+ [knowledge]
10
+ mem0ai>=0.1.0
11
+ chromadb==0.5.23
12
+ markitdown
13
+ chonkie
14
+
15
+ [memory]
16
+ chromadb>=0.5.23
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "praisonaiagents"
7
- version = "0.0.36"
7
+ version = "0.0.38"
8
8
  description = "Praison AI agents for completing complex tasks with Self Reflection Agents"
9
9
  authors = [
10
10
  { name="Mervin Praison" }
@@ -17,5 +17,18 @@ dependencies = [
17
17
 
18
18
  [project.optional-dependencies]
19
19
  memory = [
20
- "chromadb>=0.6.0"
21
- ]
20
+ "chromadb>=0.5.23"
21
+ ]
22
+
23
+ knowledge = [
24
+ "mem0ai>=0.1.0",
25
+ "chromadb==0.5.23",
26
+ "markitdown",
27
+ "chonkie"
28
+ ]
29
+
30
+ # Combined features
31
+ all = [
32
+ "praisonaiagents[memory]",
33
+ "praisonaiagents[knowledge]"
34
+ ]
@@ -1,10 +0,0 @@
1
- Metadata-Version: 2.2
2
- Name: praisonaiagents
3
- Version: 0.0.36
4
- Summary: Praison AI agents for completing complex tasks with Self Reflection Agents
5
- Author: Mervin Praison
6
- Requires-Dist: pydantic
7
- Requires-Dist: rich
8
- Requires-Dist: openai
9
- Provides-Extra: memory
10
- Requires-Dist: chromadb>=0.6.0; extra == "memory"
@@ -1,10 +0,0 @@
1
- Metadata-Version: 2.2
2
- Name: praisonaiagents
3
- Version: 0.0.36
4
- Summary: Praison AI agents for completing complex tasks with Self Reflection Agents
5
- Author: Mervin Praison
6
- Requires-Dist: pydantic
7
- Requires-Dist: rich
8
- Requires-Dist: openai
9
- Provides-Extra: memory
10
- Requires-Dist: chromadb>=0.6.0; extra == "memory"
@@ -1,6 +0,0 @@
1
- pydantic
2
- rich
3
- openai
4
-
5
- [memory]
6
- chromadb>=0.6.0