agentrun-mem0ai 0.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (150)
  1. agentrun_mem0/__init__.py +6 -0
  2. agentrun_mem0/client/__init__.py +0 -0
  3. agentrun_mem0/client/main.py +1747 -0
  4. agentrun_mem0/client/project.py +931 -0
  5. agentrun_mem0/client/utils.py +115 -0
  6. agentrun_mem0/configs/__init__.py +0 -0
  7. agentrun_mem0/configs/base.py +90 -0
  8. agentrun_mem0/configs/embeddings/__init__.py +0 -0
  9. agentrun_mem0/configs/embeddings/base.py +110 -0
  10. agentrun_mem0/configs/enums.py +7 -0
  11. agentrun_mem0/configs/llms/__init__.py +0 -0
  12. agentrun_mem0/configs/llms/anthropic.py +56 -0
  13. agentrun_mem0/configs/llms/aws_bedrock.py +192 -0
  14. agentrun_mem0/configs/llms/azure.py +57 -0
  15. agentrun_mem0/configs/llms/base.py +62 -0
  16. agentrun_mem0/configs/llms/deepseek.py +56 -0
  17. agentrun_mem0/configs/llms/lmstudio.py +59 -0
  18. agentrun_mem0/configs/llms/ollama.py +56 -0
  19. agentrun_mem0/configs/llms/openai.py +79 -0
  20. agentrun_mem0/configs/llms/vllm.py +56 -0
  21. agentrun_mem0/configs/prompts.py +459 -0
  22. agentrun_mem0/configs/rerankers/__init__.py +0 -0
  23. agentrun_mem0/configs/rerankers/base.py +17 -0
  24. agentrun_mem0/configs/rerankers/cohere.py +15 -0
  25. agentrun_mem0/configs/rerankers/config.py +12 -0
  26. agentrun_mem0/configs/rerankers/huggingface.py +17 -0
  27. agentrun_mem0/configs/rerankers/llm.py +48 -0
  28. agentrun_mem0/configs/rerankers/sentence_transformer.py +16 -0
  29. agentrun_mem0/configs/rerankers/zero_entropy.py +28 -0
  30. agentrun_mem0/configs/vector_stores/__init__.py +0 -0
  31. agentrun_mem0/configs/vector_stores/alibabacloud_mysql.py +64 -0
  32. agentrun_mem0/configs/vector_stores/aliyun_tablestore.py +32 -0
  33. agentrun_mem0/configs/vector_stores/azure_ai_search.py +57 -0
  34. agentrun_mem0/configs/vector_stores/azure_mysql.py +84 -0
  35. agentrun_mem0/configs/vector_stores/baidu.py +27 -0
  36. agentrun_mem0/configs/vector_stores/chroma.py +58 -0
  37. agentrun_mem0/configs/vector_stores/databricks.py +61 -0
  38. agentrun_mem0/configs/vector_stores/elasticsearch.py +65 -0
  39. agentrun_mem0/configs/vector_stores/faiss.py +37 -0
  40. agentrun_mem0/configs/vector_stores/langchain.py +30 -0
  41. agentrun_mem0/configs/vector_stores/milvus.py +42 -0
  42. agentrun_mem0/configs/vector_stores/mongodb.py +25 -0
  43. agentrun_mem0/configs/vector_stores/neptune.py +27 -0
  44. agentrun_mem0/configs/vector_stores/opensearch.py +41 -0
  45. agentrun_mem0/configs/vector_stores/pgvector.py +52 -0
  46. agentrun_mem0/configs/vector_stores/pinecone.py +55 -0
  47. agentrun_mem0/configs/vector_stores/qdrant.py +47 -0
  48. agentrun_mem0/configs/vector_stores/redis.py +24 -0
  49. agentrun_mem0/configs/vector_stores/s3_vectors.py +28 -0
  50. agentrun_mem0/configs/vector_stores/supabase.py +44 -0
  51. agentrun_mem0/configs/vector_stores/upstash_vector.py +34 -0
  52. agentrun_mem0/configs/vector_stores/valkey.py +15 -0
  53. agentrun_mem0/configs/vector_stores/vertex_ai_vector_search.py +28 -0
  54. agentrun_mem0/configs/vector_stores/weaviate.py +41 -0
  55. agentrun_mem0/embeddings/__init__.py +0 -0
  56. agentrun_mem0/embeddings/aws_bedrock.py +100 -0
  57. agentrun_mem0/embeddings/azure_openai.py +55 -0
  58. agentrun_mem0/embeddings/base.py +31 -0
  59. agentrun_mem0/embeddings/configs.py +30 -0
  60. agentrun_mem0/embeddings/gemini.py +39 -0
  61. agentrun_mem0/embeddings/huggingface.py +44 -0
  62. agentrun_mem0/embeddings/langchain.py +35 -0
  63. agentrun_mem0/embeddings/lmstudio.py +29 -0
  64. agentrun_mem0/embeddings/mock.py +11 -0
  65. agentrun_mem0/embeddings/ollama.py +53 -0
  66. agentrun_mem0/embeddings/openai.py +49 -0
  67. agentrun_mem0/embeddings/together.py +31 -0
  68. agentrun_mem0/embeddings/vertexai.py +64 -0
  69. agentrun_mem0/exceptions.py +503 -0
  70. agentrun_mem0/graphs/__init__.py +0 -0
  71. agentrun_mem0/graphs/configs.py +105 -0
  72. agentrun_mem0/graphs/neptune/__init__.py +0 -0
  73. agentrun_mem0/graphs/neptune/base.py +497 -0
  74. agentrun_mem0/graphs/neptune/neptunedb.py +511 -0
  75. agentrun_mem0/graphs/neptune/neptunegraph.py +474 -0
  76. agentrun_mem0/graphs/tools.py +371 -0
  77. agentrun_mem0/graphs/utils.py +97 -0
  78. agentrun_mem0/llms/__init__.py +0 -0
  79. agentrun_mem0/llms/anthropic.py +87 -0
  80. agentrun_mem0/llms/aws_bedrock.py +665 -0
  81. agentrun_mem0/llms/azure_openai.py +141 -0
  82. agentrun_mem0/llms/azure_openai_structured.py +91 -0
  83. agentrun_mem0/llms/base.py +131 -0
  84. agentrun_mem0/llms/configs.py +34 -0
  85. agentrun_mem0/llms/deepseek.py +107 -0
  86. agentrun_mem0/llms/gemini.py +201 -0
  87. agentrun_mem0/llms/groq.py +88 -0
  88. agentrun_mem0/llms/langchain.py +94 -0
  89. agentrun_mem0/llms/litellm.py +87 -0
  90. agentrun_mem0/llms/lmstudio.py +114 -0
  91. agentrun_mem0/llms/ollama.py +117 -0
  92. agentrun_mem0/llms/openai.py +147 -0
  93. agentrun_mem0/llms/openai_structured.py +52 -0
  94. agentrun_mem0/llms/sarvam.py +89 -0
  95. agentrun_mem0/llms/together.py +88 -0
  96. agentrun_mem0/llms/vllm.py +107 -0
  97. agentrun_mem0/llms/xai.py +52 -0
  98. agentrun_mem0/memory/__init__.py +0 -0
  99. agentrun_mem0/memory/base.py +63 -0
  100. agentrun_mem0/memory/graph_memory.py +698 -0
  101. agentrun_mem0/memory/kuzu_memory.py +713 -0
  102. agentrun_mem0/memory/main.py +2229 -0
  103. agentrun_mem0/memory/memgraph_memory.py +689 -0
  104. agentrun_mem0/memory/setup.py +56 -0
  105. agentrun_mem0/memory/storage.py +218 -0
  106. agentrun_mem0/memory/telemetry.py +90 -0
  107. agentrun_mem0/memory/utils.py +208 -0
  108. agentrun_mem0/proxy/__init__.py +0 -0
  109. agentrun_mem0/proxy/main.py +189 -0
  110. agentrun_mem0/reranker/__init__.py +9 -0
  111. agentrun_mem0/reranker/base.py +20 -0
  112. agentrun_mem0/reranker/cohere_reranker.py +85 -0
  113. agentrun_mem0/reranker/huggingface_reranker.py +147 -0
  114. agentrun_mem0/reranker/llm_reranker.py +142 -0
  115. agentrun_mem0/reranker/sentence_transformer_reranker.py +107 -0
  116. agentrun_mem0/reranker/zero_entropy_reranker.py +96 -0
  117. agentrun_mem0/utils/factory.py +283 -0
  118. agentrun_mem0/utils/gcp_auth.py +167 -0
  119. agentrun_mem0/vector_stores/__init__.py +0 -0
  120. agentrun_mem0/vector_stores/alibabacloud_mysql.py +547 -0
  121. agentrun_mem0/vector_stores/aliyun_tablestore.py +252 -0
  122. agentrun_mem0/vector_stores/azure_ai_search.py +396 -0
  123. agentrun_mem0/vector_stores/azure_mysql.py +463 -0
  124. agentrun_mem0/vector_stores/baidu.py +368 -0
  125. agentrun_mem0/vector_stores/base.py +58 -0
  126. agentrun_mem0/vector_stores/chroma.py +332 -0
  127. agentrun_mem0/vector_stores/configs.py +67 -0
  128. agentrun_mem0/vector_stores/databricks.py +761 -0
  129. agentrun_mem0/vector_stores/elasticsearch.py +237 -0
  130. agentrun_mem0/vector_stores/faiss.py +479 -0
  131. agentrun_mem0/vector_stores/langchain.py +180 -0
  132. agentrun_mem0/vector_stores/milvus.py +250 -0
  133. agentrun_mem0/vector_stores/mongodb.py +310 -0
  134. agentrun_mem0/vector_stores/neptune_analytics.py +467 -0
  135. agentrun_mem0/vector_stores/opensearch.py +292 -0
  136. agentrun_mem0/vector_stores/pgvector.py +404 -0
  137. agentrun_mem0/vector_stores/pinecone.py +382 -0
  138. agentrun_mem0/vector_stores/qdrant.py +270 -0
  139. agentrun_mem0/vector_stores/redis.py +295 -0
  140. agentrun_mem0/vector_stores/s3_vectors.py +176 -0
  141. agentrun_mem0/vector_stores/supabase.py +237 -0
  142. agentrun_mem0/vector_stores/upstash_vector.py +293 -0
  143. agentrun_mem0/vector_stores/valkey.py +824 -0
  144. agentrun_mem0/vector_stores/vertex_ai_vector_search.py +635 -0
  145. agentrun_mem0/vector_stores/weaviate.py +343 -0
  146. agentrun_mem0ai-0.0.11.data/data/README.md +205 -0
  147. agentrun_mem0ai-0.0.11.dist-info/METADATA +277 -0
  148. agentrun_mem0ai-0.0.11.dist-info/RECORD +150 -0
  149. agentrun_mem0ai-0.0.11.dist-info/WHEEL +4 -0
  150. agentrun_mem0ai-0.0.11.dist-info/licenses/LICENSE +201 -0
agentrun_mem0/llms/ollama.py
@@ -0,0 +1,117 @@
+from typing import Dict, List, Optional, Union
+
+try:
+    from ollama import Client
+except ImportError:
+    raise ImportError("The 'ollama' library is required. Please install it using 'pip install ollama'.")
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.configs.llms.ollama import OllamaConfig
+from agentrun_mem0.llms.base import LLMBase
+
+
+class OllamaLLM(LLMBase):
+    def __init__(self, config: Optional[Union[BaseLlmConfig, OllamaConfig, Dict]] = None):
+        # Convert to OllamaConfig if needed
+        if config is None:
+            config = OllamaConfig()
+        elif isinstance(config, dict):
+            config = OllamaConfig(**config)
+        elif isinstance(config, BaseLlmConfig) and not isinstance(config, OllamaConfig):
+            # Convert BaseLlmConfig to OllamaConfig
+            config = OllamaConfig(
+                model=config.model,
+                temperature=config.temperature,
+                api_key=config.api_key,
+                max_tokens=config.max_tokens,
+                top_p=config.top_p,
+                top_k=config.top_k,
+                enable_vision=config.enable_vision,
+                vision_details=config.vision_details,
+                http_client_proxies=config.http_client,
+            )
+
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "llama3.1:70b"
+
+        self.client = Client(host=self.config.ollama_base_url)
+
+    def _parse_response(self, response, tools):
+        """
+        Process the response based on whether tools are used or not.
+
+        Args:
+            response: The raw response from API.
+            tools: The list of tools provided in the request.
+
+        Returns:
+            str or dict: The processed response.
+        """
+        # Get the content from response
+        if isinstance(response, dict):
+            content = response["message"]["content"]
+        else:
+            content = response.message.content
+
+        if tools:
+            processed_response = {
+                "content": content,
+                "tool_calls": [],
+            }
+
+            # Ollama doesn't support tool calls in the same way, so we return the content
+            return processed_response
+        else:
+            return content
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format=None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+        **kwargs,
+    ):
+        """
+        Generate a response based on the given messages using Ollama.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response. Defaults to "text".
+            tools (list, optional): List of tools that the model can call. Defaults to None.
+            tool_choice (str, optional): Tool choice method. Defaults to "auto".
+            **kwargs: Additional Ollama-specific parameters.
+
+        Returns:
+            str: The generated response.
+        """
+        # Build parameters for Ollama
+        params = {
+            "model": self.config.model,
+            "messages": messages,
+        }
+
+        # Handle JSON response format by using Ollama's native format parameter
+        if response_format and response_format.get("type") == "json_object":
+            params["format"] = "json"
+            # Also add JSON format instruction to the last message as a fallback
+            if messages and messages[-1]["role"] == "user":
+                messages[-1]["content"] += "\n\nPlease respond with valid JSON only."
+            else:
+                messages.append({"role": "user", "content": "Please respond with valid JSON only."})
+
+        # Add options for Ollama (temperature, num_predict, top_p)
+        options = {
+            "temperature": self.config.temperature,
+            "num_predict": self.config.max_tokens,
+            "top_p": self.config.top_p,
+        }
+        params["options"] = options
+
+        # Remove OpenAI-specific parameters that Ollama doesn't support
+        params.pop("max_tokens", None)  # Ollama uses different parameter names
+
+        response = self.client.chat(**params)
+        return self._parse_response(response, tools)
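The ollama.py provider adapts Ollama's chat endpoint to the shared LLMBase interface: max_tokens is translated into Ollama's num_predict option, and JSON mode is emulated via the native format="json" parameter plus a fallback prompt instruction. A minimal usage sketch (not from the package; it assumes a reachable local Ollama server and that OllamaConfig accepts model and temperature keys):

```python
from agentrun_mem0.llms.ollama import OllamaLLM

# Dict configs are converted to OllamaConfig in __init__ (fields assumed).
llm = OllamaLLM(config={"model": "llama3.1:70b", "temperature": 0.1})

# JSON mode: sets Ollama's format="json" and appends a
# "respond with valid JSON" instruction to the last user message.
reply = llm.generate_response(
    messages=[{"role": "user", "content": "List three colors."}],
    response_format={"type": "json_object"},
)
print(reply)  # a JSON string produced by the model
```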
agentrun_mem0/llms/openai.py
@@ -0,0 +1,147 @@
+import json
+import logging
+import os
+from typing import Dict, List, Optional, Union
+
+from openai import OpenAI
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.configs.llms.openai import OpenAIConfig
+from agentrun_mem0.llms.base import LLMBase
+from agentrun_mem0.memory.utils import extract_json
+
+
+class OpenAILLM(LLMBase):
+    def __init__(self, config: Optional[Union[BaseLlmConfig, OpenAIConfig, Dict]] = None):
+        # Convert to OpenAIConfig if needed
+        if config is None:
+            config = OpenAIConfig()
+        elif isinstance(config, dict):
+            config = OpenAIConfig(**config)
+        elif isinstance(config, BaseLlmConfig) and not isinstance(config, OpenAIConfig):
+            # Convert BaseLlmConfig to OpenAIConfig
+            config = OpenAIConfig(
+                model=config.model,
+                temperature=config.temperature,
+                api_key=config.api_key,
+                max_tokens=config.max_tokens,
+                top_p=config.top_p,
+                top_k=config.top_k,
+                enable_vision=config.enable_vision,
+                vision_details=config.vision_details,
+                http_client_proxies=config.http_client,
+            )
+
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "gpt-4.1-nano-2025-04-14"
+
+        if os.environ.get("OPENROUTER_API_KEY"):  # Use OpenRouter
+            self.client = OpenAI(
+                api_key=os.environ.get("OPENROUTER_API_KEY"),
+                base_url=self.config.openrouter_base_url
+                or os.getenv("OPENROUTER_API_BASE")
+                or "https://openrouter.ai/api/v1",
+            )
+        else:
+            api_key = self.config.api_key or os.getenv("OPENAI_API_KEY")
+            base_url = self.config.openai_base_url or os.getenv("OPENAI_BASE_URL") or "https://api.openai.com/v1"
+
+            self.client = OpenAI(api_key=api_key, base_url=base_url)
+
+    def _parse_response(self, response, tools):
+        """
+        Process the response based on whether tools are used or not.
+
+        Args:
+            response: The raw response from API.
+            tools: The list of tools provided in the request.
+
+        Returns:
+            str or dict: The processed response.
+        """
+        if tools:
+            processed_response = {
+                "content": response.choices[0].message.content,
+                "tool_calls": [],
+            }
+
+            if response.choices[0].message.tool_calls:
+                for tool_call in response.choices[0].message.tool_calls:
+                    processed_response["tool_calls"].append(
+                        {
+                            "name": tool_call.function.name,
+                            "arguments": json.loads(extract_json(tool_call.function.arguments)),
+                        }
+                    )
+
+            return processed_response
+        else:
+            return response.choices[0].message.content
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format=None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+        **kwargs,
+    ):
+        """
+        Generate a JSON response based on the given messages using OpenAI.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response. Defaults to "text".
+            tools (list, optional): List of tools that the model can call. Defaults to None.
+            tool_choice (str, optional): Tool choice method. Defaults to "auto".
+            **kwargs: Additional OpenAI-specific parameters.
+
+        Returns:
+            json: The generated response.
+        """
+        params = self._get_supported_params(messages=messages, **kwargs)
+
+        params.update({
+            "model": self.config.model,
+            "messages": messages,
+        })
+
+        if os.getenv("OPENROUTER_API_KEY"):
+            openrouter_params = {}
+            if self.config.models:
+                openrouter_params["models"] = self.config.models
+                openrouter_params["route"] = self.config.route
+                params.pop("model")
+
+            if self.config.site_url and self.config.app_name:
+                extra_headers = {
+                    "HTTP-Referer": self.config.site_url,
+                    "X-Title": self.config.app_name,
+                }
+                openrouter_params["extra_headers"] = extra_headers
+
+            params.update(**openrouter_params)
+
+        else:
+            openai_specific_generation_params = ["store"]
+            for param in openai_specific_generation_params:
+                if hasattr(self.config, param):
+                    params[param] = getattr(self.config, param)
+
+        if response_format:
+            params["response_format"] = response_format
+        if tools:  # TODO: Remove tools if no issues found with new memory addition logic
+            params["tools"] = tools
+            params["tool_choice"] = tool_choice
+        response = self.client.chat.completions.create(**params)
+        parsed_response = self._parse_response(response, tools)
+        if self.config.response_callback:
+            try:
+                self.config.response_callback(self, response, params)
+            except Exception as e:
+                # Log error but don't propagate
+                logging.error(f"Error due to callback: {e}")
+                pass
+        return parsed_response
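openai.py selects its backend at construction time: if OPENROUTER_API_KEY is set, all traffic goes through OpenRouter; otherwise the standard OpenAI endpoint is used. A hedged sketch of both paths (the model names and key values below are illustrative, and dict configs are assumed to map onto OpenAIConfig fields):

```python
import os

from agentrun_mem0.llms.openai import OpenAILLM

# Standard path: the key resolves from the config or OPENAI_API_KEY.
llm = OpenAILLM(config={"model": "gpt-4.1-nano-2025-04-14", "temperature": 0.0})
text = llm.generate_response(
    messages=[{"role": "user", "content": "Summarize this diff in one sentence."}]
)

# OpenRouter path: the presence of this variable at construction time is the
# whole switch (see __init__ above); no other configuration is required.
os.environ["OPENROUTER_API_KEY"] = "sk-or-..."  # hypothetical key
routed = OpenAILLM(config={"model": "openai/gpt-4o-mini"})
```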
agentrun_mem0/llms/openai_structured.py
@@ -0,0 +1,52 @@
+import os
+from typing import Dict, List, Optional
+
+from openai import OpenAI
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.llms.base import LLMBase
+
+
+class OpenAIStructuredLLM(LLMBase):
+    def __init__(self, config: Optional[BaseLlmConfig] = None):
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "gpt-4o-2024-08-06"
+
+        api_key = self.config.api_key or os.getenv("OPENAI_API_KEY")
+        base_url = self.config.openai_base_url or os.getenv("OPENAI_API_BASE") or "https://api.openai.com/v1"
+        self.client = OpenAI(api_key=api_key, base_url=base_url)
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format: Optional[str] = None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+    ) -> str:
+        """
+        Generate a response based on the given messages using OpenAI.
+
+        Args:
+            messages (List[Dict[str, str]]): A list of dictionaries, each containing a 'role' and 'content' key.
+            response_format (Optional[str]): The desired format of the response. Defaults to None.
+            tools (Optional[List[Dict]]): List of tools that the model can call. Defaults to None.
+            tool_choice (str): Tool choice method. Defaults to "auto".
+
+        Returns:
+            str: The generated response.
+        """
+        params = {
+            "model": self.config.model,
+            "messages": messages,
+            "temperature": self.config.temperature,
+        }
+
+        if response_format:
+            params["response_format"] = response_format
+        if tools:
+            params["tools"] = tools
+            params["tool_choice"] = tool_choice
+
+        response = self.client.beta.chat.completions.parse(**params)
+        return response.choices[0].message.content
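openai_structured.py routes requests through the OpenAI SDK's beta parse endpoint, so response_format can carry a schema rather than plain text. A sketch assuming the installed openai SDK supports beta.chat.completions.parse with a Pydantic class (the type hint above says Optional[str], but parse also accepts a model class):

```python
from typing import List

from pydantic import BaseModel

from agentrun_mem0.configs.llms.base import BaseLlmConfig
from agentrun_mem0.llms.openai_structured import OpenAIStructuredLLM


class Facts(BaseModel):
    facts: List[str]


llm = OpenAIStructuredLLM(BaseLlmConfig(model="gpt-4o-2024-08-06"))
raw = llm.generate_response(
    messages=[{"role": "user", "content": "Extract facts: Alice lives in Oslo."}],
    response_format=Facts,
)
# raw is the JSON string content; validate it with Facts.model_validate_json(raw).
```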
agentrun_mem0/llms/sarvam.py
@@ -0,0 +1,89 @@
+import os
+from typing import Dict, List, Optional
+
+import requests
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.llms.base import LLMBase
+
+
+class SarvamLLM(LLMBase):
+    def __init__(self, config: Optional[BaseLlmConfig] = None):
+        super().__init__(config)
+
+        # Set default model if not provided
+        if not self.config.model:
+            self.config.model = "sarvam-m"
+
+        # Get API key from config or environment variable
+        self.api_key = self.config.api_key or os.getenv("SARVAM_API_KEY")
+
+        if not self.api_key:
+            raise ValueError(
+                "Sarvam API key is required. Set SARVAM_API_KEY environment variable or provide api_key in config."
+            )
+
+        # Set base URL - use config value or environment or default
+        self.base_url = (
+            getattr(self.config, "sarvam_base_url", None) or os.getenv("SARVAM_API_BASE") or "https://api.sarvam.ai/v1"
+        )
+
+    def generate_response(self, messages: List[Dict[str, str]], response_format=None) -> str:
+        """
+        Generate a response based on the given messages using Sarvam-M.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response.
+                Currently not used by Sarvam API.
+
+        Returns:
+            str: The generated response.
+        """
+        url = f"{self.base_url}/chat/completions"
+
+        headers = {"Authorization": f"Bearer {self.api_key}", "Content-Type": "application/json"}
+
+        # Prepare the request payload
+        params = {
+            "messages": messages,
+            "model": self.config.model if isinstance(self.config.model, str) else "sarvam-m",
+        }
+
+        # Add standard parameters that already exist in BaseLlmConfig
+        if self.config.temperature is not None:
+            params["temperature"] = self.config.temperature
+
+        if self.config.max_tokens is not None:
+            params["max_tokens"] = self.config.max_tokens
+
+        if self.config.top_p is not None:
+            params["top_p"] = self.config.top_p
+
+        # Handle Sarvam-specific parameters if model is passed as dict
+        if isinstance(self.config.model, dict):
+            # Extract model name
+            params["model"] = self.config.model.get("name", "sarvam-m")
+
+            # Add Sarvam-specific parameters
+            sarvam_specific_params = ["reasoning_effort", "frequency_penalty", "presence_penalty", "seed", "stop", "n"]
+
+            for param in sarvam_specific_params:
+                if param in self.config.model:
+                    params[param] = self.config.model[param]
+
+        try:
+            response = requests.post(url, headers=headers, json=params, timeout=30)
+            response.raise_for_status()
+
+            result = response.json()
+
+            if "choices" in result and len(result["choices"]) > 0:
+                return result["choices"][0]["message"]["content"]
+            else:
+                raise ValueError("No response choices found in Sarvam API response")
+
+        except requests.exceptions.RequestException as e:
+            raise RuntimeError(f"Sarvam API request failed: {e}")
+        except KeyError as e:
+            raise ValueError(f"Unexpected response format from Sarvam API: {e}")
agentrun_mem0/llms/together.py
@@ -0,0 +1,88 @@
+import json
+import os
+from typing import Dict, List, Optional
+
+try:
+    from together import Together
+except ImportError:
+    raise ImportError("The 'together' library is required. Please install it using 'pip install together'.")
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.llms.base import LLMBase
+from agentrun_mem0.memory.utils import extract_json
+
+
+class TogetherLLM(LLMBase):
+    def __init__(self, config: Optional[BaseLlmConfig] = None):
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "mistralai/Mixtral-8x7B-Instruct-v0.1"
+
+        api_key = self.config.api_key or os.getenv("TOGETHER_API_KEY")
+        self.client = Together(api_key=api_key)
+
+    def _parse_response(self, response, tools):
+        """
+        Process the response based on whether tools are used or not.
+
+        Args:
+            response: The raw response from API.
+            tools: The list of tools provided in the request.
+
+        Returns:
+            str or dict: The processed response.
+        """
+        if tools:
+            processed_response = {
+                "content": response.choices[0].message.content,
+                "tool_calls": [],
+            }
+
+            if response.choices[0].message.tool_calls:
+                for tool_call in response.choices[0].message.tool_calls:
+                    processed_response["tool_calls"].append(
+                        {
+                            "name": tool_call.function.name,
+                            "arguments": json.loads(extract_json(tool_call.function.arguments)),
+                        }
+                    )
+
+            return processed_response
+        else:
+            return response.choices[0].message.content
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format=None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+    ):
+        """
+        Generate a response based on the given messages using TogetherAI.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response. Defaults to "text".
+            tools (list, optional): List of tools that the model can call. Defaults to None.
+            tool_choice (str, optional): Tool choice method. Defaults to "auto".
+
+        Returns:
+            str: The generated response.
+        """
+        params = {
+            "model": self.config.model,
+            "messages": messages,
+            "temperature": self.config.temperature,
+            "max_tokens": self.config.max_tokens,
+            "top_p": self.config.top_p,
+        }
+        if response_format:
+            params["response_format"] = response_format
+        if tools:  # TODO: Remove tools if no issues found with new memory addition logic
+            params["tools"] = tools
+            params["tool_choice"] = tool_choice
+
+        response = self.client.chat.completions.create(**params)
+        return self._parse_response(response, tools)
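together.py mirrors the OpenAI-style client, defaulting to Mixtral-8x7B-Instruct when no model is set. A minimal sketch (the key value is illustrative):

```python
from agentrun_mem0.configs.llms.base import BaseLlmConfig
from agentrun_mem0.llms.together import TogetherLLM

llm = TogetherLLM(BaseLlmConfig(api_key="tok-..."))  # or set TOGETHER_API_KEY
text = llm.generate_response(
    messages=[{"role": "user", "content": "One-sentence summary of RAG."}]
)
```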
agentrun_mem0/llms/vllm.py
@@ -0,0 +1,107 @@
+import json
+import os
+from typing import Dict, List, Optional, Union
+
+from openai import OpenAI
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.configs.llms.vllm import VllmConfig
+from agentrun_mem0.llms.base import LLMBase
+from agentrun_mem0.memory.utils import extract_json
+
+
+class VllmLLM(LLMBase):
+    def __init__(self, config: Optional[Union[BaseLlmConfig, VllmConfig, Dict]] = None):
+        # Convert to VllmConfig if needed
+        if config is None:
+            config = VllmConfig()
+        elif isinstance(config, dict):
+            config = VllmConfig(**config)
+        elif isinstance(config, BaseLlmConfig) and not isinstance(config, VllmConfig):
+            # Convert BaseLlmConfig to VllmConfig
+            config = VllmConfig(
+                model=config.model,
+                temperature=config.temperature,
+                api_key=config.api_key,
+                max_tokens=config.max_tokens,
+                top_p=config.top_p,
+                top_k=config.top_k,
+                enable_vision=config.enable_vision,
+                vision_details=config.vision_details,
+                http_client_proxies=config.http_client,
+            )
+
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "Qwen/Qwen2.5-32B-Instruct"
+
+        self.config.api_key = self.config.api_key or os.getenv("VLLM_API_KEY") or "vllm-api-key"
+        base_url = self.config.vllm_base_url or os.getenv("VLLM_BASE_URL")
+        self.client = OpenAI(api_key=self.config.api_key, base_url=base_url)
+
+    def _parse_response(self, response, tools):
+        """
+        Process the response based on whether tools are used or not.
+
+        Args:
+            response: The raw response from API.
+            tools: The list of tools provided in the request.
+
+        Returns:
+            str or dict: The processed response.
+        """
+        if tools:
+            processed_response = {
+                "content": response.choices[0].message.content,
+                "tool_calls": [],
+            }
+
+            if response.choices[0].message.tool_calls:
+                for tool_call in response.choices[0].message.tool_calls:
+                    processed_response["tool_calls"].append(
+                        {
+                            "name": tool_call.function.name,
+                            "arguments": json.loads(extract_json(tool_call.function.arguments)),
+                        }
+                    )
+
+            return processed_response
+        else:
+            return response.choices[0].message.content
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format=None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+        **kwargs,
+    ):
+        """
+        Generate a response based on the given messages using vLLM.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response. Defaults to "text".
+            tools (list, optional): List of tools that the model can call. Defaults to None.
+            tool_choice (str, optional): Tool choice method. Defaults to "auto".
+            **kwargs: Additional vLLM-specific parameters.
+
+        Returns:
+            str: The generated response.
+        """
+        params = self._get_supported_params(messages=messages, **kwargs)
+        params.update(
+            {
+                "model": self.config.model,
+                "messages": messages,
+            }
+        )
+
+        if tools:
+            params["tools"] = tools
+            params["tool_choice"] = tool_choice
+
+        response = self.client.chat.completions.create(**params)
+        return self._parse_response(response, tools)
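vllm.py talks to a vLLM server through its OpenAI-compatible API: the base URL must come from the config or VLLM_BASE_URL, and a placeholder API key is filled in when none is provided (vLLM servers often don't require one). A sketch assuming a server is already running locally:

```python
import os

from agentrun_mem0.llms.vllm import VllmLLM

os.environ["VLLM_BASE_URL"] = "http://localhost:8000/v1"  # hypothetical server

llm = VllmLLM(config={"model": "Qwen/Qwen2.5-32B-Instruct"})
text = llm.generate_response(
    messages=[{"role": "user", "content": "Say hello."}]
)
```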
agentrun_mem0/llms/xai.py
@@ -0,0 +1,52 @@
+import os
+from typing import Dict, List, Optional
+
+from openai import OpenAI
+
+from agentrun_mem0.configs.llms.base import BaseLlmConfig
+from agentrun_mem0.llms.base import LLMBase
+
+
+class XAILLM(LLMBase):
+    def __init__(self, config: Optional[BaseLlmConfig] = None):
+        super().__init__(config)
+
+        if not self.config.model:
+            self.config.model = "grok-2-latest"
+
+        api_key = self.config.api_key or os.getenv("XAI_API_KEY")
+        base_url = self.config.xai_base_url or os.getenv("XAI_API_BASE") or "https://api.x.ai/v1"
+        self.client = OpenAI(api_key=api_key, base_url=base_url)
+
+    def generate_response(
+        self,
+        messages: List[Dict[str, str]],
+        response_format=None,
+        tools: Optional[List[Dict]] = None,
+        tool_choice: str = "auto",
+    ):
+        """
+        Generate a response based on the given messages using XAI.
+
+        Args:
+            messages (list): List of message dicts containing 'role' and 'content'.
+            response_format (str or object, optional): Format of the response. Defaults to "text".
+            tools (list, optional): List of tools that the model can call. Defaults to None.
+            tool_choice (str, optional): Tool choice method. Defaults to "auto".
+
+        Returns:
+            str: The generated response.
+        """
+        params = {
+            "model": self.config.model,
+            "messages": messages,
+            "temperature": self.config.temperature,
+            "max_tokens": self.config.max_tokens,
+            "top_p": self.config.top_p,
+        }
+
+        if response_format:
+            params["response_format"] = response_format
+
+        response = self.client.chat.completions.create(**params)
+        return response.choices[0].message.content
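xai.py is the thinnest wrapper of the set: it reuses the OpenAI client against api.x.ai and, as the body shows, accepts tools and tool_choice for interface parity without forwarding them to the API. A minimal sketch:

```python
from agentrun_mem0.configs.llms.base import BaseLlmConfig
from agentrun_mem0.llms.xai import XAILLM

llm = XAILLM(BaseLlmConfig(model="grok-2-latest"))  # key from XAI_API_KEY
text = llm.generate_response(
    messages=[{"role": "user", "content": "What is Grok?"}]
)
```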