mem-llm 1.2.0__py3-none-any.whl → 1.3.1__py3-none-any.whl

This diff shows the content of publicly available package versions as published to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in that public registry.

Potentially problematic release: this version of mem-llm has been flagged as possibly problematic; see the registry page for details.

mem_llm/llm_client_factory.py ADDED
@@ -0,0 +1,277 @@
+ """
+ LLM Client Factory
+ ==================
+ 
+ Factory pattern for creating LLM clients.
+ Supports multiple backends with automatic detection.
+ 
+ Supported Backends:
+ - Ollama: Local Ollama service
+ - LM Studio: Local LM Studio server
+ - Gemini: Google Gemini API (cloud)
+ 
+ Usage:
+     # Create specific backend
+     client = LLMClientFactory.create('ollama', model='llama3')
+ 
+     # Auto-detect available backend
+     client = LLMClientFactory.auto_detect()
+ 
+     # Get all available backends
+     backends = LLMClientFactory.get_available_backends()
+ 
+ Author: C. Emre Karataş
+ Version: 1.3.0
+ """
+ 
+ from typing import Optional, Dict, List, Any
+ import logging
+ 
+ from .clients.ollama_client import OllamaClient
+ from .clients.lmstudio_client import LMStudioClient
+ from .clients.gemini_client import GeminiClient
+ from .base_llm_client import BaseLLMClient
+ 
+ 
+ class LLMClientFactory:
+     """
+     Factory for creating LLM clients
+ 
+     Provides unified interface for creating different LLM backends.
+     Supports auto-detection of available local services.
+     """
+ 
+     # Registry of supported backends
+     BACKENDS = {
+         'ollama': {
+             'class': OllamaClient,
+             'description': 'Local Ollama service',
+             'type': 'local',
+             'default_url': 'http://localhost:11434',
+             'default_model': 'granite4:tiny-h'
+         },
+         'lmstudio': {
+             'class': LMStudioClient,
+             'description': 'LM Studio local server (OpenAI-compatible)',
+             'type': 'local',
+             'default_url': 'http://localhost:1234',
+             'default_model': 'local-model'
+         },
+         'gemini': {
+             'class': GeminiClient,
+             'description': 'Google Gemini API (cloud)',
+             'type': 'cloud',
+             'default_model': 'gemini-2.5-flash',
+             'requires_api_key': True
+         }
+     }
+ 
+     @staticmethod
+     def create(backend: str, model: Optional[str] = None, **kwargs) -> BaseLLMClient:
+         """
+         Create LLM client for specified backend
+ 
+         Args:
+             backend: Backend name ('ollama', 'lmstudio', 'gemini')
+             model: Model name (uses default if None)
+             **kwargs: Backend-specific configuration
+                 - base_url: API endpoint (for local backends)
+                 - api_key: API key (for cloud backends)
+                 - temperature: Default temperature
+                 - max_tokens: Default max tokens
+ 
+         Returns:
+             Configured LLM client
+ 
+         Raises:
+             ValueError: If backend is not supported
+ 
+         Examples:
+             # Ollama
+             client = LLMClientFactory.create('ollama', model='llama3')
+ 
+             # LM Studio
+             client = LLMClientFactory.create(
+                 'lmstudio',
+                 model='llama-3-8b',
+                 base_url='http://localhost:1234'
+             )
+ 
+             # Gemini
+             client = LLMClientFactory.create(
+                 'gemini',
+                 model='gemini-2.5-flash',
+                 api_key='your-api-key'
+             )
+         """
+         backend = backend.lower()
+ 
+         if backend not in LLMClientFactory.BACKENDS:
+             available = ', '.join(LLMClientFactory.BACKENDS.keys())
+             raise ValueError(
+                 f"Unsupported backend: '{backend}'. "
+                 f"Available backends: {available}"
+             )
+ 
+         backend_info = LLMClientFactory.BACKENDS[backend]
+         client_class = backend_info['class']
+ 
+         # Use default model if not specified
+         if not model:
+             model = backend_info.get('default_model')
+ 
+         # Add default base_url for local backends if not provided
+         if backend_info['type'] == 'local' and 'base_url' not in kwargs:
+             kwargs['base_url'] = backend_info.get('default_url')
+ 
+         # Create and return client
+         try:
+             return client_class(model=model, **kwargs)
+         except Exception as e:
+             raise ValueError(f"Failed to create {backend} client: {str(e)}") from e
+ 
+     @staticmethod
+     def auto_detect(preferred_backends: Optional[List[str]] = None) -> Optional[BaseLLMClient]:
+         """
+         Auto-detect available LLM service
+ 
+         Checks common local services and returns the first available one.
+         Useful for applications that should work with any available backend.
+ 
+         Args:
+             preferred_backends: List of backends to check in order
+                 (if None, checks all in default order)
+ 
+         Returns:
+             First available LLM client, or None if none available
+ 
+         Example:
+             # Try to find any available backend
+             client = LLMClientFactory.auto_detect()
+             if client:
+                 print(f"Using {client.get_info()['backend']}")
+             else:
+                 print("No LLM service found")
+ 
+             # Try specific backends in order
+             client = LLMClientFactory.auto_detect(['lmstudio', 'ollama'])
+         """
+         logger = logging.getLogger('LLMClientFactory')
+ 
+         # Default check order: local services first
+         if preferred_backends is None:
+             preferred_backends = ['ollama', 'lmstudio']
+ 
+         for backend_name in preferred_backends:
+             if backend_name not in LLMClientFactory.BACKENDS:
+                 logger.warning(f"Unknown backend in auto-detect: {backend_name}")
+                 continue
+ 
+             backend_info = LLMClientFactory.BACKENDS[backend_name]
+ 
+             # Skip cloud services in auto-detect (they require API keys)
+             if backend_info['type'] == 'cloud':
+                 logger.debug(f"Skipping cloud backend in auto-detect: {backend_name}")
+                 continue
+ 
+             try:
+                 # Try to create client with defaults
+                 client = LLMClientFactory.create(backend_name)
+ 
+                 # Check if service is actually running
+                 if client.check_connection():
+                     logger.info(f"✅ Detected {backend_name} at {backend_info.get('default_url')}")
+                     return client
+                 else:
+                     logger.debug(f"Service not running: {backend_name}")
+ 
+             except Exception as e:
+                 logger.debug(f"Failed to detect {backend_name}: {e}")
+                 continue
+ 
+         logger.warning("⚠️ No local LLM service detected")
+         return None
+ 
+     @staticmethod
+     def get_available_backends() -> List[Dict[str, Any]]:
+         """
+         Get list of all supported backends with their info
+ 
+         Returns:
+             List of backend information dictionaries
+ 
+         Example:
+             backends = LLMClientFactory.get_available_backends()
+             for backend in backends:
+                 print(f"{backend['name']}: {backend['description']}")
+         """
+         result = []
+ 
+         for name, info in LLMClientFactory.BACKENDS.items():
+             backend_dict = {
+                 'name': name,
+                 'description': info['description'],
+                 'type': info['type'],
+                 'default_model': info.get('default_model'),
+                 'requires_api_key': info.get('requires_api_key', False)
+             }
+ 
+             if info['type'] == 'local':
+                 backend_dict['default_url'] = info.get('default_url')
+ 
+             result.append(backend_dict)
+ 
+         return result
+ 
+     @staticmethod
+     def check_backend_availability(backend: str, **kwargs) -> bool:
+         """
+         Check if a specific backend is available
+ 
+         Args:
+             backend: Backend name
+             **kwargs: Configuration for creating the client
+ 
+         Returns:
+             True if backend is available and responding
+ 
+         Example:
+             # Check if Ollama is running
+             if LLMClientFactory.check_backend_availability('ollama'):
+                 print("Ollama is available")
+ 
+             # Check custom LM Studio URL
+             if LLMClientFactory.check_backend_availability(
+                 'lmstudio',
+                 base_url='http://localhost:5000'
+             ):
+                 print("LM Studio is available")
+         """
+         try:
+             client = LLMClientFactory.create(backend, **kwargs)
+             return client.check_connection()
+         except Exception:
+             return False
+ 
+     @staticmethod
+     def get_backend_info(backend: str) -> Dict[str, Any]:
+         """
+         Get information about a specific backend
+ 
+         Args:
+             backend: Backend name
+ 
+         Returns:
+             Backend information dictionary
+ 
+         Raises:
+             ValueError: If backend not found
+         """
+         if backend not in LLMClientFactory.BACKENDS:
+             raise ValueError(f"Unknown backend: {backend}")
+ 
+         info = LLMClientFactory.BACKENDS[backend].copy()
+         # Remove class reference for JSON serialization
+         info.pop('class', None)
+         return info
+ 
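For reference, a minimal usage sketch of the factory module added above. This is not part of the package diff; it assumes the module is importable as mem_llm.llm_client_factory (matching the relative import in mem_agent.py below) and that a local Ollama or LM Studio instance is running. The model name is a placeholder.

    # Hypothetical usage sketch based on the docstrings above.
    from mem_llm.llm_client_factory import LLMClientFactory

    # Explicit backend: 'llama3' stands in for whatever model you have pulled locally.
    client = LLMClientFactory.create('ollama', model='llama3')

    # Or probe local services (Ollama first, then LM Studio) and use the first that responds.
    client = LLMClientFactory.auto_detect()
    if client is None:
        raise SystemExit("No local LLM service detected")
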
mem_llm/mem_agent.py CHANGED
@@ -37,7 +37,9 @@ import os
 
  # Core dependencies
  from .memory_manager import MemoryManager
- from .llm_client import OllamaClient
+ from .llm_client import OllamaClient  # Backward compatibility
+ from .llm_client_factory import LLMClientFactory
+ from .base_llm_client import BaseLLMClient
 
  # Advanced features (optional)
  try:
@@ -61,25 +63,48 @@ class MemAgent:
 
      def __init__(self,
                   model: str = "granite4:tiny-h",
+                  backend: str = "ollama",
                   config_file: Optional[str] = None,
                   use_sql: bool = True,
                   memory_dir: Optional[str] = None,
                   db_path: Optional[str] = None,
                   load_knowledge_base: bool = True,
                   ollama_url: str = "http://localhost:11434",
+                  base_url: Optional[str] = None,
+                  api_key: Optional[str] = None,
+                  auto_detect_backend: bool = False,
                   check_connection: bool = False,
-                  enable_security: bool = False):
+                  enable_security: bool = False,
+                  **llm_kwargs):
          """
          Args:
              model: LLM model to use
+             backend: LLM backend ('ollama', 'lmstudio', 'gemini') - NEW in v1.3.0
              config_file: Configuration file (optional)
              use_sql: Use SQL database (True) or JSON (False)
              memory_dir: Memory directory (for JSON mode or if db_path not specified)
              db_path: SQLite database path (for SQL mode, e.g., ":memory:" or "path/to/db.db")
              load_knowledge_base: Automatically load knowledge base
-             ollama_url: Ollama API URL
-             check_connection: Verify Ollama connection on startup (default: False)
+             ollama_url: Ollama API URL (backward compatibility, use base_url instead)
+             base_url: Backend API URL (for local backends) - NEW in v1.3.0
+             api_key: API key (for cloud backends like Gemini) - NEW in v1.3.0
+             auto_detect_backend: Auto-detect available LLM backend - NEW in v1.3.0
+             check_connection: Verify LLM connection on startup (default: False)
              enable_security: Enable prompt injection protection (v1.1.0+, default: False for backward compatibility)
+             **llm_kwargs: Additional backend-specific parameters
+ 
+         Examples:
+             # Default Ollama
+             agent = MemAgent()
+ 
+             # LM Studio
+             agent = MemAgent(backend='lmstudio', model='llama-3-8b')
+ 
+             # Gemini
+             agent = MemAgent(backend='gemini', model='gemini-1.5-flash', api_key='your-key')
+ 
+             # Auto-detect
+             agent = MemAgent(auto_detect_backend=True)
          """
 
          # Setup logging first
@@ -158,48 +183,109 @@ class MemAgent:
          # LLM client
          self.model = model # Store model name
          self.use_sql = use_sql # Store SQL usage flag
-         self.llm = OllamaClient(model, ollama_url)
+ 
+         # Initialize LLM client (v1.3.0: Multi-backend support)
+         # Prepare backend configuration
+         llm_config = llm_kwargs.copy()
+ 
+         # Handle backward compatibility: ollama_url -> base_url
+         if base_url is None and backend == "ollama":
+             base_url = ollama_url
+ 
+         # Add base_url for local backends
+         if base_url and backend in ['ollama', 'lmstudio']:
+             llm_config['base_url'] = base_url
+ 
+         # Add api_key for cloud backends
+         if api_key and backend in ['gemini']:
+             llm_config['api_key'] = api_key
+ 
+         # Auto-detect backend if requested
+         if auto_detect_backend:
+             self.logger.info("🔍 Auto-detecting available LLM backend...")
+             self.llm = LLMClientFactory.auto_detect()
+             if self.llm:
+                 detected_backend = self.llm.__class__.__name__
+                 self.logger.info(f"✅ Detected and using: {detected_backend}")
+             else:
+                 self.logger.error("❌ No LLM backend available.")
+                 raise RuntimeError(
+                     "No LLM backend detected. Please start a local LLM service (Ollama/LM Studio) "
+                     "or provide Gemini API key."
+                 )
+         else:
+             # Create client using factory
+             try:
+                 self.llm = LLMClientFactory.create(
+                     backend=backend,
+                     model=model,
+                     **llm_config
+                 )
+                 self.logger.info(f"✅ Initialized {backend} backend with model: {model}")
+             except Exception as e:
+                 self.logger.error(f"❌ Failed to initialize {backend} backend: {e}")
+                 raise
 
          # Optional connection check on startup
          if check_connection:
-             self.logger.info("Checking Ollama connection...")
+             backend_name = backend if not auto_detect_backend else "LLM service"
+             self.logger.info(f"Checking {backend_name} connection...")
              if not self.llm.check_connection():
-                 error_msg = (
-                     "❌ ERROR: Cannot connect to Ollama service!\n"
-                     " \n"
-                     " Solutions:\n"
-                     " 1. Start Ollama: ollama serve\n"
-                     " 2. Check if Ollama is running: http://localhost:11434\n"
-                     " 3. Verify ollama_url parameter is correct\n"
-                     " \n"
-                     " To skip this check, use: MemAgent(check_connection=False)"
-                 )
+                 error_msg = f"❌ ERROR: Cannot connect to {backend_name}!\n"
+ 
+                 if backend == "ollama":
+                     error_msg += (
+                         " \n"
+                         " Solutions:\n"
+                         " 1. Start Ollama: ollama serve\n"
+                         " 2. Check if Ollama is running: http://localhost:11434\n"
+                         " 3. Verify base_url parameter is correct\n"
+                     )
+                 elif backend == "lmstudio":
+                     error_msg += (
+                         " \n"
+                         " Solutions:\n"
+                         " 1. Start LM Studio\n"
+                         " 2. Load a model in LM Studio\n"
+                         " 3. Start local server (default: http://localhost:1234)\n"
+                         " 4. Verify base_url parameter is correct\n"
+                     )
+                 elif backend == "gemini":
+                     error_msg += (
+                         " \n"
+                         " Solutions:\n"
+                         " 1. Check your internet connection\n"
+                         " 2. Verify Gemini API key is correct\n"
+                         " 3. Check API quota/billing status\n"
+                         " Get key: https://makersuite.google.com/app/apikey\n"
+                     )
+ 
+                 error_msg += " \n To skip this check, use: MemAgent(check_connection=False)"
                  self.logger.error(error_msg)
-                 raise ConnectionError("Ollama service not available")
+                 raise ConnectionError(f"{backend_name} not available")
 
-             # Check if model exists
-             available_models = self.llm.list_models()
-             if model not in available_models:
-                 error_msg = (
-                     f"❌ ERROR: Model '{model}' not found!\n"
-                     f" \n"
-                     f" Solutions:\n"
-                     f" 1. Download model: ollama pull {model}\n"
-                     f" 2. Use an available model: {', '.join(available_models[:3])}\n"
-                     f" \n"
-                     f" Available models: {len(available_models)} found\n"
-                     f" To skip this check, use: MemAgent(check_connection=False)"
-                 )
-                 self.logger.error(error_msg)
-                 raise ValueError(f"Model '{model}' not available")
+             # Check if model exists (for backends that support listing)
+             try:
+                 available_models = self.llm.list_models()
+                 if available_models and model not in available_models:
+                     error_msg = (
+                         f"❌ ERROR: Model '{model}' not found in {backend}!\n"
+                         f" \n"
+                         f" Available models: {', '.join(available_models[:5])}\n"
+                         f" Total: {len(available_models)} models available\n"
+                         f" \n"
+                         f" To skip this check, use: MemAgent(check_connection=False)"
+                     )
+                     self.logger.error(error_msg)
+                     raise ValueError(f"Model '{model}' not available")
+             except:
+                 # Some backends may not support list_models, skip check
+                 pass
 
-             self.logger.info(f"✅ Ollama connection verified, model '{model}' ready")
+             self.logger.info(f"✅ {backend_name} connection verified, model '{model}' ready")
 
-         self.logger.info(f"LLM client ready: {model}")
+         self.logger.info(f"LLM client ready: {model} on {backend}")
 
-         # Initialize state variables FIRST
-         self.current_user: Optional[str] = None
-         self.current_system_prompt: Optional[str] = None
 
          # Advanced features (if available)
          if ADVANCED_AVAILABLE:
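Taken together, these changes let MemAgent be constructed against any of the three backends. The sketch below is based on the docstring examples in this diff and is not part of the package itself; it assumes MemAgent is importable from the package root (otherwise import it from mem_llm.mem_agent), and the model names and API key are placeholders.

    # Hypothetical usage sketch, mirroring the new constructor parameters.
    from mem_llm import MemAgent

    agent = MemAgent()                                         # default: Ollama at http://localhost:11434
    agent = MemAgent(backend='lmstudio', model='llama-3-8b')   # LM Studio local server
    agent = MemAgent(backend='gemini',
                     model='gemini-2.5-flash',
                     api_key='your-api-key')                   # cloud backend, key required
    agent = MemAgent(auto_detect_backend=True)                 # probe local services (Ollama, LM Studio)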