mem_llm-2.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,231 @@
+ """
+ Configuration Manager
+ Reads and manages configuration from YAML file
+ """
+
+ import yaml
+ from pathlib import Path
+ from typing import Any, Dict, Optional
+ import os
+
+
+ class ConfigManager:
+     """Manages configuration file"""
+
+     def __init__(self, config_file: str = "config.yaml"):
+         """
+         Args:
+             config_file: Configuration file path
+         """
+         self.config_file = Path(config_file)
+         self.config: Dict[str, Any] = {}
+         self._load_config()
+
+     def _load_config(self) -> None:
+         """Load configuration file"""
+         if self.config_file.exists():
+             with open(self.config_file, 'r', encoding='utf-8') as f:
+                 self.config = yaml.safe_load(f) or {}
+         else:
+             # Default configuration
+             self.config = self._get_default_config()
+             self.save_config()
+
+     def _get_default_config(self) -> Dict[str, Any]:
+         """Returns default configuration"""
+         return {
+             "llm": {
+                 "model": "granite4:3b",
+                 "base_url": "http://localhost:11434",
+                 "temperature": 0.7,
+                 "max_tokens": 500
+             },
+             "memory": {
+                 "backend": "sql",
+                 "json_dir": "memories",
+                 "db_path": "memories/memories.db",
+                 "max_conversations_per_user": 1000,
+                 "auto_cleanup": True,
+                 "cleanup_after_days": 90
+             },
+             "prompt": {
+                 "template": "customer_service",
+                 "variables": {
+                     "company_name": "Our Company",
+                     "tone": "friendly and professional"
+                 },
+                 "custom_prompt": None
+             },
+             "knowledge_base": {
+                 "enabled": True,
+                 "auto_load": True,
+                 "default_kb": "ecommerce",
+                 "custom_kb_file": None,
+                 "search_limit": 5,
+                 "min_relevance_score": 0.3,
+                 "enable_vector_search": False,  # v1.3.2+ - Optional semantic search
+                 "embedding_model": "all-MiniLM-L6-v2"  # Sentence transformers model
+             },
+             "response": {
+                 "use_knowledge_base": True,
+                 "use_memory": True,
+                 "recent_conversations_limit": 5,
+                 "format": {
+                     "include_greeting": True,
+                     "include_follow_up": True,
+                     "max_length": 500
+                 }
+             },
+             "security": {
+                 "filter_sensitive_data": True,
+                 "sensitive_keywords": [
+                     "credit card", "password", "passcode", "CVV", "TR ID"
+                 ],
+                 "rate_limit": {
+                     "enabled": True,
+                     "max_requests_per_minute": 60,
+                     "max_requests_per_user_per_minute": 10
+                 }
+             },
+             "logging": {
+                 "enabled": True,
+                 "level": "INFO",
+                 "file": "mem_agent.log",
+                 "max_size_mb": 10,
+                 "backup_count": 5,
+                 "log_user_messages": True,
+                 "log_bot_responses": True,
+                 "mask_sensitive": True
+             },
+             "performance": {
+                 "enable_cache": True,
+                 "cache_ttl_seconds": 3600,
+                 "enable_parallel": False,
+                 "max_workers": 4
+             },
+             "analytics": {
+                 "enabled": True,
+                 "track_response_time": True,
+                 "track_user_satisfaction": False,
+                 "track_conversation_length": True,
+                 "export_interval_hours": 24,
+                 "export_path": "analytics"
+             }
+         }
+
+     def get(self, key_path: str, default: Any = None) -> Any:
+         """
+         Get configuration value with dot notation
+
+         Args:
+             key_path: Key path (e.g., "llm.model")
+             default: Value to return if not found
+
+         Returns:
+             Configuration value
+         """
+         keys = key_path.split('.')
+         value = self.config
+
+         for key in keys:
+             if isinstance(value, dict) and key in value:
+                 value = value[key]
+             else:
+                 return default
+
+         return value
+
+     def set(self, key_path: str, value: Any) -> None:
+         """
+         Set configuration value with dot notation
+
+         Args:
+             key_path: Key path (e.g., "llm.model")
+             value: Value to set
+         """
+         keys = key_path.split('.')
+         config = self.config
+
+         for key in keys[:-1]:
+             if key not in config or not isinstance(config[key], dict):
+                 config[key] = {}
+             config = config[key]
+
+         config[keys[-1]] = value
+
+     def save_config(self) -> None:
+         """Save configuration to file"""
+         with open(self.config_file, 'w', encoding='utf-8') as f:
+             yaml.dump(self.config, f, default_flow_style=False,
+                       allow_unicode=True, sort_keys=False)
+
+     def reload(self) -> None:
+         """Reload configuration"""
+         self._load_config()
+
+     def get_llm_config(self) -> Dict[str, Any]:
+         """Returns LLM configuration"""
+         return self.get("llm", {})
+
+     def get_memory_config(self) -> Dict[str, Any]:
+         """Returns memory configuration"""
+         return self.get("memory", {})
+
+     def get_prompt_config(self) -> Dict[str, Any]:
+         """Returns prompt configuration"""
+         return self.get("prompt", {})
+
+     def get_kb_config(self) -> Dict[str, Any]:
+         """Returns knowledge base configuration"""
+         return self.get("knowledge_base", {})
+
+     def is_kb_enabled(self) -> bool:
+         """Is knowledge base enabled?"""
+         return self.get("knowledge_base.enabled", True)
+
+     def is_memory_enabled(self) -> bool:
+         """Is memory enabled?"""
+         return self.get("response.use_memory", True)
+
+     def get_memory_backend(self) -> str:
+         """Returns memory backend type (json or sql)"""
+         return self.get("memory.backend", "sql")
+
+     def get_db_path(self) -> str:
+         """Returns database file path"""
+         return self.get("memory.db_path", "memories.db")
+
+     def get_json_dir(self) -> str:
+         """Returns JSON memory directory"""
+         return self.get("memory.json_dir", "memories")
+
+     def __repr__(self) -> str:
+         return f"ConfigManager(file='{self.config_file}')"
+
+
+ # Global instance
+ _config_manager: Optional[ConfigManager] = None
+
+
+ def get_config(config_file: str = "config.yaml") -> ConfigManager:
+     """
+     Returns global configuration manager
+
+     Args:
+         config_file: Configuration file
+
+     Returns:
+         ConfigManager instance
+     """
+     global _config_manager
+     if _config_manager is None:
+         _config_manager = ConfigManager(config_file)
+     return _config_manager
+
+
+ def reload_config() -> None:
+     """Reloads global configuration"""
+     global _config_manager
+     if _config_manager:
+         _config_manager.reload()
+
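For orientation, a minimal usage sketch of the `ConfigManager` added above. The import path is an assumption (the diff does not show the package's `__init__.py`); the rest mirrors the code in this hunk.

```python
# Import path assumed for illustration; not shown in this diff
from mem_llm import ConfigManager, get_config

config = ConfigManager("config.yaml")  # loads the file, or writes defaults if missing

# Dot-notation reads walk the nested dicts key by key
model = config.get("llm.model", "granite4:3b")
limit = config.get("memory.max_conversations_per_user", 1000)

# Dot-notation writes create intermediate dicts as needed
config.set("llm.temperature", 0.5)
config.save_config()

# Module-level singleton: repeated calls return the same instance
cfg = get_config()
assert cfg is get_config()
```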
@@ -0,0 +1,372 @@
+ """
+ Conversation Summarizer
+ =======================
+
+ Automatically summarizes long conversation histories to optimize context window usage.
+
+ Features:
+ - Summarizes last N conversations
+ - Extracts key facts and context
+ - Saves tokens by condensing history
+ - Periodic auto-summary updates
+ - User profile extraction from summaries
+
+ Usage:
+ ```python
+ from mem_llm import ConversationSummarizer
+
+ summarizer = ConversationSummarizer(llm_client)
+ summary = summarizer.summarize_conversations(conversations, user_id="alice")
+ ```
+ """
+
+ from typing import List, Dict, Optional, Any
+ from datetime import datetime
+ import json
+ import logging
+
+
+ class ConversationSummarizer:
+     """Summarizes conversation histories to optimize context"""
+
+     def __init__(self, llm_client, logger: Optional[logging.Logger] = None):
+         """
+         Initialize summarizer
+
+         Args:
+             llm_client: OllamaClient instance for generating summaries
+             logger: Logger instance (optional)
+         """
+         self.llm = llm_client
+         self.logger = logger or logging.getLogger(__name__)
+
+     def summarize_conversations(
+         self,
+         conversations: List[Dict],
+         user_id: str,
+         max_conversations: int = 20,
+         include_facts: bool = True
+     ) -> Dict[str, Any]:
+         """
+         Summarize a list of conversations
+
+         Args:
+             conversations: List of conversation dicts with user_message and bot_response
+             user_id: User identifier
+             max_conversations: Maximum number of conversations to summarize
+             include_facts: Extract key facts about the user
+
+         Returns:
+             Summary dict with text, facts, and metadata
+         """
+         if not conversations:
+             return {
+                 "summary": "No conversation history available.",
+                 "key_facts": [],
+                 "conversation_count": 0,
+                 "user_id": user_id,
+                 "generated_at": datetime.now().isoformat()
+             }
+
+         # Limit conversations
+         convs_to_summarize = conversations[-max_conversations:] if len(conversations) > max_conversations else conversations
+
+         # Build prompt
+         prompt = self._build_summary_prompt(convs_to_summarize, user_id, include_facts)
+
+         try:
+             # Generate summary
+             self.logger.info(f"Generating summary for {user_id}: {len(convs_to_summarize)} conversations")
+
+             response = self.llm.chat(
+                 messages=[{"role": "user", "content": prompt}],
+                 temperature=0.3,  # Lower temperature for consistent summaries
+                 max_tokens=500
+             )
+
+             # Parse response
+             summary_data = self._parse_summary_response(response, convs_to_summarize, user_id)
+
+             self.logger.info(f"✅ Summary generated: {len(summary_data['summary'])} chars")
+             return summary_data
+
+         except Exception as e:
+             self.logger.error(f"Summary generation failed: {e}")
+             return {
+                 "summary": f"Error generating summary: {str(e)}",
+                 "key_facts": [],
+                 "conversation_count": len(convs_to_summarize),
+                 "user_id": user_id,
+                 "generated_at": datetime.now().isoformat(),
+                 "error": str(e)
+             }
+
+     def _build_summary_prompt(
+         self,
+         conversations: List[Dict],
+         user_id: str,
+         include_facts: bool
+     ) -> str:
+         """Build the summarization prompt"""
+
+         # Format conversations
+         conv_text = ""
+         for i, conv in enumerate(conversations, 1):
+             user_msg = conv.get('user_message', '')
+             bot_msg = conv.get('bot_response', '')
+             conv_text += f"\n{i}. User: {user_msg}\n Bot: {bot_msg}\n"
+
+         prompt = f"""You are a conversation summarizer. Summarize the following conversations for user '{user_id}'.
+
+ CONVERSATIONS:
+ {conv_text}
+
+ TASK:
+ Create a concise summary (max 200 words) that captures:
+ 1. Main topics discussed
+ 2. User's questions and concerns
+ 3. Important context for future conversations"""
+
+         if include_facts:
+             prompt += """
+ 4. Key facts about the user (preferences, background, needs)
+
+ FORMAT YOUR RESPONSE AS:
+ SUMMARY: [Your summary here]
+ KEY_FACTS: [Comma-separated list of facts about the user]
+ """
+         else:
+             prompt += "\n\nProvide only the summary."
+
+         return prompt
+
+     def _parse_summary_response(
+         self,
+         response: str,
+         conversations: List[Dict],
+         user_id: str
+     ) -> Dict[str, Any]:
+         """Parse LLM response into structured summary"""
+
+         summary_text = ""
+         key_facts = []
+
+         # Try to parse structured format
+         if "SUMMARY:" in response and "KEY_FACTS:" in response:
+             parts = response.split("KEY_FACTS:")
+             summary_part = parts[0].replace("SUMMARY:", "").strip()
+             facts_part = parts[1].strip() if len(parts) > 1 else ""
+
+             summary_text = summary_part
+
+             # Parse facts
+             if facts_part:
+                 # Split by common delimiters
+                 facts_raw = facts_part.replace("\n", ",").split(",")
+                 key_facts = [f.strip() for f in facts_raw if f.strip() and len(f.strip()) > 3]
+         else:
+             # Fallback: use entire response as summary
+             summary_text = response.strip()
+
+         return {
+             "summary": summary_text,
+             "key_facts": key_facts,
+             "conversation_count": len(conversations),
+             "user_id": user_id,
+             "generated_at": datetime.now().isoformat()
+         }
+
+     def should_update_summary(
+         self,
+         last_summary_time: Optional[str],
+         new_conversations_count: int,
+         update_threshold: int = 10
+     ) -> bool:
+         """
+         Determine if summary should be updated
+
+         Args:
+             last_summary_time: ISO timestamp of last summary
+             new_conversations_count: Number of new conversations since last summary
+             update_threshold: Minimum conversations before update
+
+         Returns:
+             True if summary should be updated
+         """
+         # Always update if no previous summary
+         if not last_summary_time:
+             return new_conversations_count >= 5  # Need at least 5 convs for meaningful summary
+
+         # Update if threshold reached
+         return new_conversations_count >= update_threshold
+
+     def extract_user_insights(self, summary: str) -> Dict[str, Any]:
+         """
+         Extract structured insights from summary
+
+         Args:
+             summary: Summary text
+
+         Returns:
+             Insights dict with topics, preferences, etc.
+         """
+         insights = {
+             "topics": [],
+             "preferences": [],
+             "needs": [],
+             "background": []
+         }
+
+         # Simple keyword-based extraction
+         # (Could be enhanced with NER or another LLM call)
+
+         summary_lower = summary.lower()
+
+         # Common topic keywords
+         topic_keywords = {
+             "programming": ["python", "javascript", "code", "programming", "development"],
+             "business": ["business", "startup", "company", "market"],
+             "technical": ["technical", "bug", "error", "issue", "problem"],
+             "personal": ["personal", "preference", "like", "prefer"]
+         }
+
+         for topic, keywords in topic_keywords.items():
+             if any(kw in summary_lower for kw in keywords):
+                 insights["topics"].append(topic)
+
+         return insights
+
+     def get_summary_stats(self, original_text: str, summary_text: str) -> Dict[str, Any]:
+         """
+         Calculate compression statistics
+
+         Args:
+             original_text: Original conversation text
+             summary_text: Summarized text
+
+         Returns:
+             Stats dict with compression ratio, token savings, etc.
+         """
+         orig_length = len(original_text)
+         summary_length = len(summary_text)
+
+         # Rough token estimation (1 token ≈ 4 chars)
+         orig_tokens = orig_length // 4
+         summary_tokens = summary_length // 4
+
+         compression_ratio = (1 - summary_length / orig_length) * 100 if orig_length > 0 else 0
+
+         return {
+             "original_length": orig_length,
+             "summary_length": summary_length,
+             "compression_ratio": round(compression_ratio, 2),
+             "original_tokens_est": orig_tokens,
+             "summary_tokens_est": summary_tokens,
+             "tokens_saved": orig_tokens - summary_tokens
+         }
+
+
+ class AutoSummarizer:
+     """Automatically manages conversation summaries with periodic updates"""
+
+     def __init__(
+         self,
+         summarizer: ConversationSummarizer,
+         memory_manager,
+         update_threshold: int = 10,
+         logger: Optional[logging.Logger] = None
+     ):
+         """
+         Initialize auto-summarizer
+
+         Args:
+             summarizer: ConversationSummarizer instance
+             memory_manager: Memory manager (SQL or JSON)
+             update_threshold: Update summary every N conversations
+             logger: Logger instance
+         """
+         self.summarizer = summarizer
+         self.memory = memory_manager
+         self.update_threshold = update_threshold
+         self.logger = logger or logging.getLogger(__name__)
+
+         # Track summaries per user
+         self.summaries = {}  # {user_id: summary_data}
+         self.conversation_counts = {}  # {user_id: count_since_last_summary}
+
+     def check_and_update(self, user_id: str) -> Optional[Dict[str, Any]]:
+         """
+         Check if summary needs updating and update if necessary
+
+         Args:
+             user_id: User identifier
+
+         Returns:
+             New summary if updated, None otherwise
+         """
+         # Get conversation count since last summary
+         count_since_last = self.conversation_counts.get(user_id, 0)
+         last_summary_time = self.summaries.get(user_id, {}).get("generated_at")
+
+         if self.summarizer.should_update_summary(last_summary_time, count_since_last, self.update_threshold):
+             return self.update_summary(user_id)
+
+         return None
+
+     def update_summary(self, user_id: str, max_conversations: int = 20) -> Dict[str, Any]:
+         """
+         Force update summary for user
+
+         Args:
+             user_id: User identifier
+             max_conversations: Max conversations to summarize
+
+         Returns:
+             Summary data
+         """
+         try:
+             # Get recent conversations
+             if hasattr(self.memory, 'get_recent_conversations'):
+                 conversations = self.memory.get_recent_conversations(user_id, max_conversations)
+             else:
+                 conversations = []
+
+             # Generate summary
+             summary = self.summarizer.summarize_conversations(
+                 conversations,
+                 user_id,
+                 max_conversations=max_conversations
+             )
+
+             # Store summary
+             self.summaries[user_id] = summary
+             self.conversation_counts[user_id] = 0
+
+             self.logger.info(f"✅ Auto-summary updated for {user_id}")
+             return summary
+
+         except Exception as e:
+             self.logger.error(f"Auto-summary update failed for {user_id}: {e}")
+             return {}
+
+     def get_summary(self, user_id: str) -> Optional[Dict[str, Any]]:
+         """
+         Get current summary for user
+
+         Args:
+             user_id: User identifier
+
+         Returns:
+             Summary data or None
+         """
+         return self.summaries.get(user_id)
+
+     def increment_conversation_count(self, user_id: str):
+         """Increment conversation count for user"""
+         self.conversation_counts[user_id] = self.conversation_counts.get(user_id, 0) + 1
+
+     def reset_summary(self, user_id: str):
+         """Reset summary for user"""
+         if user_id in self.summaries:
+             del self.summaries[user_id]
+         self.conversation_counts[user_id] = 0
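
A usage sketch for this hunk, using the `from mem_llm import ConversationSummarizer` import shown in its module docstring. `StubLLM` is a hypothetical stand-in: per `__init__` and `summarize_conversations` above, the client only needs a `chat(messages=..., temperature=..., max_tokens=...)` method that returns a string.

```python
from mem_llm import ConversationSummarizer

class StubLLM:
    def chat(self, messages, temperature=0.7, max_tokens=500):
        # Reply in the structured format _parse_summary_response expects
        return ("SUMMARY: Alice asked how to read a Python traceback.\n"
                "KEY_FACTS: prefers Python, works on a web app")

summarizer = ConversationSummarizer(StubLLM())
conversations = [
    {"user_message": "How do I read this Python traceback?",
     "bot_response": "Start from the bottom frame and work upward."},
]

result = summarizer.summarize_conversations(conversations, user_id="alice")
print(result["summary"])    # parsed from the SUMMARY: section
print(result["key_facts"])  # parsed from the KEY_FACTS: section

# Rough token-savings estimate (1 token ≈ 4 chars, per get_summary_stats)
original = " ".join(c["user_message"] + c["bot_response"] for c in conversations)
print(summarizer.get_summary_stats(original, result["summary"]))
```

`AutoSummarizer` wraps the same flow: call `increment_conversation_count(user_id)` after each exchange, and `check_and_update(user_id)` regenerates the summary once `update_threshold` new conversations have accumulated (or after the first 5 when no summary exists yet).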