lollms-client 1.3.0__py3-none-any.whl → 1.3.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of lollms-client might be problematic.

lollms_client/__init__.py CHANGED
@@ -8,7 +8,7 @@ from lollms_client.lollms_utilities import PromptReshaper # Keep general utiliti
 from lollms_client.lollms_mcp_binding import LollmsMCPBinding, LollmsMCPBindingManager
 from lollms_client.lollms_llm_binding import LollmsLLMBindingManager
 
-__version__ = "1.3.0" # Updated version
+__version__ = "1.3.2" # Updated version
 
 # Optionally, you could define __all__ if you want to be explicit about exports
 __all__ = [
@@ -1,4 +1,4 @@
-# bindings/ollama/binding.py
+# bindings/ollama/__init__.py
 import requests
 import json
 from lollms_client.lollms_llm_binding import LollmsLLMBinding
@@ -13,7 +13,7 @@ from ascii_colors import ASCIIColors, trace_exception
 import pipmaster as pm
 from lollms_client.lollms_utilities import ImageTokenizer
 pm.ensure_packages(["ollama","pillow","tiktoken"])
-
+import re
 
 import ollama
 import tiktoken
@@ -256,22 +256,22 @@ class OllamaBinding(LollmsLLMBinding):
             return {"status": False, "error": error_message}
 
     def generate_from_messages(self,
-                     messages: List[Dict],
-                     n_predict: Optional[int] = None,
-                     stream: Optional[bool] = None,
-                     temperature: Optional[float] = None,
-                     top_k: Optional[int] = None,
-                     top_p: Optional[float] = None,
-                     repeat_penalty: Optional[float] = None,
-                     repeat_last_n: Optional[int] = None,
-                     seed: Optional[int] = None,
-                     n_threads: Optional[int] = None,
-                     ctx_size: int | None = None,
-                     streaming_callback: Optional[Callable[[str, MSG_TYPE], None]] = None,
-                     **kwargs
-                     ) -> Union[str, dict]:
+                               messages: List[Dict],
+                               n_predict: Optional[int] = None,
+                               stream: Optional[bool] = None,
+                               temperature: Optional[float] = None,
+                               top_k: Optional[int] = None,
+                               top_p: Optional[float] = None,
+                               repeat_penalty: Optional[float] = None,
+                               repeat_last_n: Optional[int] = None,
+                               seed: Optional[int] = None,
+                               n_threads: Optional[int] = None,
+                               ctx_size: int | None = None,
+                               streaming_callback: Optional[Callable[[str, MSG_TYPE], None]] = None,
+                               **kwargs
+                               ) -> Union[str, dict]:
         if not self.ollama_client:
-            return {"status": False, "error": "Ollama client not initialized."}
+            return {"status": False, "error": "Ollama client not initialized."}
 
         options = {}
         if n_predict is not None: options['num_predict'] = n_predict
@@ -283,34 +283,91 @@ class OllamaBinding(LollmsLLMBinding):
         if seed is not None: options['seed'] = seed
         if n_threads is not None: options['num_thread'] = n_threads
         if ctx_size is not None: options['num_ctx'] = ctx_size
-
+
+        def normalize_message(msg: Dict) -> Dict:
+            role = msg.get("role", "user")
+            content = msg.get("content", "")
+            text_parts = []
+            images = []
+
+            if isinstance(content, str):
+                text_parts.append(content)
+            elif isinstance(content, list):
+                for item in content:
+                    if item.get("type") == "text":
+                        text_parts.append(item.get("text", ""))
+                    elif item.get("type") == "image_url":
+                        base64_data = item.get("image_url", {}).get("base64")
+                        url = item.get("image_url", {}).get("url")
+                        if base64_data:
+                            # ⚠️ remove prefix "data:image/...;base64,"
+                            cleaned = re.sub(r"^data:image/[^;]+;base64,", "", base64_data)
+                            images.append(cleaned)
+                        elif url:
+                            images.append(url)
+
+            return {
+                "role": role,
+                "content": "\n".join([p for p in text_parts if p.strip()]),
+                "images": images if images else None
+            }
+
+        ollama_messages = []
+        for m in messages:
+            nm = normalize_message(m)
+            if nm["images"]:
+                ollama_messages.append({
+                    "role": nm["role"],
+                    "content": nm["content"],
+                    "images": nm["images"]
+                })
+            else:
+                ollama_messages.append({
+                    "role": nm["role"],
+                    "content": nm["content"]
+                })
+
         full_response_text = ""
 
         try:
             if stream:
                 response_stream = self.ollama_client.chat(
                     model=self.model_name,
-                    messages=messages,
+                    messages=ollama_messages,
                     stream=True,
                     options=options if options else None
                 )
                 for chunk_dict in response_stream:
                     chunk_content = chunk_dict.get('message', {}).get('content', '')
-                    if chunk_content: # Ensure there is content to process
+                    if chunk_content:
                         full_response_text += chunk_content
                         if streaming_callback:
                             if not streaming_callback(chunk_content, MSG_TYPE.MSG_TYPE_CHUNK):
-                                break # Callback requested stop
+                                break
                 return full_response_text
-            else: # Not streaming
+            else:
                 response_dict = self.ollama_client.chat(
                     model=self.model_name,
-                    messages=messages,
+                    messages=ollama_messages,
                     stream=False,
                     options=options if options else None
                 )
                 return response_dict.get('message', {}).get('content', '')
 
+        except ollama.ResponseError as e:
+            error_message = f"Ollama API ResponseError: {e.error or 'Unknown error'} (status code: {e.status_code})"
+            ASCIIColors.error(error_message)
+            return {"status": False, "error": error_message, "status_code": e.status_code}
+        except ollama.RequestError as e:
+            error_message = f"Ollama API RequestError: {str(e)}"
+            ASCIIColors.error(error_message)
+            return {"status": False, "error": error_message}
+        except Exception as ex:
+            error_message = f"An unexpected error occurred: {str(ex)}"
+            trace_exception(ex)
+            return {"status": False, "error": error_message}
+
+
         except ollama.ResponseError as e:
             error_message = f"Ollama API ResponseError: {e.error or 'Unknown error'} (status code: {e.status_code})"
             ASCIIColors.error(error_message)
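
In practice, the new normalize_message helper is what lets generate_from_messages accept OpenAI-style multimodal messages: a content list of text and image_url parts is flattened into Ollama's chat format, which expects a plain string plus an optional images list of raw base64 payloads or URLs. A standalone sketch of that conversion (the sample message and base64 payload are invented for illustration; the regular expression is the one used in the hunk above):

import re

# Hypothetical OpenAI-style multimodal message.
msg = {
    "role": "user",
    "content": [
        {"type": "text", "text": "What is in this picture?"},
        {"type": "image_url",
         "image_url": {"base64": "data:image/png;base64,iVBORw0KGgo..."}},
    ],
}

text_parts, images = [], []
for item in msg["content"]:
    if item.get("type") == "text":
        text_parts.append(item.get("text", ""))
    elif item.get("type") == "image_url":
        b64 = item.get("image_url", {}).get("base64")
        if b64:
            # Ollama expects raw base64, so the data: URI prefix is
            # stripped, exactly as the flagged re.sub in the hunk does.
            images.append(re.sub(r"^data:image/[^;]+;base64,", "", b64))

ollama_message = {"role": msg["role"],
                  "content": "\n".join(text_parts),
                  "images": images}
print(ollama_message)
# {'role': 'user', 'content': 'What is in this picture?',
#  'images': ['iVBORw0KGgo...']}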
@@ -0,0 +1,361 @@
+import json
+import re
+import uuid
+import base64
+import time
+import asyncio
+from typing import Dict, List, Any, Optional, Union, Callable, Tuple
+from dataclasses import dataclass, field
+from enum import Enum
+import threading
+from concurrent.futures import ThreadPoolExecutor, as_completed
+import hashlib
+
+class TaskStatus(Enum):
+    PENDING = "pending"
+    RUNNING = "running"
+    COMPLETED = "completed"
+    FAILED = "failed"
+    SKIPPED = "skipped"
+
+class ConfidenceLevel(Enum):
+    LOW = "low"
+    MEDIUM = "medium"
+    HIGH = "high"
+    VERY_HIGH = "very_high"
+
+@dataclass
+class SubTask:
+    id: str
+    description: str
+    dependencies: List[str] = field(default_factory=list)
+    status: TaskStatus = TaskStatus.PENDING
+    result: Optional[Dict] = None
+    confidence: float = 0.0
+    tools_required: List[str] = field(default_factory=list)
+    estimated_complexity: int = 1  # 1-5 scale
+
+@dataclass
+class ExecutionPlan:
+    tasks: List[SubTask]
+    total_estimated_steps: int
+    execution_order: List[str]
+    fallback_strategies: Dict[str, List[str]] = field(default_factory=dict)
+
+@dataclass
+class MemoryEntry:
+    timestamp: float
+    context: str
+    action: str
+    result: Dict
+    confidence: float
+    success: bool
+    user_feedback: Optional[str] = None
+
+@dataclass
+class ToolPerformance:
+    success_rate: float = 0.0
+    avg_confidence: float = 0.0
+    total_calls: int = 0
+    avg_response_time: float = 0.0
+    last_used: float = 0.0
+    failure_patterns: List[str] = field(default_factory=list)
+
+class TaskPlanner:
+    def __init__(self, llm_client):
+        self.llm_client = llm_client
+
+    def decompose_task(self, user_request: str, context: str = "") -> ExecutionPlan:
+        """Break down complex requests into manageable subtasks"""
+        decomposition_prompt = f"""
+        Analyze this user request and break it down into specific, actionable subtasks:
+
+        USER REQUEST: "{user_request}"
+        CONTEXT: {context}
+
+        Create a JSON plan with subtasks that are:
+        1. Specific and actionable
+        2. Have clear success criteria
+        3. Include estimated complexity (1-5 scale)
+        4. List required tool types
+
+        Output format:
+        {{
+            "tasks": [
+                {{
+                    "id": "task_1",
+                    "description": "specific action to take",
+                    "dependencies": ["task_id"],
+                    "estimated_complexity": 2,
+                    "tools_required": ["tool_type"]
+                }}
+            ],
+            "execution_strategy": "sequential|parallel|hybrid"
+        }}
+        """
+
+        try:
+            plan_data = self.llm_client.generate_structured_content(
+                prompt=decomposition_prompt,
+                schema={"tasks": "array", "execution_strategy": "string"},
+                temperature=0.3
+            )
+
+            tasks = []
+            for task_data in plan_data.get("tasks", []):
+                task = SubTask(
+                    id=task_data.get("id", str(uuid.uuid4())),
+                    description=task_data.get("description", ""),
+                    dependencies=task_data.get("dependencies", []),
+                    estimated_complexity=task_data.get("estimated_complexity", 1),
+                    tools_required=task_data.get("tools_required", [])
+                )
+                tasks.append(task)
+
+            execution_order = self._calculate_execution_order(tasks)
+            total_steps = sum(task.estimated_complexity for task in tasks)
+
+            return ExecutionPlan(
+                tasks=tasks,
+                total_estimated_steps=total_steps,
+                execution_order=execution_order
+            )
+
+        except Exception as e:
+            # Fallback: create single task
+            single_task = SubTask(
+                id="fallback_task",
+                description=user_request,
+                estimated_complexity=3
+            )
+            return ExecutionPlan(
+                tasks=[single_task],
+                total_estimated_steps=3,
+                execution_order=["fallback_task"]
+            )
+
+    def _calculate_execution_order(self, tasks: List[SubTask]) -> List[str]:
+        """Calculate optimal execution order based on dependencies"""
+        task_map = {task.id: task for task in tasks}
+        executed = set()
+        order = []
+
+        def can_execute(task_id: str) -> bool:
+            task = task_map[task_id]
+            return all(dep in executed for dep in task.dependencies)
+
+        while len(order) < len(tasks):
+            ready_tasks = [tid for tid in task_map.keys()
+                           if tid not in executed and can_execute(tid)]
+
+            if not ready_tasks:
+                # Handle circular dependencies - execute remaining tasks
+                remaining = [tid for tid in task_map.keys() if tid not in executed]
+                ready_tasks = remaining[:1] if remaining else []
+
+            # Sort by complexity (simpler tasks first)
+            ready_tasks.sort(key=lambda tid: task_map[tid].estimated_complexity)
+
+            for task_id in ready_tasks:
+                order.append(task_id)
+                executed.add(task_id)
+
+        return order
+
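The planner's _calculate_execution_order is a dependency-aware scheduler: on each pass it collects the tasks whose dependencies have all completed, runs that batch simplest-first by estimated_complexity, and, if a dependency cycle leaves nothing ready, forces one remaining task through to avoid an infinite loop. A minimal sketch of the resulting order, assuming the SubTask and TaskPlanner definitions above are in scope (llm_client is only used by decompose_task, so None suffices here; the task graph is invented):

# Hypothetical task graph: task_c depends on the other two.
tasks = [
    SubTask(id="task_a", description="gather sources", estimated_complexity=2),
    SubTask(id="task_b", description="check the cache", estimated_complexity=1),
    SubTask(id="task_c", description="write the summary",
            dependencies=["task_a", "task_b"], estimated_complexity=3),
]

planner = TaskPlanner(llm_client=None)
print(planner._calculate_execution_order(tasks))
# ['task_b', 'task_a', 'task_c'] - the first batch runs simplest-first,
# and task_c only becomes ready once both dependencies are executed.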
+class MemoryManager:
+    def __init__(self, max_entries: int = 1000):
+        self.memory: List[MemoryEntry] = []
+        self.max_entries = max_entries
+        self.cache: Dict[str, Any] = {}
+        self.cache_ttl: Dict[str, float] = {}
+
+    def add_memory(self, context: str, action: str, result: Dict,
+                   confidence: float, success: bool, user_feedback: str = None):
+        """Add a new memory entry"""
+        entry = MemoryEntry(
+            timestamp=time.time(),
+            context=context,
+            action=action,
+            result=result,
+            confidence=confidence,
+            success=success,
+            user_feedback=user_feedback
+        )
+
+        self.memory.append(entry)
+
+        # Prune old memories
+        if len(self.memory) > self.max_entries:
+            self.memory = self.memory[-self.max_entries:]
+
+    def get_relevant_patterns(self, current_context: str, limit: int = 5) -> List[MemoryEntry]:
+        """Retrieve relevant past experiences"""
+        # Simple similarity scoring based on context overlap
+        scored_memories = []
+        current_words = set(current_context.lower().split())
+
+        for memory in self.memory:
+            memory_words = set(memory.context.lower().split())
+            overlap = len(current_words & memory_words)
+            if overlap > 0:
+                score = overlap / max(len(current_words), len(memory_words))
+                scored_memories.append((score, memory))
+
+        scored_memories.sort(key=lambda x: x[0], reverse=True)
+        return [memory for _, memory in scored_memories[:limit]]
+
+    def compress_scratchpad(self, scratchpad: str, current_goal: str,
+                            max_length: int = 8000) -> str:
+        """Intelligently compress scratchpad while preserving key insights"""
+        if len(scratchpad) <= max_length:
+            return scratchpad
+
+        # Extract key sections
+        sections = re.split(r'\n### ', scratchpad)
+
+        # Prioritize recent steps and successful outcomes
+        important_sections = []
+        for section in sections[-10:]:  # Keep last 10 sections
+            if any(keyword in section.lower() for keyword in
+                   ['success', 'completed', 'found', 'generated', current_goal.lower()]):
+                important_sections.append(section)
+
+        # If still too long, summarize older sections
+        if len('\n### '.join(important_sections)) > max_length:
+            summary = f"### Previous Steps Summary\n- Completed {len(sections)-len(important_sections)} earlier steps\n- Working toward: {current_goal}\n"
+            return summary + '\n### '.join(important_sections[-5:])
+
+        return '\n### '.join(important_sections)
+
+    def cache_result(self, key: str, value: Any, ttl: int = 300):
+        """Cache expensive operation results"""
+        self.cache[key] = value
+        self.cache_ttl[key] = time.time() + ttl
+
+    def get_cached_result(self, key: str) -> Optional[Any]:
+        """Retrieve cached result if still valid"""
+        if key in self.cache:
+            if time.time() < self.cache_ttl.get(key, 0):
+                return self.cache[key]
+            else:
+                # Expired - remove
+                del self.cache[key]
+                if key in self.cache_ttl:
+                    del self.cache_ttl[key]
+        return None
+
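MemoryManager combines three small mechanisms: a bounded episodic log, a similarity lookup that scores each stored context by word overlap normalized by the larger word set, and a TTL cache built on time.time(). A short usage sketch, assuming the class above is in scope (the contexts and results are invented for illustration):

mm = MemoryManager(max_entries=100)
mm.add_memory(context="search the web for python tutorials",
              action="web_search", result={"hits": 12},
              confidence=0.8, success=True)
mm.add_memory(context="resize an image to 64x64",
              action="image_tool", result={}, confidence=0.4, success=False)

# Word-overlap scoring surfaces the web-search episode for a similar request.
best = mm.get_relevant_patterns("search for rust tutorials", limit=1)
print(best[0].action)  # web_search

# TTL cache: the value is served until the default 300 s expire.
mm.cache_result("query:rust", {"hits": 7})
print(mm.get_cached_result("query:rust"))  # {'hits': 7}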
+class ToolPerformanceTracker:
+    def __init__(self):
+        self.tool_stats: Dict[str, ToolPerformance] = {}
+        self.lock = threading.Lock()
+
+    def record_tool_usage(self, tool_name: str, success: bool,
+                          confidence: float, response_time: float,
+                          error_msg: str = None):
+        """Record tool usage statistics"""
+        with self.lock:
+            if tool_name not in self.tool_stats:
+                self.tool_stats[tool_name] = ToolPerformance()
+
+            stats = self.tool_stats[tool_name]
+            stats.total_calls += 1
+            stats.last_used = time.time()
+
+            # Update success rate
+            old_successes = stats.success_rate * (stats.total_calls - 1)
+            new_successes = old_successes + (1 if success else 0)
+            stats.success_rate = new_successes / stats.total_calls
+
+            # Update average confidence
+            old_conf_total = stats.avg_confidence * (stats.total_calls - 1)
+            stats.avg_confidence = (old_conf_total + confidence) / stats.total_calls
+
+            # Update response time
+            old_time_total = stats.avg_response_time * (stats.total_calls - 1)
+            stats.avg_response_time = (old_time_total + response_time) / stats.total_calls
+
+            # Record failure patterns
+            if not success and error_msg:
+                stats.failure_patterns.append(error_msg[:100])
+                # Keep only last 10 failure patterns
+                stats.failure_patterns = stats.failure_patterns[-10:]
+
+    def get_tool_reliability_score(self, tool_name: str) -> float:
+        """Calculate overall tool reliability score (0-1)"""
+        if tool_name not in self.tool_stats:
+            return 0.5  # Neutral for unknown tools
+
+        stats = self.tool_stats[tool_name]
+
+        # Weighted combination of success rate and confidence
+        reliability = (stats.success_rate * 0.7) + (stats.avg_confidence * 0.3)
+
+        # Penalty for tools not used recently (older than 1 hour)
+        if time.time() - stats.last_used > 3600:
+            reliability *= 0.8
+
+        return reliability
+
+    def rank_tools_for_task(self, available_tools: List[str],
+                            task_description: str) -> List[Tuple[str, float]]:
+        """Rank tools by suitability for a specific task"""
+        tool_scores = []
+
+        for tool_name in available_tools:
+            base_score = self.get_tool_reliability_score(tool_name)
+
+            # Simple keyword matching bonus
+            task_lower = task_description.lower()
+            if any(keyword in tool_name.lower() for keyword in
+                   ['search', 'research'] if 'find' in task_lower or 'search' in task_lower):
+                base_score *= 1.2
+            elif 'generate' in tool_name.lower() and 'create' in task_lower:
+                base_score *= 1.2
+
+            tool_scores.append((tool_name, min(base_score, 1.0)))
+
+        tool_scores.sort(key=lambda x: x[1], reverse=True)
+        return tool_scores
+
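record_tool_usage maintains running averages without storing per-call history: each update rescales the previous mean by total_calls - 1, adds the new observation, and divides by the new count. get_tool_reliability_score then blends success rate (weight 0.7) with average confidence (weight 0.3) and multiplies by 0.8 for tools idle over an hour. A worked sketch, assuming ToolPerformanceTracker is in scope (tool name and values are illustrative):

tracker = ToolPerformanceTracker()

# Two calls: one success at 0.9 confidence, one failure at 0.3.
tracker.record_tool_usage("web_search", success=True,
                          confidence=0.9, response_time=1.2)
tracker.record_tool_usage("web_search", success=False,
                          confidence=0.3, response_time=0.8,
                          error_msg="timeout contacting search API")

stats = tracker.tool_stats["web_search"]
print(stats.success_rate)    # 0.5  (1 success out of 2 calls)
print(stats.avg_confidence)  # ~0.6 ((0.9 + 0.3) / 2, up to float rounding)

# Blend: 0.7 * 0.5 + 0.3 * 0.6 = 0.53; no idle penalty, it was just used.
print(tracker.get_tool_reliability_score("web_search"))  # ~0.53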
+class UncertaintyManager:
+    @staticmethod
+    def calculate_confidence(reasoning_step: str, tool_results: List[Dict],
+                             memory_patterns: List[MemoryEntry]) -> Tuple[float, ConfidenceLevel]:
+        """Calculate confidence in current reasoning step"""
+        base_confidence = 0.5
+
+        # Boost confidence if similar patterns succeeded before
+        if memory_patterns:
+            successful_patterns = [m for m in memory_patterns if m.success]
+            if successful_patterns:
+                avg_success_confidence = sum(m.confidence for m in successful_patterns) / len(successful_patterns)
+                base_confidence = (base_confidence + avg_success_confidence) / 2
+
+        # Adjust based on tool result consistency
+        if tool_results:
+            success_results = [r for r in tool_results if r.get('status') == 'success']
+            if success_results:
+                base_confidence += 0.2
+
+            # Check for consistent information across tools
+            if len(tool_results) > 1:
+                base_confidence += 0.1
+
+        # Reasoning quality indicators
+        if len(reasoning_step) > 50 and any(word in reasoning_step.lower()
+                                            for word in ['because', 'therefore', 'analysis', 'evidence']):
+            base_confidence += 0.1
+
+        confidence = max(0.0, min(1.0, base_confidence))
+
+        # Map to confidence levels
+        if confidence >= 0.8:
+            level = ConfidenceLevel.VERY_HIGH
+        elif confidence >= 0.6:
+            level = ConfidenceLevel.HIGH
+        elif confidence >= 0.4:
+            level = ConfidenceLevel.MEDIUM
+        else:
+            level = ConfidenceLevel.LOW
+
+        return confidence, level
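
calculate_confidence starts from a 0.5 baseline and accumulates evidence: successful memory patterns average their confidence in, any successful tool result adds 0.2, more than one tool result adds 0.1, and a reasoning step longer than 50 characters containing a causal marker ('because', 'therefore', 'analysis', 'evidence') adds 0.1, before clamping to [0, 1] and bucketing into a ConfidenceLevel. A usage sketch, assuming the definitions above are in scope (the inputs are illustrative):

step = ("The search results agree, therefore the 1.3.2 release only "
        "touches the ollama binding and adds a planner module.")

confidence, level = UncertaintyManager.calculate_confidence(
    reasoning_step=step,
    tool_results=[{"status": "success"}, {"status": "success"}],
    memory_patterns=[],  # no prior experience to draw on
)
# 0.5 base + 0.2 (a successful result) + 0.1 (more than one result)
# + 0.1 (>50 chars and contains 'therefore') = ~0.9 -> VERY_HIGH
print(confidence, level)  # ~0.9 ConfidenceLevel.VERY_HIGH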