loom-agent 0.0.3__py3-none-any.whl → 0.0.5__py3-none-any.whl
This diff shows the contents of publicly released package versions as they appear in their respective public registries; it is provided for informational purposes only.
Potentially problematic release.
This version of loom-agent might be problematic.
- loom/__init__.py +51 -0
- loom/api/__init__.py +19 -0
- loom/api/v0_0_3.py +300 -0
- loom/builtin/retriever/faiss_store.py +403 -0
- loom/core/agent_executor.py +212 -26
- loom/core/events.py +3 -0
- loom/core/recursion_control.py +298 -0
- loom/core/turn_state.py +58 -6
- loom/retrieval/__init__.py +61 -0
- loom/retrieval/domain_adapter.py +195 -0
- loom/retrieval/embedding_retriever.py +393 -0
- loom_agent-0.0.5.dist-info/METADATA +561 -0
- {loom_agent-0.0.3.dist-info → loom_agent-0.0.5.dist-info}/RECORD +15 -8
- loom_agent-0.0.3.dist-info/METADATA +0 -292
- {loom_agent-0.0.3.dist-info → loom_agent-0.0.5.dist-info}/WHEEL +0 -0
- {loom_agent-0.0.3.dist-info → loom_agent-0.0.5.dist-info}/licenses/LICENSE +0 -0
loom/builtin/retriever/faiss_store.py
ADDED
@@ -0,0 +1,403 @@
+"""
+FAISS Vector Store
+
+Lightweight, in-memory vector storage using FAISS.
+Ideal for development and small to medium scale deployments.
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any, Dict, List, Optional, Tuple
+
+from loom.interfaces.vector_store import BaseVectorStore
+from loom.interfaces.retriever import Document
+
+logger = logging.getLogger(__name__)
+
+
+class FAISSVectorStore(BaseVectorStore):
+    """
+    FAISS-based vector storage
+
+    Lightweight, in-memory vector database using Facebook's FAISS library.
+    Ideal for:
+    - Development and testing
+    - Small to medium scale deployments (< 1M documents)
+    - Applications without persistence requirements
+
+    Features:
+    - Fast similarity search
+    - Multiple index types (Flat, IVF, HNSW)
+    - In-memory storage
+    - Optional persistence
+
+    Example:
+        # Basic usage
+        store = FAISSVectorStore(dimension=1536)
+        await store.initialize()
+
+        # Add documents
+        await store.add_documents(
+            documents=[doc1, doc2],
+            embeddings=[[0.1, ...], [0.2, ...]]
+        )
+
+        # Search
+        results = await store.search(
+            query_embedding=[0.15, ...],
+            top_k=5
+        )
+
+        # Advanced: Use IVF index for larger datasets
+        store = FAISSVectorStore(
+            dimension=1536,
+            index_type="IVF",
+            nlist=100  # Number of clusters
+        )
+    """
+
+    def __init__(
+        self,
+        dimension: int,
+        index_type: str = "Flat",
+        metric: str = "L2",
+        nlist: int = 100,
+        nprobe: int = 10
+    ):
+        """
+        Args:
+            dimension: Embedding dimension
+            index_type: Index type ("Flat", "IVF", "HNSW")
+            metric: Distance metric ("L2" or "IP" for inner product)
+            nlist: Number of clusters for IVF index
+            nprobe: Number of clusters to search in IVF
+        """
+        self.dimension = dimension
+        self.index_type = index_type
+        self.metric = metric
+        self.nlist = nlist
+        self.nprobe = nprobe
+
+        # FAISS index
+        self.index = None
+
+        # Document storage
+        self.documents: Dict[str, Document] = {}
+        self.id_to_index: Dict[str, int] = {}
+        self.index_to_id: Dict[int, str] = {}
+
+        self._initialized = False
+
+    async def initialize(self) -> None:
+        """Initialize FAISS index"""
+        if self._initialized:
+            return
+
+        try:
+            import faiss
+        except ImportError:
+            raise ImportError(
+                "FAISS is required for FAISSVectorStore. "
+                "Install it with: pip install faiss-cpu or pip install faiss-gpu"
+            )
+
+        # Create index based on type
+        if self.index_type == "Flat":
+            if self.metric == "L2":
+                self.index = faiss.IndexFlatL2(self.dimension)
+            else:  # IP (Inner Product)
+                self.index = faiss.IndexFlatIP(self.dimension)
+
+        elif self.index_type == "IVF":
+            if self.metric == "L2":
+                quantizer = faiss.IndexFlatL2(self.dimension)
+                self.index = faiss.IndexIVFFlat(
+                    quantizer,
+                    self.dimension,
+                    self.nlist
+                )
+            else:
+                quantizer = faiss.IndexFlatIP(self.dimension)
+                self.index = faiss.IndexIVFFlat(
+                    quantizer,
+                    self.dimension,
+                    self.nlist
+                )
+            # IVF needs training (will be done when first batch is added)
+            self.index.nprobe = self.nprobe
+
+        elif self.index_type == "HNSW":
+            self.index = faiss.IndexHNSWFlat(self.dimension, 32)
+
+        else:
+            raise ValueError(f"Unknown index type: {self.index_type}")
+
+        self._initialized = True
+        logger.info(f"FAISS index initialized: type={self.index_type}, dimension={self.dimension}")
+
+    async def add_documents(
+        self,
+        documents: List[Document],
+        embeddings: List[List[float]]
+    ) -> None:
+        """
+        Add documents with their embeddings
+
+        Args:
+            documents: List of documents
+            embeddings: List of embedding vectors
+        """
+        if not self._initialized:
+            await self.initialize()
+
+        if len(documents) != len(embeddings):
+            raise ValueError("Number of documents must match number of embeddings")
+
+        import numpy as np
+
+        # Convert embeddings to numpy array
+        embeddings_array = np.array(embeddings, dtype=np.float32)
+
+        # Train IVF index if needed
+        if self.index_type == "IVF" and not self.index.is_trained:
+            logger.info(f"Training IVF index with {len(embeddings)} vectors")
+            self.index.train(embeddings_array)
+
+        # Get current index size
+        start_index = len(self.id_to_index)
+
+        # Add to FAISS
+        self.index.add(embeddings_array)
+
+        # Store documents and mappings
+        for i, doc in enumerate(documents):
+            index = start_index + i
+            self.documents[doc.doc_id] = doc
+            self.id_to_index[doc.doc_id] = index
+            self.index_to_id[index] = doc.doc_id
+
+        logger.debug(f"Added {len(documents)} documents. Total: {len(self.documents)}")
+
+    async def search(
+        self,
+        query_embedding: List[float],
+        top_k: int = 5,
+        filters: Optional[Dict[str, Any]] = None
+    ) -> List[Document]:
+        """
+        Search for similar documents
+
+        Args:
+            query_embedding: Query embedding vector
+            top_k: Number of results to return
+            filters: Metadata filters (applied post-search)
+
+        Returns:
+            List of documents with similarity scores
+        """
+        if not self._initialized:
+            await self.initialize()
+
+        if self.index.ntotal == 0:
+            logger.warning("No documents in index")
+            return []
+
+        import numpy as np
+
+        # Convert query to numpy array
+        query_array = np.array([query_embedding], dtype=np.float32)
+
+        # Search
+        # Get more results if we need to filter
+        search_k = top_k * 3 if filters else top_k
+        distances, indices = self.index.search(query_array, search_k)
+
+        # Convert results to documents
+        results = []
+        for i, idx in enumerate(indices[0]):
+            if idx == -1:  # FAISS returns -1 for missing results
+                break
+
+            # Get document
+            doc_id = self.index_to_id[idx]
+            doc = self.documents[doc_id]
+
+            # Apply filters
+            if filters and not self._match_filters(doc, filters):
+                continue
+
+            # Calculate similarity score
+            distance = distances[0][i]
+            score = self._distance_to_score(distance)
+
+            # Create result document with score
+            result_doc = Document(
+                doc_id=doc.doc_id,
+                content=doc.content,
+                score=score,
+                metadata=doc.metadata
+            )
+
+            results.append(result_doc)
+
+            if len(results) >= top_k:
+                break
+
+        return results
+
+    async def get_document(self, doc_id: str) -> Optional[Document]:
+        """
+        Get document by ID
+
+        Args:
+            doc_id: Document identifier
+
+        Returns:
+            Document if found, None otherwise
+        """
+        return self.documents.get(doc_id)
+
+    async def delete(self, doc_ids: List[str]) -> None:
+        """
+        Delete documents
+
+        Note: FAISS doesn't support efficient deletion.
+        This implementation removes from metadata but not from index.
+        For true deletion, rebuild the index.
+
+        Args:
+            doc_ids: List of document IDs to delete
+        """
+        for doc_id in doc_ids:
+            if doc_id in self.documents:
+                del self.documents[doc_id]
+            if doc_id in self.id_to_index:
+                index = self.id_to_index[doc_id]
+                del self.id_to_index[doc_id]
+                del self.index_to_id[index]
+
+        logger.warning(
+            f"Deleted {len(doc_ids)} documents from metadata. "
+            "Note: FAISS index still contains vectors. Rebuild index for full deletion."
+        )
+
+    def _match_filters(self, doc: Document, filters: Dict[str, Any]) -> bool:
+        """Check if document matches metadata filters"""
+        if not doc.metadata:
+            return False
+
+        for key, value in filters.items():
+            if doc.metadata.get(key) != value:
+                return False
+
+        return True
+
+    def _distance_to_score(self, distance: float) -> float:
+        """
+        Convert distance to similarity score
+
+        Args:
+            distance: Distance from FAISS (L2 or IP)
+
+        Returns:
+            Similarity score (0-1, higher is better)
+        """
+        if self.metric == "L2":
+            # L2 distance: lower is better
+            # Convert to similarity: 1 / (1 + distance)
+            return 1.0 / (1.0 + distance)
+        else:
+            # Inner product: higher is better
+            # Assuming normalized vectors, IP is in [-1, 1]
+            # Convert to [0, 1]
+            return (distance + 1.0) / 2.0
+
+    async def persist(self, path: str) -> None:
+        """
+        Save index to disk
+
+        Args:
+            path: File path to save index
+        """
+        if not self._initialized:
+            raise RuntimeError("Index not initialized")
+
+        import faiss
+        import pickle
+
+        # Save FAISS index
+        faiss.write_index(self.index, f"{path}.index")
+
+        # Save metadata
+        metadata = {
+            "documents": self.documents,
+            "id_to_index": self.id_to_index,
+            "index_to_id": self.index_to_id,
+            "dimension": self.dimension,
+            "index_type": self.index_type,
+            "metric": self.metric,
+            "nlist": self.nlist,
+            "nprobe": self.nprobe
+        }
+
+        with open(f"{path}.metadata", "wb") as f:
+            pickle.dump(metadata, f)
+
+        logger.info(f"Index persisted to {path}")
+
+    @classmethod
+    async def load(cls, path: str) -> "FAISSVectorStore":
+        """
+        Load index from disk
+
+        Args:
+            path: File path to load index from
+
+        Returns:
+            FAISSVectorStore instance
+        """
+        import faiss
+        import pickle
+
+        # Load metadata
+        with open(f"{path}.metadata", "rb") as f:
+            metadata = pickle.load(f)
+
+        # Create instance
+        instance = cls(
+            dimension=metadata["dimension"],
+            index_type=metadata["index_type"],
+            metric=metadata["metric"],
+            nlist=metadata["nlist"],
+            nprobe=metadata["nprobe"]
+        )
+
+        # Load FAISS index
+        instance.index = faiss.read_index(f"{path}.index")
+        instance._initialized = True
+
+        # Load metadata
+        instance.documents = metadata["documents"]
+        instance.id_to_index = metadata["id_to_index"]
+        instance.index_to_id = metadata["index_to_id"]
+
+        logger.info(f"Index loaded from {path}")
+
+        return instance
+
+    def get_stats(self) -> Dict[str, Any]:
+        """
+        Get statistics
+
+        Returns:
+            Statistics dictionary
+        """
+        return {
+            "initialized": self._initialized,
+            "total_documents": len(self.documents),
+            "index_size": self.index.ntotal if self.index else 0,
+            "dimension": self.dimension,
+            "index_type": self.index_type,
+            "metric": self.metric
+        }
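For quick review, a minimal end-to-end sketch of how the new store is meant to be used, based on its own docstrings. It assumes the Document model accepts doc_id, content, and metadata keyword arguments (score appears optional at construction, as in the search path above) and uses toy 4-dimensional embeddings; a real deployment would pass its embedding model's dimension (e.g. 1536).

import asyncio

from loom.builtin.retriever.faiss_store import FAISSVectorStore
from loom.interfaces.retriever import Document

async def main() -> None:
    store = FAISSVectorStore(dimension=4, metric="L2")
    await store.initialize()

    docs = [
        Document(doc_id="a", content="alpha", metadata={"lang": "en"}),
        Document(doc_id="b", content="beta", metadata={"lang": "de"}),
    ]
    await store.add_documents(
        documents=docs,
        embeddings=[[0.1, 0.2, 0.3, 0.4], [0.9, 0.8, 0.7, 0.6]],
    )

    # Metadata filters are applied after the FAISS search; with the L2 metric
    # a distance of 0.0 maps to score 1.0 and a distance of 1.0 maps to 0.5.
    hits = await store.search([0.1, 0.2, 0.3, 0.4], top_k=1, filters={"lang": "en"})
    print(hits[0].doc_id, hits[0].score)
    print(store.get_stats())

asyncio.run(main())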
loom/core/agent_executor.py
CHANGED
@@ -20,6 +20,7 @@ from loom.core.context_assembly import ComponentPriority, ContextAssembler
 from loom.core.events import AgentEvent, AgentEventType, ToolResult
 from loom.core.execution_context import ExecutionContext
 from loom.core.permissions import PermissionManager
+from loom.core.recursion_control import RecursionMonitor, RecursionState
 from loom.core.steering_control import SteeringControl
 from loom.core.tool_orchestrator import ToolOrchestrator
 from loom.core.tool_pipeline import ToolExecutionPipeline
@@ -127,6 +128,9 @@ class AgentExecutor:
         task_handlers: Optional[List[TaskHandler]] = None,
         unified_context: Optional["UnifiedExecutionContext"] = None,
         enable_unified_coordination: bool = True,
+        # Phase 2: Recursion Control
+        enable_recursion_control: bool = True,
+        recursion_monitor: Optional[RecursionMonitor] = None,
     ) -> None:
         self.llm = llm
         self.tools = tools or {}
@@ -144,11 +148,17 @@
         self.callbacks = callbacks or []
         self.enable_steering = enable_steering
         self.task_handlers = task_handlers or []
-
+
         # Unified coordination
         self.unified_context = unified_context
         self.enable_unified_coordination = enable_unified_coordination
-
+
+        # Phase 2: Recursion control
+        self.enable_recursion_control = enable_recursion_control
+        self.recursion_monitor = recursion_monitor or RecursionMonitor(
+            max_iterations=max_iterations
+        )
+
         # Initialize unified coordination if enabled
         if self.enable_unified_coordination and UnifiedExecutionContext and IntelligentCoordinator:
             self._setup_unified_coordination()
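Seen from the caller's side, the new constructor parameters can be left at their defaults or overridden. A sketch, where llm and tools stand in for whatever the application already passes and max_iterations=10 is an assumed value:

executor = AgentExecutor(
    llm=llm,
    tools=tools,
    max_iterations=10,
    enable_recursion_control=True,  # new in 0.0.5; defaults to True
    recursion_monitor=RecursionMonitor(max_iterations=10),  # optional override
)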
@@ -301,6 +311,56 @@
                 metadata={"parent_turn_id": turn_state.parent_turn_id},
             )
 
+        # Phase 2: Advanced recursion control (optional)
+        if self.enable_recursion_control:
+            # Build recursion state from turn state
+            recursion_state = RecursionState(
+                iteration=turn_state.turn_counter,
+                tool_call_history=turn_state.tool_call_history,
+                error_count=turn_state.error_count,
+                last_outputs=turn_state.last_outputs
+            )
+
+            # Check for termination conditions
+            termination_reason = self.recursion_monitor.check_termination(
+                recursion_state
+            )
+
+            if termination_reason:
+                # Emit termination event
+                yield AgentEvent(
+                    type=AgentEventType.RECURSION_TERMINATED,
+                    metadata={
+                        "reason": termination_reason.value,
+                        "iteration": turn_state.turn_counter,
+                        "tool_call_history": turn_state.tool_call_history[-5:],
+                        "error_count": turn_state.error_count
+                    }
+                )
+
+                # Add termination message to prompt LLM to finish
+                termination_msg = self.recursion_monitor.build_termination_message(
+                    termination_reason
+                )
+
+                # Add termination guidance as system message
+                messages = messages + [
+                    Message(role="system", content=termination_msg)
+                ]
+
+                # Note: We continue execution but with termination guidance
+                # The LLM will receive the termination message and should wrap up
+
+            # Check for early warnings (not terminating yet, just warning)
+            elif warning_msg := self.recursion_monitor.should_add_warning(
+                recursion_state,
+                warning_threshold=0.8
+            ):
+                # Add warning as system message
+                messages = messages + [
+                    Message(role="system", content=warning_msg)
+                ]
+
         # Base case 1: Maximum recursion depth reached
         if turn_state.is_final:
             yield AgentEvent(
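The monitor can also be exercised on its own, which may help when reviewing the new loom/core/recursion_control.py (not shown in this excerpt). A sketch assuming only the names visible above; the concrete termination reasons and detection rules live in that module:

state = RecursionState(
    iteration=9,
    tool_call_history=["search", "search", "search"],
    error_count=0,
    last_outputs=["..."],
)
monitor = RecursionMonitor(max_iterations=10)

reason = monitor.check_termination(state)
if reason:
    # e.g. iteration budget nearly exhausted or a repeated-call loop detected
    print(monitor.build_termination_message(reason))
elif warning := monitor.should_add_warning(state, warning_threshold=0.8):
    print(warning)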
@@ -581,22 +641,37 @@
         # Phase 5: Recursive Call (Tail Recursion)
         # ==========================================
 
-        #
-
+        # Phase 2: Track tool calls and errors for recursion control
+        tool_names_called = [tc.name for tc in tc_models]
+        had_tool_errors = any(r.is_error for r in tool_results)
+
+        # Extract output for loop detection (use first tool result or content)
+        output_sample = None
+        if tool_results:
+            output_sample = tool_results[0].content[:200]  # First 200 chars
+        elif content:
+            output_sample = content[:200]
+
+        # Prepare next turn state with recursion tracking
+        next_state = turn_state.next_turn(
+            compacted=compacted_this_turn,
+            tool_calls=tool_names_called,
+            had_error=had_tool_errors,
+            output=output_sample
+        )
 
-        # Prepare next turn messages with intelligent context guidance
-
+        # Phase 3: Prepare next turn messages with intelligent context guidance
+        # This now includes tool results, compression, and recursion hints
+        next_messages = await self._prepare_recursive_messages(
             messages, tool_results, turn_state, context
         )
-
-        #
-
-
-
-
-
-                tool_call_id=r.tool_call_id,
-            )
+
+        # Check if compression was applied and emit event
+        if "last_compression" in context.metadata:
+            comp_info = context.metadata.pop("last_compression")
+            yield AgentEvent(
+                type=AgentEventType.COMPRESSION_APPLIED,
+                metadata=comp_info
             )
 
         # Emit recursion event
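Downstream, the two new event types surface through the executor's event stream. A hypothetical consumer sketch; the method that yields events is an assumption (named run here for illustration), and only the event types and metadata keys come from this diff:

async def watch(executor, messages):
    # Method name "run" is assumed; event types and metadata keys are from the hunks above.
    async for event in executor.run(messages):
        if event.type == AgentEventType.COMPRESSION_APPLIED:
            meta = event.metadata
            print(f"compressed {meta['tokens_before']} -> {meta['tokens_after']} tokens")
        elif event.type == AgentEventType.RECURSION_TERMINATED:
            print(f"recursion stopped: {event.metadata['reason']}")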
@@ -606,6 +681,8 @@
                 "from_turn": turn_state.turn_id,
                 "to_turn": next_state.turn_id,
                 "depth": next_state.turn_counter,
+                "tools_called": tool_names_called,
+                "message_count": len(next_messages),
             },
         )
 
@@ -617,7 +694,7 @@
     # Intelligent Recursion Methods
     # ==========================================
 
-    def _prepare_recursive_messages(
+    async def _prepare_recursive_messages(
         self,
         messages: List[Message],
         tool_results: List[ToolResult],
@@ -625,22 +702,131 @@
         context: ExecutionContext,
     ) -> List[Message]:
         """
-        Intelligently prepare messages for the recursive call
-
-
+        Phase 3: Intelligently prepare messages for the recursive call
+
+        Ensures tool results are passed on to the next turn correctly and applies any necessary context optimization
+
+        Args:
+            messages: Messages from the current turn
+            tool_results: Tool execution results
+            turn_state: Current turn state
+            context: Execution context
+
+        Returns:
+            The prepared list of messages for the next turn
         """
-        #
+        # 1. Analyze tool results (used to generate intelligent guidance)
         result_analysis = self._analyze_tool_results(tool_results)
-
-        # Get the original task
         original_task = self._extract_original_task(messages)
-
-        # Generate the intelligent guidance message
+
+        # 2. Generate the intelligent guidance message
         guidance_message = self._generate_recursion_guidance(
             original_task, result_analysis, turn_state.turn_counter
         )
-
-
+
+        # 3. Build next-turn messages: user guidance
+        next_messages = [Message(role="user", content=guidance_message)]
+
+        # 4. Append tool result messages (critical: ensure tool results are carried over)
+        for result in tool_results:
+            next_messages.append(Message(
+                role="tool",
+                content=result.content,
+                tool_call_id=result.tool_call_id,
+                metadata=result.metadata or {}
+            ))
+
+        # 5. Phase 3: Check context length
+        estimated_tokens = self._estimate_tokens(next_messages)
+        compression_applied = False
+
+        if estimated_tokens > self.max_context_tokens:
+            # Trigger compression (if a compressor is configured)
+            if self.compressor:
+                tokens_before = estimated_tokens
+                next_messages = await self._compress_messages(next_messages)
+                tokens_after = self._estimate_tokens(next_messages)
+                compression_applied = True
+
+                # Store compression info for later emission
+                context.metadata["last_compression"] = {
+                    "tokens_before": tokens_before,
+                    "tokens_after": tokens_after,
+                    "trigger": "recursive_message_preparation"
+                }
+
+        # 6. Phase 3: Add a recursion-depth hint (during deep recursion)
+        if turn_state.turn_counter > 3:
+            hint_content = self._build_recursion_hint(
+                turn_state.turn_counter,
+                turn_state.max_iterations
+            )
+
+            hint = Message(
+                role="system",
+                content=hint_content
+            )
+            next_messages.append(hint)
+
+        return next_messages
+
+    def _estimate_tokens(self, messages: List[Message]) -> int:
+        """
+        Estimate the token count of a list of messages
+
+        Uses a simple heuristic: character count / 4
+        Production deployments should use the target model's tokenizer
+        """
+        return count_messages_tokens(messages)
+
+    async def _compress_messages(
+        self,
+        messages: List[Message]
+    ) -> List[Message]:
+        """
+        Compress the message list (if a compressor is configured)
+
+        Calls the configured compressor to reduce the context length
+        """
+        if not self.compressor:
+            return messages
+
+        try:
+            compressed, metadata = await self.compressor.compress(messages)
+
+            # Update compression metrics
+            self.metrics.metrics.compressions = (
+                getattr(self.metrics.metrics, "compressions", 0) + 1
+            )
+
+            return compressed
+        except Exception as e:
+            # If compression fails, return original messages
+            self.metrics.metrics.total_errors += 1
+            await self._emit(
+                "error",
+                {"stage": "message_compression", "message": str(e)}
+            )
+            return messages
+
+    def _build_recursion_hint(self, current_depth: int, max_depth: int) -> str:
+        """
+        Build the recursion-depth hint message
+
+        Reminds the LLM to track progress and avoid repetition during deep recursion
+        """
+        remaining = max_depth - current_depth
+        progress = (current_depth / max_depth) * 100
+
+        hint = f"""🔄 Recursion Status:
+- Depth: {current_depth}/{max_depth} ({progress:.0f}% of maximum)
+- Remaining iterations: {remaining}
+
+Please review the tool results above and make meaningful progress towards completing the task.
+Avoid calling the same tool repeatedly with the same arguments unless necessary.
+If you have enough information, please provide your final answer."""
+
+        return hint
 
     def _analyze_tool_results(self, tool_results: List[ToolResult]) -> Dict[str, Any]:
         """Analyze the type and quality of tool results"""