agno 2.2.10__py3-none-any.whl → 2.2.12__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agno/agent/agent.py +75 -48
- agno/db/dynamo/utils.py +1 -1
- agno/db/firestore/utils.py +1 -1
- agno/db/gcs_json/utils.py +1 -1
- agno/db/in_memory/utils.py +1 -1
- agno/db/json/utils.py +1 -1
- agno/db/mongo/utils.py +3 -3
- agno/db/mysql/mysql.py +1 -1
- agno/db/mysql/utils.py +1 -1
- agno/db/postgres/utils.py +1 -1
- agno/db/redis/utils.py +1 -1
- agno/db/singlestore/singlestore.py +1 -1
- agno/db/singlestore/utils.py +1 -1
- agno/db/sqlite/async_sqlite.py +1 -1
- agno/db/sqlite/sqlite.py +1 -1
- agno/db/sqlite/utils.py +1 -1
- agno/filters.py +354 -0
- agno/knowledge/chunking/agentic.py +8 -9
- agno/knowledge/chunking/strategy.py +59 -15
- agno/knowledge/embedder/sentence_transformer.py +6 -2
- agno/knowledge/knowledge.py +43 -22
- agno/knowledge/reader/base.py +6 -2
- agno/knowledge/utils.py +20 -0
- agno/models/anthropic/claude.py +45 -9
- agno/models/base.py +4 -0
- agno/os/app.py +23 -7
- agno/os/interfaces/slack/router.py +53 -33
- agno/os/interfaces/slack/slack.py +9 -1
- agno/os/router.py +25 -1
- agno/os/routers/health.py +5 -3
- agno/os/routers/knowledge/knowledge.py +43 -17
- agno/os/routers/knowledge/schemas.py +4 -3
- agno/run/agent.py +11 -1
- agno/run/base.py +3 -2
- agno/session/agent.py +10 -5
- agno/team/team.py +57 -18
- agno/tools/file_generation.py +4 -4
- agno/tools/gmail.py +179 -0
- agno/tools/parallel.py +314 -0
- agno/utils/agent.py +22 -17
- agno/utils/gemini.py +15 -5
- agno/utils/knowledge.py +12 -5
- agno/utils/log.py +1 -0
- agno/utils/models/claude.py +2 -1
- agno/utils/print_response/agent.py +5 -4
- agno/utils/print_response/team.py +5 -4
- agno/vectordb/base.py +2 -4
- agno/vectordb/cassandra/cassandra.py +12 -5
- agno/vectordb/chroma/chromadb.py +10 -4
- agno/vectordb/clickhouse/clickhousedb.py +12 -4
- agno/vectordb/couchbase/couchbase.py +12 -3
- agno/vectordb/lancedb/lance_db.py +69 -144
- agno/vectordb/langchaindb/langchaindb.py +13 -4
- agno/vectordb/lightrag/lightrag.py +8 -3
- agno/vectordb/llamaindex/llamaindexdb.py +10 -4
- agno/vectordb/milvus/milvus.py +16 -5
- agno/vectordb/mongodb/mongodb.py +14 -3
- agno/vectordb/pgvector/pgvector.py +73 -15
- agno/vectordb/pineconedb/pineconedb.py +6 -2
- agno/vectordb/qdrant/qdrant.py +25 -13
- agno/vectordb/redis/redisdb.py +37 -30
- agno/vectordb/singlestore/singlestore.py +9 -4
- agno/vectordb/surrealdb/surrealdb.py +13 -3
- agno/vectordb/upstashdb/upstashdb.py +8 -5
- agno/vectordb/weaviate/weaviate.py +29 -12
- agno/workflow/step.py +3 -2
- agno/workflow/types.py +20 -1
- agno/workflow/workflow.py +103 -14
- {agno-2.2.10.dist-info → agno-2.2.12.dist-info}/METADATA +4 -1
- {agno-2.2.10.dist-info → agno-2.2.12.dist-info}/RECORD +73 -71
- {agno-2.2.10.dist-info → agno-2.2.12.dist-info}/WHEEL +0 -0
- {agno-2.2.10.dist-info → agno-2.2.12.dist-info}/licenses/LICENSE +0 -0
- {agno-2.2.10.dist-info → agno-2.2.12.dist-info}/top_level.txt +0 -0
agno/filters.py
ADDED
|
@@ -0,0 +1,354 @@
|
|
|
1
|
+
"""Search filter expressions for filtering knowledge base documents and search results.
|
|
2
|
+
|
|
3
|
+
This module provides a set of filter operators for constructing complex search queries
|
|
4
|
+
that can be applied to knowledge bases, vector databases, and other searchable content.
|
|
5
|
+
|
|
6
|
+
Filter Types:
|
|
7
|
+
- Comparison: EQ (equals), GT (greater than), LT (less than)
|
|
8
|
+
- Inclusion: IN (value in list)
|
|
9
|
+
- Logical: AND, OR, NOT
|
|
10
|
+
|
|
11
|
+
Example:
|
|
12
|
+
>>> from agno.filters import EQ, GT, IN, AND, OR, NOT
|
|
13
|
+
>>>
|
|
14
|
+
>>> # Simple equality filter
|
|
15
|
+
>>> filter = EQ("category", "technology")
|
|
16
|
+
>>>
|
|
17
|
+
>>> # Complex filter with multiple conditions
|
|
18
|
+
>>> filter = AND(
|
|
19
|
+
... EQ("status", "published"),
|
|
20
|
+
... GT("views", 1000),
|
|
21
|
+
... IN("category", ["tech", "science"])
|
|
22
|
+
... )
|
|
23
|
+
>>>
|
|
24
|
+
>>> # Using OR logic
|
|
25
|
+
>>> filter = OR(EQ("priority", "high"), EQ("urgent", True))
|
|
26
|
+
>>>
|
|
27
|
+
>>> # Negating conditions
|
|
28
|
+
>>> filter = NOT(EQ("status", "archived"))
|
|
29
|
+
>>>
|
|
30
|
+
>>> # Complex nested logic
|
|
31
|
+
>>> filter = OR(
|
|
32
|
+
... AND(EQ("type", "article"), GT("word_count", 500)),
|
|
33
|
+
... AND(EQ("type", "tutorial"), NOT(EQ("difficulty", "beginner")))
|
|
34
|
+
... )
|
|
35
|
+
"""
|
|
36
|
+
|
|
37
|
+
from __future__ import annotations
|
|
38
|
+
|
|
39
|
+
from typing import Any, List
|
|
40
|
+
|
|
41
|
+
# ============================================================
|
|
42
|
+
# Base Expression
|
|
43
|
+
# ============================================================
|
|
44
|
+
|
|
45
|
+
|
|
46
|
+
class FilterExpr:
    """Abstract base for all search-filter expressions.

    Concrete subclasses (EQ, IN, GT, LT, AND, OR, NOT) implement
    ``to_dict`` so a filter tree can be serialized for transport.
    Expressions also compose through Python operator overloads:

    - ``a | b``  -> OR(a, b)
    - ``a & b``  -> AND(a, b)
    - ``~a``     -> NOT(a)

    Example:
        >>> # (status == "active" AND age > 18) OR role == "admin"
        >>> expr = OR(AND(EQ("status", "active"), GT("age", 18)), EQ("role", "admin"))
        >>> # Same tree built with operators:
        >>> expr = (EQ("status", "active") & GT("age", 18)) | EQ("role", "admin")
    """

    def __or__(self, other: FilterExpr) -> OR:
        """Return an OR expression combining this filter with ``other``."""
        return OR(self, other)

    def __and__(self, other: FilterExpr) -> AND:
        """Return an AND expression combining this filter with ``other``."""
        return AND(self, other)

    def __invert__(self) -> NOT:
        """Return a NOT expression negating this filter."""
        return NOT(self)

    def to_dict(self) -> dict:
        """Serialize this expression to a plain dictionary (subclass responsibility)."""
        raise NotImplementedError("Subclasses must implement to_dict()")

    def __repr__(self) -> str:
        return f"{self.__class__.__name__}({self.__dict__})"
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
# ============================================================
|
|
82
|
+
# Comparison & Inclusion Filters
|
|
83
|
+
# ============================================================
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
class EQ(FilterExpr):
    """Exact-match filter: true when field ``key`` equals ``value``.

    Args:
        key: Name of the metadata field to test.
        value: Value the field must equal.

    Example:
        >>> # Documents whose status is "published"
        >>> EQ("status", "published")
        >>> # Documents whose author_id is 123
        >>> EQ("author_id", 123)
    """

    def __init__(self, key: str, value: Any):
        self.key = key
        self.value = value

    def to_dict(self) -> dict:
        return {"op": "EQ", "key": self.key, "value": self.value}
|
|
107
|
+
|
|
108
|
+
|
|
109
|
+
class IN(FilterExpr):
    """Membership filter: true when field ``key``'s value appears in ``values``.

    Args:
        key: Name of the metadata field to test.
        values: The list of acceptable values.

    Example:
        >>> # Documents whose category is one of tech / science / engineering
        >>> IN("category", ["tech", "science", "engineering"])
        >>> # Documents whose status is draft or published
        >>> IN("status", ["draft", "published"])
    """

    def __init__(self, key: str, values: List[Any]):
        self.key = key
        self.values = values

    def to_dict(self) -> dict:
        return {"op": "IN", "key": self.key, "values": self.values}
|
|
130
|
+
|
|
131
|
+
|
|
132
|
+
class GT(FilterExpr):
    """Threshold filter: true when field ``key`` is strictly greater than ``value``.

    Args:
        key: Name of the metadata field to compare.
        value: The lower-bound threshold.

    Example:
        >>> GT("age", 18)               # age greater than 18
        >>> GT("price", 100.0)          # price greater than 100.0
        >>> GT("created_at", 1234567890)  # created after a timestamp
    """

    def __init__(self, key: str, value: Any):
        self.key = key
        self.value = value

    def to_dict(self) -> dict:
        return {"op": "GT", "key": self.key, "value": self.value}
|
|
156
|
+
|
|
157
|
+
|
|
158
|
+
class LT(FilterExpr):
    """Threshold filter: true when field ``key`` is strictly less than ``value``.

    Args:
        key: Name of the metadata field to compare.
        value: The upper-bound threshold.

    Example:
        >>> LT("age", 65)               # age less than 65
        >>> LT("price", 50.0)           # price less than 50.0
        >>> LT("created_at", 1234567890)  # created before a timestamp
    """

    def __init__(self, key: str, value: Any):
        self.key = key
        self.value = value

    def to_dict(self) -> dict:
        return {"op": "LT", "key": self.key, "value": self.value}
|
|
182
|
+
|
|
183
|
+
|
|
184
|
+
# ============================================================
|
|
185
|
+
# Logical Operators
|
|
186
|
+
# ============================================================
|
|
187
|
+
|
|
188
|
+
|
|
189
|
+
class AND(FilterExpr):
    """Conjunction: true only when every child expression matches.

    Args:
        *expressions: FilterExpr objects that must all be satisfied.

    Example:
        >>> AND(EQ("status", "published"), GT("age", 18))
        >>> AND(
        ...     EQ("status", "active"),
        ...     GT("score", 80),
        ...     IN("category", ["tech", "science"]),
        ... )
    """

    def __init__(self, *expressions: FilterExpr):
        self.expressions = [*expressions]

    def to_dict(self) -> dict:
        return {"op": "AND", "conditions": [expr.to_dict() for expr in self.expressions]}
|
|
215
|
+
|
|
216
|
+
|
|
217
|
+
class OR(FilterExpr):
    """Disjunction: true when at least one child expression matches.

    Args:
        *expressions: FilterExpr objects, any of which may be satisfied.

    Example:
        >>> OR(EQ("status", "published"), EQ("status", "archived"))
        >>> # VIP members or high scorers
        >>> OR(EQ("membership", "VIP"), GT("score", 1000))
    """

    def __init__(self, *expressions: FilterExpr):
        self.expressions = [*expressions]

    def to_dict(self) -> dict:
        return {"op": "OR", "conditions": [expr.to_dict() for expr in self.expressions]}
|
|
242
|
+
|
|
243
|
+
|
|
244
|
+
class NOT(FilterExpr):
    """Negation: true when the wrapped expression does NOT match.

    Args:
        expression: The FilterExpr to negate.

    Example:
        >>> NOT(EQ("status", "draft"))
        >>> NOT(AND(EQ("status", "inactive"), LT("score", 10)))
        >>> NOT(IN("user_id", [101, 102, 103]))
    """

    def __init__(self, expression: FilterExpr):
        self.expression = expression

    def to_dict(self) -> dict:
        return {"op": "NOT", "condition": self.expression.to_dict()}
|
|
268
|
+
|
|
269
|
+
|
|
270
|
+
# ============================================================
|
|
271
|
+
# Deserialization
|
|
272
|
+
# ============================================================
|
|
273
|
+
|
|
274
|
+
|
|
275
|
+
def from_dict(filter_dict: dict) -> FilterExpr:
    """Reconstruct a FilterExpr object from its dictionary representation.

    Deserializes filter expressions produced by ``to_dict()``, enabling
    filters to be passed through JSON APIs and rebuilt on the server side.

    Args:
        filter_dict: Dictionary representation of a filter expression. Must
            contain an ``"op"`` key naming the operator, plus that operator's
            required fields (``key``/``value`` for EQ/GT/LT, ``key``/``values``
            for IN, ``conditions`` for AND/OR, ``condition`` for NOT).

    Returns:
        FilterExpr: The reconstructed filter expression object.

    Raises:
        ValueError: If the dictionary is malformed, a required field is
            missing, ``conditions`` is not a list, or the operator is unknown.

    Example:
        >>> reconstructed = from_dict({"op": "EQ", "key": "status", "value": "published"})
        >>> # Round-trip a nested filter:
        >>> tree = OR(AND(EQ("type", "article"), GT("views", 1000)), IN("priority", ["high", "urgent"]))
        >>> rebuilt = from_dict(tree.to_dict())
    """
    if not isinstance(filter_dict, dict) or "op" not in filter_dict:
        raise ValueError(f"Invalid filter dictionary: must contain 'op' key. Got: {filter_dict}")

    op = filter_dict["op"]

    # Leaf comparison operators share the same shape; dispatch via lookup
    # instead of four duplicated branches.
    if op in ("EQ", "GT", "LT"):
        if "key" not in filter_dict or "value" not in filter_dict:
            raise ValueError(f"{op} filter requires 'key' and 'value' fields. Got: {filter_dict}")
        constructor = {"EQ": EQ, "GT": GT, "LT": LT}[op]
        return constructor(filter_dict["key"], filter_dict["value"])

    elif op == "IN":
        if "key" not in filter_dict or "values" not in filter_dict:
            raise ValueError(f"IN filter requires 'key' and 'values' fields. Got: {filter_dict}")
        return IN(filter_dict["key"], filter_dict["values"])

    # Logical operators recurse into their child expressions.
    elif op in ("AND", "OR"):
        if "conditions" not in filter_dict:
            raise ValueError(f"{op} filter requires 'conditions' field. Got: {filter_dict}")
        raw_conditions = filter_dict["conditions"]
        # Guard against a non-list payload (e.g. a string), which would
        # otherwise surface as an opaque TypeError or iterate characters.
        if not isinstance(raw_conditions, list):
            raise ValueError(f"{op} filter 'conditions' must be a list. Got: {raw_conditions}")
        conditions = [from_dict(cond) for cond in raw_conditions]
        return AND(*conditions) if op == "AND" else OR(*conditions)

    elif op == "NOT":
        if "condition" not in filter_dict:
            raise ValueError(f"NOT filter requires 'condition' field. Got: {filter_dict}")
        return NOT(from_dict(filter_dict["condition"]))

    else:
        raise ValueError(f"Unknown filter operator: {op}")
|
|
@@ -20,13 +20,12 @@ class AgenticChunking(ChunkingStrategy):
|
|
|
20
20
|
except Exception:
|
|
21
21
|
raise ValueError("`openai` isn't installed. Please install it with `pip install openai`")
|
|
22
22
|
model = OpenAIChat(DEFAULT_OPENAI_MODEL_ID)
|
|
23
|
-
|
|
24
|
-
self.max_chunk_size = max_chunk_size
|
|
23
|
+
self.chunk_size = max_chunk_size
|
|
25
24
|
self.model = model
|
|
26
25
|
|
|
27
26
|
def chunk(self, document: Document) -> List[Document]:
|
|
28
27
|
"""Split text into chunks using LLM to determine natural breakpoints based on context"""
|
|
29
|
-
if len(document.content) <= self.
|
|
28
|
+
if len(document.content) <= self.chunk_size:
|
|
30
29
|
return [document]
|
|
31
30
|
|
|
32
31
|
chunks: List[Document] = []
|
|
@@ -35,22 +34,22 @@ class AgenticChunking(ChunkingStrategy):
|
|
|
35
34
|
chunk_number = 1
|
|
36
35
|
|
|
37
36
|
while remaining_text:
|
|
38
|
-
# Ask model to find a good breakpoint within
|
|
39
|
-
prompt = f"""Analyze this text and determine a natural breakpoint within the first {self.
|
|
37
|
+
# Ask model to find a good breakpoint within chunk_size
|
|
38
|
+
prompt = f"""Analyze this text and determine a natural breakpoint within the first {self.chunk_size} characters.
|
|
40
39
|
Consider semantic completeness, paragraph boundaries, and topic transitions.
|
|
41
40
|
Return only the character position number of where to break the text:
|
|
42
41
|
|
|
43
|
-
{remaining_text[: self.
|
|
42
|
+
{remaining_text[: self.chunk_size]}"""
|
|
44
43
|
|
|
45
44
|
try:
|
|
46
45
|
response = self.model.response([Message(role="user", content=prompt)])
|
|
47
46
|
if response and response.content:
|
|
48
|
-
break_point = min(int(response.content.strip()), self.
|
|
47
|
+
break_point = min(int(response.content.strip()), self.chunk_size)
|
|
49
48
|
else:
|
|
50
|
-
break_point = self.
|
|
49
|
+
break_point = self.chunk_size
|
|
51
50
|
except Exception:
|
|
52
51
|
# Fallback to max size if model fails
|
|
53
|
-
break_point = self.
|
|
52
|
+
break_point = self.chunk_size
|
|
54
53
|
|
|
55
54
|
# Extract chunk and update remaining text
|
|
56
55
|
chunk = remaining_text[:break_point].strip()
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
from abc import ABC, abstractmethod
|
|
2
2
|
from enum import Enum
|
|
3
|
-
from typing import List
|
|
3
|
+
from typing import List, Optional
|
|
4
4
|
|
|
5
5
|
from agno.knowledge.document.base import Document
|
|
6
6
|
|
|
@@ -60,7 +60,13 @@ class ChunkingStrategyFactory:
|
|
|
60
60
|
"""Factory for creating chunking strategy instances."""
|
|
61
61
|
|
|
62
62
|
@classmethod
|
|
63
|
-
def create_strategy(
|
|
63
|
+
def create_strategy(
|
|
64
|
+
cls,
|
|
65
|
+
strategy_type: ChunkingStrategyType,
|
|
66
|
+
chunk_size: Optional[int] = None,
|
|
67
|
+
overlap: Optional[int] = None,
|
|
68
|
+
**kwargs,
|
|
69
|
+
) -> ChunkingStrategy:
|
|
64
70
|
"""Create an instance of the chunking strategy with the given parameters."""
|
|
65
71
|
strategy_map = {
|
|
66
72
|
ChunkingStrategyType.AGENTIC_CHUNKER: cls._create_agentic_chunking,
|
|
@@ -71,51 +77,89 @@ class ChunkingStrategyFactory:
|
|
|
71
77
|
ChunkingStrategyType.ROW_CHUNKER: cls._create_row_chunking,
|
|
72
78
|
ChunkingStrategyType.MARKDOWN_CHUNKER: cls._create_markdown_chunking,
|
|
73
79
|
}
|
|
74
|
-
return strategy_map[strategy_type](**kwargs)
|
|
80
|
+
return strategy_map[strategy_type](chunk_size=chunk_size, overlap=overlap, **kwargs)
|
|
75
81
|
|
|
76
82
|
@classmethod
|
|
77
|
-
def _create_agentic_chunking(
|
|
83
|
+
def _create_agentic_chunking(
|
|
84
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
85
|
+
) -> ChunkingStrategy:
|
|
78
86
|
from agno.knowledge.chunking.agentic import AgenticChunking
|
|
79
87
|
|
|
80
|
-
#
|
|
81
|
-
if
|
|
82
|
-
kwargs["max_chunk_size"] =
|
|
88
|
+
# AgenticChunking accepts max_chunk_size (not chunk_size) and no overlap
|
|
89
|
+
if chunk_size is not None:
|
|
90
|
+
kwargs["max_chunk_size"] = chunk_size
|
|
91
|
+
# Remove overlap since AgenticChunking doesn't support it
|
|
83
92
|
return AgenticChunking(**kwargs)
|
|
84
93
|
|
|
85
94
|
@classmethod
|
|
86
|
-
def _create_document_chunking(
|
|
95
|
+
def _create_document_chunking(
|
|
96
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
97
|
+
) -> ChunkingStrategy:
|
|
87
98
|
from agno.knowledge.chunking.document import DocumentChunking
|
|
88
99
|
|
|
100
|
+
# DocumentChunking accepts both chunk_size and overlap
|
|
101
|
+
if chunk_size is not None:
|
|
102
|
+
kwargs["chunk_size"] = chunk_size
|
|
103
|
+
if overlap is not None:
|
|
104
|
+
kwargs["overlap"] = overlap
|
|
89
105
|
return DocumentChunking(**kwargs)
|
|
90
106
|
|
|
91
107
|
@classmethod
|
|
92
|
-
def _create_recursive_chunking(
|
|
108
|
+
def _create_recursive_chunking(
|
|
109
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
110
|
+
) -> ChunkingStrategy:
|
|
93
111
|
from agno.knowledge.chunking.recursive import RecursiveChunking
|
|
94
112
|
|
|
113
|
+
# RecursiveChunking accepts both chunk_size and overlap
|
|
114
|
+
if chunk_size is not None:
|
|
115
|
+
kwargs["chunk_size"] = chunk_size
|
|
116
|
+
if overlap is not None:
|
|
117
|
+
kwargs["overlap"] = overlap
|
|
95
118
|
return RecursiveChunking(**kwargs)
|
|
96
119
|
|
|
97
120
|
@classmethod
|
|
98
|
-
def _create_semantic_chunking(
|
|
121
|
+
def _create_semantic_chunking(
|
|
122
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
123
|
+
) -> ChunkingStrategy:
|
|
99
124
|
from agno.knowledge.chunking.semantic import SemanticChunking
|
|
100
125
|
|
|
126
|
+
# SemanticChunking accepts chunk_size but not overlap
|
|
127
|
+
if chunk_size is not None:
|
|
128
|
+
kwargs["chunk_size"] = chunk_size
|
|
129
|
+
# Remove overlap since SemanticChunking doesn't support it
|
|
101
130
|
return SemanticChunking(**kwargs)
|
|
102
131
|
|
|
103
132
|
@classmethod
|
|
104
|
-
def _create_fixed_chunking(
|
|
133
|
+
def _create_fixed_chunking(
|
|
134
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
135
|
+
) -> ChunkingStrategy:
|
|
105
136
|
from agno.knowledge.chunking.fixed import FixedSizeChunking
|
|
106
137
|
|
|
138
|
+
# FixedSizeChunking accepts both chunk_size and overlap
|
|
139
|
+
if chunk_size is not None:
|
|
140
|
+
kwargs["chunk_size"] = chunk_size
|
|
141
|
+
if overlap is not None:
|
|
142
|
+
kwargs["overlap"] = overlap
|
|
107
143
|
return FixedSizeChunking(**kwargs)
|
|
108
144
|
|
|
109
145
|
@classmethod
|
|
110
|
-
def _create_row_chunking(
|
|
146
|
+
def _create_row_chunking(
|
|
147
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
148
|
+
) -> ChunkingStrategy:
|
|
111
149
|
from agno.knowledge.chunking.row import RowChunking
|
|
112
150
|
|
|
113
|
-
#
|
|
114
|
-
kwargs.pop("chunk_size", None)
|
|
151
|
+
# RowChunking doesn't accept chunk_size or overlap, only skip_header and clean_rows
|
|
115
152
|
return RowChunking(**kwargs)
|
|
116
153
|
|
|
117
154
|
@classmethod
|
|
118
|
-
def _create_markdown_chunking(
|
|
155
|
+
def _create_markdown_chunking(
|
|
156
|
+
cls, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
157
|
+
) -> ChunkingStrategy:
|
|
119
158
|
from agno.knowledge.chunking.markdown import MarkdownChunking
|
|
120
159
|
|
|
160
|
+
# MarkdownChunking accepts both chunk_size and overlap
|
|
161
|
+
if chunk_size is not None:
|
|
162
|
+
kwargs["chunk_size"] = chunk_size
|
|
163
|
+
if overlap is not None:
|
|
164
|
+
kwargs["overlap"] = overlap
|
|
121
165
|
return MarkdownChunking(**kwargs)
|
|
@@ -25,10 +25,14 @@ class SentenceTransformerEmbedder(Embedder):
|
|
|
25
25
|
prompt: Optional[str] = None
|
|
26
26
|
normalize_embeddings: bool = False
|
|
27
27
|
|
|
28
|
-
def
|
|
29
|
-
|
|
28
|
+
def __post_init__(self):
|
|
29
|
+
# Initialize the SentenceTransformer model eagerly to avoid race conditions in async contexts
|
|
30
|
+
if self.sentence_transformer_client is None:
|
|
30
31
|
self.sentence_transformer_client = SentenceTransformer(model_name_or_path=self.id)
|
|
31
32
|
|
|
33
|
+
def get_embedding(self, text: Union[str, List[str]]) -> List[float]:
|
|
34
|
+
if self.sentence_transformer_client is None:
|
|
35
|
+
raise RuntimeError("SentenceTransformer model not initialized")
|
|
32
36
|
model = self.sentence_transformer_client
|
|
33
37
|
embedding = model.encode(text, prompt=self.prompt, normalize_embeddings=self.normalize_embeddings)
|
|
34
38
|
try:
|
agno/knowledge/knowledge.py
CHANGED
|
@@ -13,6 +13,7 @@ from httpx import AsyncClient
|
|
|
13
13
|
|
|
14
14
|
from agno.db.base import AsyncBaseDb, BaseDb
|
|
15
15
|
from agno.db.schemas.knowledge import KnowledgeRow
|
|
16
|
+
from agno.filters import FilterExpr
|
|
16
17
|
from agno.knowledge.content import Content, ContentAuth, ContentStatus, FileData
|
|
17
18
|
from agno.knowledge.document import Document
|
|
18
19
|
from agno.knowledge.reader import Reader, ReaderFactory
|
|
@@ -403,7 +404,7 @@ class Knowledge:
|
|
|
403
404
|
|
|
404
405
|
if path.is_file():
|
|
405
406
|
if self._should_include_file(str(path), include, exclude):
|
|
406
|
-
|
|
407
|
+
log_debug(f"Adding file {path} due to include/exclude filters")
|
|
407
408
|
|
|
408
409
|
await self._add_to_contents_db(content)
|
|
409
410
|
if self._should_skip(content.content_hash, skip_if_exists): # type: ignore[arg-type]
|
|
@@ -1392,7 +1393,7 @@ class Knowledge:
|
|
|
1392
1393
|
self,
|
|
1393
1394
|
query: str,
|
|
1394
1395
|
max_results: Optional[int] = None,
|
|
1395
|
-
filters: Optional[Dict[str, Any]] = None,
|
|
1396
|
+
filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None,
|
|
1396
1397
|
search_type: Optional[str] = None,
|
|
1397
1398
|
) -> List[Document]:
|
|
1398
1399
|
"""Returns relevant documents matching a query"""
|
|
@@ -1423,7 +1424,7 @@ class Knowledge:
|
|
|
1423
1424
|
self,
|
|
1424
1425
|
query: str,
|
|
1425
1426
|
max_results: Optional[int] = None,
|
|
1426
|
-
filters: Optional[Dict[str, Any]] = None,
|
|
1427
|
+
filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None,
|
|
1427
1428
|
search_type: Optional[str] = None,
|
|
1428
1429
|
) -> List[Document]:
|
|
1429
1430
|
"""Returns relevant documents matching a query"""
|
|
@@ -1465,38 +1466,58 @@ class Knowledge:
|
|
|
1465
1466
|
self.valid_metadata_filters.update(await self._aget_filters_from_db())
|
|
1466
1467
|
return self.valid_metadata_filters
|
|
1467
1468
|
|
|
1468
|
-
def _validate_filters(self, filters: Optional[Dict[str, Any]]) -> Tuple[
|
|
1469
|
+
def _validate_filters(self, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]]) -> Tuple[Any, List[str]]:
|
|
1470
|
+
"""Internal method to validate filters against known metadata keys."""
|
|
1469
1471
|
if not filters:
|
|
1470
|
-
return
|
|
1472
|
+
return None, []
|
|
1471
1473
|
|
|
1472
|
-
valid_filters: Dict[str, Any] =
|
|
1474
|
+
valid_filters: Optional[Dict[str, Any]] = None
|
|
1473
1475
|
invalid_keys = []
|
|
1474
1476
|
|
|
1475
|
-
|
|
1476
|
-
|
|
1477
|
-
|
|
1478
|
-
|
|
1479
|
-
|
|
1480
|
-
|
|
1481
|
-
|
|
1482
|
-
|
|
1483
|
-
|
|
1484
|
-
|
|
1485
|
-
|
|
1486
|
-
|
|
1487
|
-
|
|
1488
|
-
|
|
1477
|
+
if isinstance(filters, dict):
|
|
1478
|
+
# If no metadata filters tracked yet, all keys are considered invalid
|
|
1479
|
+
if self.valid_metadata_filters is None:
|
|
1480
|
+
invalid_keys = list(filters.keys())
|
|
1481
|
+
log_debug(f"No valid metadata filters tracked yet. All filter keys considered invalid: {invalid_keys}")
|
|
1482
|
+
return None, invalid_keys
|
|
1483
|
+
|
|
1484
|
+
valid_filters = {}
|
|
1485
|
+
for key, value in filters.items():
|
|
1486
|
+
# Handle both normal keys and prefixed keys like meta_data.key
|
|
1487
|
+
base_key = key.split(".")[-1] if "." in key else key
|
|
1488
|
+
if base_key in self.valid_metadata_filters or key in self.valid_metadata_filters:
|
|
1489
|
+
valid_filters[key] = value
|
|
1490
|
+
else:
|
|
1491
|
+
invalid_keys.append(key)
|
|
1492
|
+
log_debug(f"Invalid filter key: {key} - not present in knowledge base")
|
|
1493
|
+
|
|
1494
|
+
elif isinstance(filters, List):
|
|
1495
|
+
# Validate that list contains FilterExpr instances
|
|
1496
|
+
for i, filter_item in enumerate(filters):
|
|
1497
|
+
if not isinstance(filter_item, FilterExpr):
|
|
1498
|
+
log_warning(
|
|
1499
|
+
f"Invalid filter at index {i}: expected FilterExpr instance, "
|
|
1500
|
+
f"got {type(filter_item).__name__}. "
|
|
1501
|
+
f"Use filter expressions like EQ('key', 'value'), IN('key', [values]), "
|
|
1502
|
+
f"AND(...), OR(...), NOT(...) from agno.filters"
|
|
1503
|
+
)
|
|
1504
|
+
|
|
1505
|
+
# Filter expressions are already validated, return empty dict/list
|
|
1506
|
+
# The actual filtering happens in the vector_db layer
|
|
1507
|
+
return filters, []
|
|
1489
1508
|
|
|
1490
1509
|
return valid_filters, invalid_keys
|
|
1491
1510
|
|
|
1492
|
-
def validate_filters(self, filters: Optional[Dict[str, Any]]) -> Tuple[
|
|
1511
|
+
def validate_filters(self, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]]) -> Tuple[Any, List[str]]:
|
|
1493
1512
|
if self.valid_metadata_filters is None:
|
|
1494
1513
|
self.valid_metadata_filters = set()
|
|
1495
1514
|
self.valid_metadata_filters.update(self._get_filters_from_db())
|
|
1496
1515
|
|
|
1497
1516
|
return self._validate_filters(filters)
|
|
1498
1517
|
|
|
1499
|
-
async def async_validate_filters(
|
|
1518
|
+
async def async_validate_filters(
|
|
1519
|
+
self, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]]
|
|
1520
|
+
) -> Tuple[Any, List[str]]:
|
|
1500
1521
|
if self.valid_metadata_filters is None:
|
|
1501
1522
|
self.valid_metadata_filters = set()
|
|
1502
1523
|
self.valid_metadata_filters.update(await self._aget_filters_from_db())
|
agno/knowledge/reader/base.py
CHANGED
|
@@ -44,11 +44,15 @@ class Reader:
|
|
|
44
44
|
self.max_results = max_results
|
|
45
45
|
self.encoding = encoding
|
|
46
46
|
|
|
47
|
-
def set_chunking_strategy_from_string(
|
|
47
|
+
def set_chunking_strategy_from_string(
|
|
48
|
+
self, strategy_name: str, chunk_size: Optional[int] = None, overlap: Optional[int] = None, **kwargs
|
|
49
|
+
) -> None:
|
|
48
50
|
"""Set the chunking strategy from a string name."""
|
|
49
51
|
try:
|
|
50
52
|
strategy_type = ChunkingStrategyType.from_string(strategy_name)
|
|
51
|
-
self.chunking_strategy = ChunkingStrategyFactory.create_strategy(
|
|
53
|
+
self.chunking_strategy = ChunkingStrategyFactory.create_strategy(
|
|
54
|
+
strategy_type, chunk_size=chunk_size, overlap=overlap, **kwargs
|
|
55
|
+
)
|
|
52
56
|
except ValueError as e:
|
|
53
57
|
raise ValueError(f"Failed to set chunking strategy: {e}")
|
|
54
58
|
|