PyPI - agno - Versions diffs - 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl - Mend

agno 2.1.2 (py3-none-any.whl) → 2.3.13 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (314)

agno/agent/agent.py +5540 -2273
agno/api/api.py +2 -0
agno/api/os.py +1 -1
agno/compression/__init__.py +3 -0
agno/compression/manager.py +247 -0
agno/culture/__init__.py +3 -0
agno/culture/manager.py +956 -0
agno/db/async_postgres/__init__.py +3 -0
agno/db/base.py +689 -6
agno/db/dynamo/dynamo.py +933 -37
agno/db/dynamo/schemas.py +174 -10
agno/db/dynamo/utils.py +63 -4
agno/db/firestore/firestore.py +831 -9
agno/db/firestore/schemas.py +51 -0
agno/db/firestore/utils.py +102 -4
agno/db/gcs_json/gcs_json_db.py +660 -12
agno/db/gcs_json/utils.py +60 -26
agno/db/in_memory/in_memory_db.py +287 -14
agno/db/in_memory/utils.py +60 -2
agno/db/json/json_db.py +590 -14
agno/db/json/utils.py +60 -26
agno/db/migrations/manager.py +199 -0
agno/db/migrations/v1_to_v2.py +43 -13
agno/db/migrations/versions/__init__.py +0 -0
agno/db/migrations/versions/v2_3_0.py +938 -0
agno/db/mongo/__init__.py +15 -1
agno/db/mongo/async_mongo.py +2760 -0
agno/db/mongo/mongo.py +879 -11
agno/db/mongo/schemas.py +42 -0
agno/db/mongo/utils.py +80 -8
agno/db/mysql/__init__.py +2 -1
agno/db/mysql/async_mysql.py +2912 -0
agno/db/mysql/mysql.py +946 -68
agno/db/mysql/schemas.py +72 -10
agno/db/mysql/utils.py +198 -7
agno/db/postgres/__init__.py +2 -1
agno/db/postgres/async_postgres.py +2579 -0
agno/db/postgres/postgres.py +942 -57
agno/db/postgres/schemas.py +81 -18
agno/db/postgres/utils.py +164 -2
agno/db/redis/redis.py +671 -7
agno/db/redis/schemas.py +50 -0
agno/db/redis/utils.py +65 -7
agno/db/schemas/__init__.py +2 -1
agno/db/schemas/culture.py +120 -0
agno/db/schemas/evals.py +1 -0
agno/db/schemas/memory.py +17 -2
agno/db/singlestore/schemas.py +63 -0
agno/db/singlestore/singlestore.py +949 -83
agno/db/singlestore/utils.py +60 -2
agno/db/sqlite/__init__.py +2 -1
agno/db/sqlite/async_sqlite.py +2911 -0
agno/db/sqlite/schemas.py +62 -0
agno/db/sqlite/sqlite.py +965 -46
agno/db/sqlite/utils.py +169 -8
agno/db/surrealdb/__init__.py +3 -0
agno/db/surrealdb/metrics.py +292 -0
agno/db/surrealdb/models.py +334 -0
agno/db/surrealdb/queries.py +71 -0
agno/db/surrealdb/surrealdb.py +1908 -0
agno/db/surrealdb/utils.py +147 -0
agno/db/utils.py +2 -0
agno/eval/__init__.py +10 -0
agno/eval/accuracy.py +75 -55
agno/eval/agent_as_judge.py +861 -0
agno/eval/base.py +29 -0
agno/eval/performance.py +16 -7
agno/eval/reliability.py +28 -16
agno/eval/utils.py +35 -17
agno/exceptions.py +27 -2
agno/filters.py +354 -0
agno/guardrails/prompt_injection.py +1 -0
agno/hooks/__init__.py +3 -0
agno/hooks/decorator.py +164 -0
agno/integrations/discord/client.py +1 -1
agno/knowledge/chunking/agentic.py +13 -10
agno/knowledge/chunking/fixed.py +4 -1
agno/knowledge/chunking/semantic.py +9 -4
agno/knowledge/chunking/strategy.py +59 -15
agno/knowledge/embedder/fastembed.py +1 -1
agno/knowledge/embedder/nebius.py +1 -1
agno/knowledge/embedder/ollama.py +8 -0
agno/knowledge/embedder/openai.py +8 -8
agno/knowledge/embedder/sentence_transformer.py +6 -2
agno/knowledge/embedder/vllm.py +262 -0
agno/knowledge/knowledge.py +1618 -318
agno/knowledge/reader/base.py +6 -2
agno/knowledge/reader/csv_reader.py +8 -10
agno/knowledge/reader/docx_reader.py +5 -6
agno/knowledge/reader/field_labeled_csv_reader.py +16 -20
agno/knowledge/reader/json_reader.py +5 -4
agno/knowledge/reader/markdown_reader.py +8 -8
agno/knowledge/reader/pdf_reader.py +17 -19
agno/knowledge/reader/pptx_reader.py +101 -0
agno/knowledge/reader/reader_factory.py +32 -3
agno/knowledge/reader/s3_reader.py +3 -3
agno/knowledge/reader/tavily_reader.py +193 -0
agno/knowledge/reader/text_reader.py +22 -10
agno/knowledge/reader/web_search_reader.py +1 -48
agno/knowledge/reader/website_reader.py +10 -10
agno/knowledge/reader/wikipedia_reader.py +33 -1
agno/knowledge/types.py +1 -0
agno/knowledge/utils.py +72 -7
agno/media.py +22 -6
agno/memory/__init__.py +14 -1
agno/memory/manager.py +544 -83
agno/memory/strategies/__init__.py +15 -0
agno/memory/strategies/base.py +66 -0
agno/memory/strategies/summarize.py +196 -0
agno/memory/strategies/types.py +37 -0
agno/models/aimlapi/aimlapi.py +17 -0
agno/models/anthropic/claude.py +515 -40
agno/models/aws/bedrock.py +102 -21
agno/models/aws/claude.py +131 -274
agno/models/azure/ai_foundry.py +41 -19
agno/models/azure/openai_chat.py +39 -8
agno/models/base.py +1249 -525
agno/models/cerebras/cerebras.py +91 -21
agno/models/cerebras/cerebras_openai.py +21 -2
agno/models/cohere/chat.py +40 -6
agno/models/cometapi/cometapi.py +18 -1
agno/models/dashscope/dashscope.py +2 -3
agno/models/deepinfra/deepinfra.py +18 -1
agno/models/deepseek/deepseek.py +69 -3
agno/models/fireworks/fireworks.py +18 -1
agno/models/google/gemini.py +877 -80
agno/models/google/utils.py +22 -0
agno/models/groq/groq.py +51 -18
agno/models/huggingface/huggingface.py +17 -6
agno/models/ibm/watsonx.py +16 -6
agno/models/internlm/internlm.py +18 -1
agno/models/langdb/langdb.py +13 -1
agno/models/litellm/chat.py +44 -9
agno/models/litellm/litellm_openai.py +18 -1
agno/models/message.py +28 -5
agno/models/meta/llama.py +47 -14
agno/models/meta/llama_openai.py +22 -17
agno/models/mistral/mistral.py +8 -4
agno/models/nebius/nebius.py +6 -7
agno/models/nvidia/nvidia.py +20 -3
agno/models/ollama/chat.py +24 -8
agno/models/openai/chat.py +104 -29
agno/models/openai/responses.py +101 -81
agno/models/openrouter/openrouter.py +60 -3
agno/models/perplexity/perplexity.py +17 -1
agno/models/portkey/portkey.py +7 -6
agno/models/requesty/requesty.py +24 -4
agno/models/response.py +73 -2
agno/models/sambanova/sambanova.py +20 -3
agno/models/siliconflow/siliconflow.py +19 -2
agno/models/together/together.py +20 -3
agno/models/utils.py +254 -8
agno/models/vercel/v0.py +20 -3
agno/models/vertexai/__init__.py +0 -0
agno/models/vertexai/claude.py +190 -0
agno/models/vllm/vllm.py +19 -14
agno/models/xai/xai.py +19 -2
agno/os/app.py +549 -152
agno/os/auth.py +190 -3
agno/os/config.py +23 -0
agno/os/interfaces/a2a/router.py +8 -11
agno/os/interfaces/a2a/utils.py +1 -1
agno/os/interfaces/agui/router.py +18 -3
agno/os/interfaces/agui/utils.py +152 -39
agno/os/interfaces/slack/router.py +55 -37
agno/os/interfaces/slack/slack.py +9 -1
agno/os/interfaces/whatsapp/router.py +0 -1
agno/os/interfaces/whatsapp/security.py +3 -1
agno/os/mcp.py +110 -52
agno/os/middleware/__init__.py +2 -0
agno/os/middleware/jwt.py +676 -112
agno/os/router.py +40 -1478
agno/os/routers/agents/__init__.py +3 -0
agno/os/routers/agents/router.py +599 -0
agno/os/routers/agents/schema.py +261 -0
agno/os/routers/evals/evals.py +96 -39
agno/os/routers/evals/schemas.py +65 -33
agno/os/routers/evals/utils.py +80 -10
agno/os/routers/health.py +10 -4
agno/os/routers/knowledge/knowledge.py +196 -38
agno/os/routers/knowledge/schemas.py +82 -22
agno/os/routers/memory/memory.py +279 -52
agno/os/routers/memory/schemas.py +46 -17
agno/os/routers/metrics/metrics.py +20 -8
agno/os/routers/metrics/schemas.py +16 -16
agno/os/routers/session/session.py +462 -34
agno/os/routers/teams/__init__.py +3 -0
agno/os/routers/teams/router.py +512 -0
agno/os/routers/teams/schema.py +257 -0
agno/os/routers/traces/__init__.py +3 -0
agno/os/routers/traces/schemas.py +414 -0
agno/os/routers/traces/traces.py +499 -0
agno/os/routers/workflows/__init__.py +3 -0
agno/os/routers/workflows/router.py +624 -0
agno/os/routers/workflows/schema.py +75 -0
agno/os/schema.py +256 -693
agno/os/scopes.py +469 -0
agno/os/utils.py +514 -36
agno/reasoning/anthropic.py +80 -0
agno/reasoning/gemini.py +73 -0
agno/reasoning/openai.py +5 -0
agno/reasoning/vertexai.py +76 -0
agno/run/__init__.py +6 -0
agno/run/agent.py +155 -32
agno/run/base.py +55 -3
agno/run/requirement.py +181 -0
agno/run/team.py +125 -38
agno/run/workflow.py +72 -18
agno/session/agent.py +102 -89
agno/session/summary.py +56 -15
agno/session/team.py +164 -90
agno/session/workflow.py +405 -40
agno/table.py +10 -0
agno/team/team.py +3974 -1903
agno/tools/dalle.py +2 -4
agno/tools/eleven_labs.py +23 -25
agno/tools/exa.py +21 -16
agno/tools/file.py +153 -23
agno/tools/file_generation.py +16 -10
agno/tools/firecrawl.py +15 -7
agno/tools/function.py +193 -38
agno/tools/gmail.py +238 -14
agno/tools/google_drive.py +271 -0
agno/tools/googlecalendar.py +36 -8
agno/tools/googlesheets.py +20 -5
agno/tools/jira.py +20 -0
agno/tools/mcp/__init__.py +10 -0
agno/tools/mcp/mcp.py +331 -0
agno/tools/mcp/multi_mcp.py +347 -0
agno/tools/mcp/params.py +24 -0
agno/tools/mcp_toolbox.py +3 -3
agno/tools/models/nebius.py +5 -5
agno/tools/models_labs.py +20 -10
agno/tools/nano_banana.py +151 -0
agno/tools/notion.py +204 -0
agno/tools/parallel.py +314 -0
agno/tools/postgres.py +76 -36
agno/tools/redshift.py +406 -0
agno/tools/scrapegraph.py +1 -1
agno/tools/shopify.py +1519 -0
agno/tools/slack.py +18 -3
agno/tools/spotify.py +919 -0
agno/tools/tavily.py +146 -0
agno/tools/toolkit.py +25 -0
agno/tools/workflow.py +8 -1
agno/tools/yfinance.py +12 -11
agno/tracing/__init__.py +12 -0
agno/tracing/exporter.py +157 -0
agno/tracing/schemas.py +276 -0
agno/tracing/setup.py +111 -0
agno/utils/agent.py +938 -0
agno/utils/cryptography.py +22 -0
agno/utils/dttm.py +33 -0
agno/utils/events.py +151 -3
agno/utils/gemini.py +15 -5
agno/utils/hooks.py +118 -4
agno/utils/http.py +113 -2
agno/utils/knowledge.py +12 -5
agno/utils/log.py +1 -0
agno/utils/mcp.py +92 -2
agno/utils/media.py +187 -1
agno/utils/merge_dict.py +3 -3
agno/utils/message.py +60 -0
agno/utils/models/ai_foundry.py +9 -2
agno/utils/models/claude.py +49 -14
agno/utils/models/cohere.py +9 -2
agno/utils/models/llama.py +9 -2
agno/utils/models/mistral.py +4 -2
agno/utils/print_response/agent.py +109 -16
agno/utils/print_response/team.py +223 -30
agno/utils/print_response/workflow.py +251 -34
agno/utils/streamlit.py +1 -1
agno/utils/team.py +98 -9
agno/utils/tokens.py +657 -0
agno/vectordb/base.py +39 -7
agno/vectordb/cassandra/cassandra.py +21 -5
agno/vectordb/chroma/chromadb.py +43 -12
agno/vectordb/clickhouse/clickhousedb.py +21 -5
agno/vectordb/couchbase/couchbase.py +29 -5
agno/vectordb/lancedb/lance_db.py +92 -181
agno/vectordb/langchaindb/langchaindb.py +24 -4
agno/vectordb/lightrag/lightrag.py +17 -3
agno/vectordb/llamaindex/llamaindexdb.py +25 -5
agno/vectordb/milvus/milvus.py +50 -37
agno/vectordb/mongodb/__init__.py +7 -1
agno/vectordb/mongodb/mongodb.py +36 -30
agno/vectordb/pgvector/pgvector.py +201 -77
agno/vectordb/pineconedb/pineconedb.py +41 -23
agno/vectordb/qdrant/qdrant.py +67 -54
agno/vectordb/redis/__init__.py +9 -0
agno/vectordb/redis/redisdb.py +682 -0
agno/vectordb/singlestore/singlestore.py +50 -29
agno/vectordb/surrealdb/surrealdb.py +31 -41
agno/vectordb/upstashdb/upstashdb.py +34 -6
agno/vectordb/weaviate/weaviate.py +53 -14
agno/workflow/__init__.py +2 -0
agno/workflow/agent.py +299 -0
agno/workflow/condition.py +120 -18
agno/workflow/loop.py +77 -10
agno/workflow/parallel.py +231 -143
agno/workflow/router.py +118 -17
agno/workflow/step.py +609 -170
agno/workflow/steps.py +73 -6
agno/workflow/types.py +96 -21
agno/workflow/workflow.py +2039 -262
{agno-2.1.2.dist-info → agno-2.3.13.dist-info}/METADATA +201 -66
agno-2.3.13.dist-info/RECORD +613 -0
agno/tools/googlesearch.py +0 -98
agno/tools/mcp.py +0 -679
agno/tools/memori.py +0 -339
agno-2.1.2.dist-info/RECORD +0 -543
{agno-2.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +0 -0
{agno-2.1.2.dist-info → agno-2.3.13.dist-info}/licenses/LICENSE +0 -0
{agno-2.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0

agno/knowledge/reader/tavily_reader.py ADDED

@@ -0,0 +1,193 @@
+import asyncio
+from dataclasses import dataclass
+from typing import Dict, List, Literal, Optional
+from agno.knowledge.chunking.semantic import SemanticChunking
+from agno.knowledge.chunking.strategy import ChunkingStrategy, ChunkingStrategyType
+from agno.knowledge.document.base import Document
+from agno.knowledge.reader.base import Reader
+from agno.knowledge.types import ContentType
+from agno.utils.log import log_debug, logger
+try:
+    from tavily import TavilyClient  # type: ignore[attr-defined]
+except ImportError:
+    raise ImportError(
+        "The `tavily-python` package is not installed. Please install it via `pip install tavily-python`."
+    )
+@dataclass
+class TavilyReader(Reader):
+    api_key: Optional[str] = None
+    params: Optional[Dict] = None
+    extract_format: Literal["markdown", "text"] = "markdown"
+    extract_depth: Literal["basic", "advanced"] = "basic"
+    def __init__(
+        self,
+        api_key: Optional[str] = None,
+        params: Optional[Dict] = None,
+        extract_format: Literal["markdown", "text"] = "markdown",
+        extract_depth: Literal["basic", "advanced"] = "basic",
+        chunk: bool = True,
+        chunk_size: int = 5000,
+        chunking_strategy: Optional[ChunkingStrategy] = SemanticChunking(),
+        name: Optional[str] = None,
+        description: Optional[str] = None,
+    ) -> None:
+        """
+        Initialize TavilyReader for extracting content from URLs using Tavily's Extract API.
+        Args:
+            api_key: Tavily API key (or use TAVILY_API_KEY env var)
+            params: Additional parameters to pass to the extract API
+            extract_format: Output format - "markdown" or "text"
+            extract_depth: Extraction depth - "basic" (1 credit/5 URLs) or "advanced" (2 credits/5 URLs)
+            chunk: Whether to chunk the extracted content
+            chunk_size: Size of chunks when chunking is enabled
+            chunking_strategy: Strategy to use for chunking
+            name: Name of the reader
+            description: Description of the reader
+        """
+        # Initialize base Reader (handles chunk_size / strategy)
+        super().__init__(
+            chunk=chunk, chunk_size=chunk_size, chunking_strategy=chunking_strategy, name=name, description=description
+        )
+        # Tavily-specific attributes
+        self.api_key = api_key
+        self.params = params or {}
+        self.extract_format = extract_format
+        self.extract_depth = extract_depth
+    @classmethod
+    def get_supported_chunking_strategies(self) -> List[ChunkingStrategyType]:
+        """Get the list of supported chunking strategies for Tavily readers."""
+        return [
+            ChunkingStrategyType.SEMANTIC_CHUNKER,
+            ChunkingStrategyType.FIXED_SIZE_CHUNKER,
+            ChunkingStrategyType.AGENTIC_CHUNKER,
+            ChunkingStrategyType.DOCUMENT_CHUNKER,
+            ChunkingStrategyType.RECURSIVE_CHUNKER,
+        ]
+    @classmethod
+    def get_supported_content_types(self) -> List[ContentType]:
+        return [ContentType.URL]
+    def _extract(self, url: str, name: Optional[str] = None) -> List[Document]:
+        """
+        Internal method to extract content from a URL using Tavily's Extract API.
+        Args:
+            url: The URL to extract content from
+            name: Optional name for the document (defaults to URL)
+        Returns:
+            A list of documents containing the extracted content
+        """
+        log_debug(f"Extracting content from: {url}")
+        client = TavilyClient(api_key=self.api_key)
+        # Prepare extract parameters
+        extract_params = {
+            "urls": [url],
+            "depth": self.extract_depth,
+        }
+        # Add optional params if provided
+        if self.params:
+            extract_params.update(self.params)
+        try:
+            # Call Tavily Extract API
+            response = client.extract(**extract_params)
+            # Extract content from response
+            if not response or "results" not in response:
+                logger.warning(f"No results received for URL: {url}")
+                return [Document(name=name or url, id=url, content="")]
+            results = response.get("results", [])
+            if not results:
+                logger.warning(f"Empty results for URL: {url}")
+                return [Document(name=name or url, id=url, content="")]
+            # Get the first result (since we're extracting a single URL)
+            result = results[0]
+            # Check if extraction failed
+            if "failed_reason" in result:
+                logger.warning(f"Extraction failed for {url}: {result['failed_reason']}")
+                return [Document(name=name or url, id=url, content="")]
+            # Get raw content
+            content = result.get("raw_content", "")
+            if content is None:
+                content = ""
+                logger.warning(f"No content received for URL: {url}")
+            # Debug logging
+            log_debug(f"Received content type: {type(content)}")
+            log_debug(f"Content length: {len(content) if content else 0}")
+            # Create documents
+            documents = []
+            if self.chunk and content:
+                documents.extend(self.chunk_document(Document(name=name or url, id=url, content=content)))
+            else:
+                documents.append(Document(name=name or url, id=url, content=content))
+            return documents
+        except Exception as e:
+            logger.error(f"Error extracting content from {url}: {e}")
+            return [Document(name=name or url, id=url, content="")]
+    async def _async_extract(self, url: str, name: Optional[str] = None) -> List[Document]:
+        """
+        Internal async method to extract content from a URL.
+        Args:
+            url: The URL to extract content from
+            name: Optional name for the document
+        Returns:
+            A list of documents containing the extracted content
+        """
+        log_debug(f"Async extracting content from: {url}")
+        # Use asyncio.to_thread to run the synchronous extract in a thread
+        return await asyncio.to_thread(self._extract, url, name)
+    def read(self, url: str, name: Optional[str] = None) -> List[Document]:
+        """
+        Reads content from a URL using Tavily Extract API.
+        This is the public API method that users should call.
+        Args:
+            url: The URL to extract content from
+            name: Optional name for the document
+        Returns:
+            A list of documents containing the extracted content
+        """
+        return self._extract(url, name)
+    async def async_read(self, url: str, name: Optional[str] = None) -> List[Document]:
+        """
+        Asynchronously reads content from a URL using Tavily Extract API.
+        This is the public API method that users should call for async operations.
+        Args:
+            url: The URL to extract content from
+            name: Optional name for the document
+        Returns:
+            A list of documents containing the extracted content
+        """
+        return await self._async_extract(url, name)

agno/knowledge/reader/text_reader.py CHANGED

@@ -8,7 +8,7 @@ from agno.knowledge.chunking.strategy import ChunkingStrategy, ChunkingStrategyT
 from agno.knowledge.document.base import Document
 from agno.knowledge.reader.base import Reader
 from agno.knowledge.types import ContentType
-from agno.utils.log import log_info, logger
+from agno.utils.log import log_debug, log_error, log_warning
 class TextReader(Reader):
@@ -37,12 +37,18 @@ class TextReader(Reader):
             if isinstance(file, Path):
                 if not file.exists():
                     raise FileNotFoundError(f"Could not find file: {file}")
-                log_info(f"Reading: {file}")
+                log_debug(f"Reading: {file}")
                 file_name = name or file.stem
                 file_contents = file.read_text(self.encoding or "utf-8")
             else:
-                file_name = name or file.name.split(".")[0]
-                log_info(f"Reading uploaded file: {file_name}")
+                # Handle BytesIO and other file-like objects that may not have a name attribute
+                if name:
+                    file_name = name
+                elif hasattr(file, "name") and file.name is not None:
+                    file_name = file.name.split(".")[0]
+                else:
+                    file_name = "text_file"
+                log_debug(f"Reading uploaded file: {file_name}")
                 file.seek(0)
                 file_contents = file.read().decode(self.encoding or "utf-8")
@@ -60,7 +66,7 @@ class TextReader(Reader):
                 return chunked_documents
             return documents
         except Exception as e:
-            logger.error(f"Error reading: {file}: {e}")
+            log_error(f"Error reading: {file}: {e}")
             return []
     async def async_read(self, file: Union[Path, IO[Any]], name: Optional[str] = None) -> List[Document]:
@@ -69,7 +75,7 @@ class TextReader(Reader):
                 if not file.exists():
                     raise FileNotFoundError(f"Could not find file: {file}")
-                log_info(f"Reading asynchronously: {file}")
+                log_debug(f"Reading asynchronously: {file}")
                 file_name = name or file.stem
                 try:
@@ -78,11 +84,17 @@ class TextReader(Reader):
                     async with aiofiles.open(file, "r", encoding=self.encoding or "utf-8") as f:
                         file_contents = await f.read()
                 except ImportError:
-                    logger.warning("aiofiles not installed, using synchronous file I/O")
+                    log_warning("aiofiles not installed, using synchronous file I/O")
                     file_contents = file.read_text(self.encoding or "utf-8")
             else:
-                log_info(f"Reading uploaded file asynchronously: {file.name}")
-                file_name = name or file.name.split(".")[0]
+                # Handle BytesIO and other file-like objects that may not have a name attribute
+                if name:
+                    file_name = name
+                elif hasattr(file, "name") and file.name is not None:
+                    file_name = file.name.split(".")[0]
+                else:
+                    file_name = "text_file"
+                log_debug(f"Reading uploaded file asynchronously: {file_name}")
                 file.seek(0)
                 file_contents = file.read().decode(self.encoding or "utf-8")
@@ -96,7 +108,7 @@ class TextReader(Reader):
                 return await self._async_chunk_document(document)
             return [document]
         except Exception as e:
-            logger.error(f"Error reading asynchronously: {file}: {e}")
+            log_error(f"Error reading asynchronously: {file}: {e}")
             return []
     async def _async_chunk_document(self, document: Document) -> List[Document]:

agno/knowledge/reader/web_search_reader.py CHANGED

@@ -37,7 +37,7 @@ class WebSearchReader(Reader):
     user_agent: str = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
     # Search engine configuration
-    search_engine: Literal["duckduckgo", "google"] = "duckduckgo"
+    search_engine: Literal["duckduckgo"] = "duckduckgo"
     search_delay: float = 3.0  # Delay between search requests
     max_search_retries: int = 2  # Retries for search operations
@@ -121,57 +121,10 @@ class WebSearchReader(Reader):
                     return []
         return []
-    def _perform_google_search(self, query: str) -> List[Dict[str, str]]:
-        """Perform web search using Google (requires googlesearch-python)"""
-        log_debug(f"Performing Google search for: {query}")
-        try:
-            from googlesearch import search
-        except ImportError:
-            logger.error("Google search requires 'googlesearch-python'. Install with: pip install googlesearch-python")
-            return []
-        for attempt in range(self.max_search_retries):
-            try:
-                self._respect_rate_limits()
-                results = []
-                # Use the basic search function without unsupported parameters
-                # The googlesearch-python library's search function only accepts basic parameters
-                search_results = search(query)
-                # Convert iterator to list and limit results
-                result_list = list(search_results)[: self.max_results]
-                for result in result_list:
-                    # The search function returns URLs as strings
-                    results.append(
-                        {
-                            "title": "",  # Google search doesn't provide titles directly
-                            "url": result,
-                            "description": "",  # Google search doesn't provide descriptions directly
-                        }
-                    )
-                log_debug(f"Found {len(results)} Google search results")
-                return results
-            except Exception as e:
-                logger.warning(f"Google search attempt {attempt + 1} failed: {e}")
-                if attempt < self.max_search_retries - 1:
-                    time.sleep(self.search_delay)
-                else:
-                    logger.error(f"All Google search attempts failed: {e}")
-                    return []
-        return []
     def _perform_web_search(self, query: str) -> List[Dict[str, str]]:
         """Perform web search using the configured search engine"""
         if self.search_engine == "duckduckgo":
             return self._perform_duckduckgo_search(query)
-        elif self.search_engine == "google":
-            return self._perform_google_search(query)
         else:
             logger.error(f"Unsupported search engine: {self.search_engine}")
             return []

agno/knowledge/reader/website_reader.py CHANGED

@@ -12,7 +12,7 @@ from agno.knowledge.chunking.strategy import ChunkingStrategy, ChunkingStrategyT
 from agno.knowledge.document.base import Document
 from agno.knowledge.reader.base import Reader
 from agno.knowledge.types import ContentType
-from agno.utils.log import log_debug, logger
+from agno.utils.log import log_debug, log_error, log_warning
 try:
     from bs4 import BeautifulSoup, Tag  # noqa: F401
@@ -229,21 +229,21 @@ class WebsiteReader(Reader):
                 # Log HTTP status errors but continue crawling other pages
                 # Skip redirect errors (3xx) as they should be handled by follow_redirects
                 if e.response.status_code >= 300 and e.response.status_code < 400:
-                    logger.debug(f"Redirect encountered for {current_url}, skipping: {e}")
+                    log_debug(f"Redirect encountered for {current_url}, skipping: {e}")
                 else:
-                    logger.warning(f"HTTP status error while crawling {current_url}: {e}")
+                    log_warning(f"HTTP status error while crawling {current_url}: {e}")
                 # For the initial URL, we should raise the error only if it's not a redirect
                 if current_url == url and not crawler_result and not (300 <= e.response.status_code < 400):
                     raise
             except httpx.RequestError as e:
                 # Log request errors but continue crawling other pages
-                logger.warning(f"Request error while crawling {current_url}: {e}")
+                log_warning(f"Request error while crawling {current_url}: {e}")
                 # For the initial URL, we should raise the error
                 if current_url == url and not crawler_result:
                     raise
             except Exception as e:
                 # Log other exceptions but continue crawling other pages
-                logger.warning(f"Failed to crawl {current_url}: {e}")
+                log_warning(f"Failed to crawl {current_url}: {e}")
                 # For the initial URL, we should raise the error
                 if current_url == url and not crawler_result:
                     # Wrap non-HTTP exceptions in a RequestError
@@ -332,19 +332,19 @@ class WebsiteReader(Reader):
                 except httpx.HTTPStatusError as e:
                     # Log HTTP status errors but continue crawling other pages
-                    logger.warning(f"HTTP status error while crawling asynchronously {current_url}: {e}")
+                    log_warning(f"HTTP status error while crawling asynchronously {current_url}: {e}")
                     # For the initial URL, we should raise the error
                     if current_url == url and not crawler_result:
                         raise
                 except httpx.RequestError as e:
                     # Log request errors but continue crawling other pages
-                    logger.warning(f"Request error while crawling asynchronously {current_url}: {e}")
+                    log_warning(f"Request error while crawling asynchronously {current_url}: {e}")
                     # For the initial URL, we should raise the error
                     if current_url == url and not crawler_result:
                         raise
                 except Exception as e:
                     # Log other exceptions but continue crawling other pages
-                    logger.warning(f"Failed to crawl asynchronously {current_url}: {e}")
+                    log_warning(f"Failed to crawl asynchronously {current_url}: {e}")
                     # For the initial URL, we should raise the error
                     if current_url == url and not crawler_result:
                         # Wrap non-HTTP exceptions in a RequestError
@@ -398,7 +398,7 @@ class WebsiteReader(Reader):
                     )
             return documents
         except (httpx.HTTPStatusError, httpx.RequestError) as e:
-            logger.error(f"Error reading website {url}: {e}")
+            log_error(f"Error reading website {url}: {e}")
             raise
     async def async_read(self, url: str, name: Optional[str] = None) -> List[Document]:
@@ -451,5 +451,5 @@ class WebsiteReader(Reader):
             return documents
         except (httpx.HTTPStatusError, httpx.RequestError) as e:
-            logger.error(f"Error reading website asynchronously {url}: {e}")
+            log_error(f"Error reading website asynchronously {url}: {e}")
             raise

agno/knowledge/reader/wikipedia_reader.py CHANGED

@@ -1,3 +1,4 @@
+import asyncio
 from typing import List, Optional
 from agno.knowledge.chunking.fixed import FixedSizeChunking
@@ -45,7 +46,38 @@ class WikipediaReader(Reader):
         except wikipedia.exceptions.PageError:
             summary = None
-            log_info("PageError: Page not found.")
+            log_info("Wikipedia Error: Page not found.")
+        # Only create Document if we successfully got a summary
+        if summary:
+            return [
+                Document(
+                    name=topic,
+                    meta_data={"topic": topic},
+                    content=summary,
+                )
+            ]
+        return []
+    async def async_read(self, topic: str) -> List[Document]:
+        """
+        Asynchronously read content from Wikipedia.
+        Args:
+            topic: The Wikipedia topic to read
+        Returns:
+            A list of documents containing the Wikipedia summary
+        """
+        log_debug(f"Async reading Wikipedia topic: {topic}")
+        summary = None
+        try:
+            # Run the synchronous wikipedia API call in a thread pool
+            summary = await asyncio.to_thread(wikipedia.summary, topic, auto_suggest=self.auto_suggest)
+        except wikipedia.exceptions.PageError:
+            summary = None
+            log_info("Wikipedia Error: Page not found.")
         # Only create Document if we successfully got a summary
         if summary:

agno/knowledge/types.py CHANGED

@@ -20,6 +20,7 @@ class ContentType(str, Enum):
     MARKDOWN = ".md"
     DOCX = ".docx"
     DOC = ".doc"
+    PPTX = ".pptx"
     JSON = ".json"
     # Spreadsheet file extensions

agno/knowledge/utils.py CHANGED Viewed

@@ -1,5 +1,6 @@
-from typing import Dict, List
+from typing import Any, Dict, List, Optional
+from agno.knowledge.reader.base import Reader
 from agno.knowledge.reader.reader_factory import ReaderFactory
 from agno.knowledge.types import ContentType
 from agno.utils.log import log_debug
@@ -75,8 +76,33 @@ def get_reader_info(reader_key: str) -> Dict:
         raise ValueError(f"Unknown reader: {reader_key}. Error: {str(e)}")
-def get_all_readers_info() -> List[Dict]:
-    """Get information about all available readers."""
+def get_reader_info_from_instance(reader: Reader, reader_id: str) -> Dict:
+    """Get information about a reader instance."""
+    try:
+        reader_class = reader.__class__
+        supported_strategies = reader_class.get_supported_chunking_strategies()
+        supported_content_types = reader_class.get_supported_content_types()
+        return {
+            "id": reader_id,
+            "name": getattr(reader, "name", reader_class.__name__),
+            "description": getattr(reader, "description", f"Custom {reader_class.__name__}"),
+            "chunking_strategies": [strategy.value for strategy in supported_strategies],
+            "content_types": [ct.value for ct in supported_content_types],
+        }
+    except Exception as e:
+        raise ValueError(f"Failed to get info for reader '{reader_id}': {str(e)}")
+def get_all_readers_info(knowledge_instance: Optional[Any] = None) -> List[Dict]:
+    """Get information about all available readers, including custom readers from a Knowledge instance.
+    Args:
+        knowledge_instance: Optional Knowledge instance to include custom readers from.
+    Returns:
+        List of reader info dictionaries.
+    """
     readers_info = []
     keys = ReaderFactory.get_all_reader_keys()
     for key in keys:
@@ -88,18 +114,35 @@ def get_all_readers_info() -> List[Dict]:
             # Log the error but don't fail the entire request
             log_debug(f"Skipping reader '{key}': {e}")
             continue
+    # Add custom readers from knowledge instance if provided
+    if knowledge_instance is not None:
+        custom_readers = knowledge_instance.get_readers()
+        if isinstance(custom_readers, dict):
+            for reader_id, reader in custom_readers.items():
+                try:
+                    reader_info = get_reader_info_from_instance(reader, reader_id)
+                    # Only add if not already present (custom readers take precedence)
+                    if not any(r["id"] == reader_id for r in readers_info):
+                        readers_info.append(reader_info)
+                except ValueError as e:
+                    log_debug(f"Skipping custom reader '{reader_id}': {e}")
+                    continue
     return readers_info
-def get_content_types_to_readers_mapping() -> Dict[str, List[str]]:
+def get_content_types_to_readers_mapping(knowledge_instance: Optional[Any] = None) -> Dict[str, List[str]]:
     """Get mapping of content types to list of reader IDs that support them.
+    Args:
+        knowledge_instance: Optional Knowledge instance to include custom readers from.
     Returns:
         Dictionary mapping content type strings (ContentType enum values) to list of reader IDs.
     """
     content_type_mapping: Dict[str, List[str]] = {}
-    readers_info = get_all_readers_info()
+    readers_info = get_all_readers_info(knowledge_instance)
     for reader_info in readers_info:
         reader_id = reader_info["id"]
         content_types = reader_info.get("content_types", [])
@@ -107,7 +150,9 @@ def get_content_types_to_readers_mapping() -> Dict[str, List[str]]:
         for content_type in content_types:
             if content_type not in content_type_mapping:
                 content_type_mapping[content_type] = []
-            content_type_mapping[content_type].append(reader_id)
+            # Avoid duplicates
+            if reader_id not in content_type_mapping[content_type]:
+                content_type_mapping[content_type].append(reader_id)
     return content_type_mapping
@@ -129,12 +174,32 @@ def get_chunker_info(chunker_key: str) -> Dict:
             class_name = chunker_class.__name__
             docstring = chunker_class.__doc__ or f"{class_name} chunking strategy"
+            # Check class __init__ signature for chunk_size and overlap parameters
+            metadata = {}
+            import inspect
+            try:
+                sig = inspect.signature(chunker_class.__init__)
+                param_names = set(sig.parameters.keys())
+                # If class has chunk_size or max_chunk_size parameter, set default chunk_size
+                if "chunk_size" in param_names or "max_chunk_size" in param_names:
+                    metadata["chunk_size"] = 5000
+                # If class has overlap parameter, set default overlap
+                if "overlap" in param_names:
+                    metadata["chunk_overlap"] = 0
+            except Exception:
+                # If we can't inspect, skip metadata
+                pass
             return {
                 "key": chunker_key,
                 "class_name": class_name,
                 "name": chunker_key,
                 "description": docstring.strip(),
                 "strategy_type": strategy_type.value,
+                "metadata": metadata,
             }
         except ValueError:
             raise ValueError(f"Unknown chunker key: {chunker_key}")

agno/media.py CHANGED Viewed

@@ -4,6 +4,8 @@ from uuid import uuid4
 from pydantic import BaseModel, field_validator, model_validator
+from agno.utils.log import log_error
 class Image(BaseModel):
     """Unified Image class for all use cases (input, output, artifacts)"""
@@ -395,10 +397,20 @@ class File(BaseModel):
         name: Optional[str] = None,
         format: Optional[str] = None,
     ) -> "File":
-        """Create File from base64 encoded content"""
+        """Create File from base64 encoded content or plain text.
+        Handles both base64-encoded binary content and plain text content
+        (which is stored as UTF-8 strings for text/* MIME types).
+        """
         import base64
-        content_bytes = base64.b64decode(base64_content)
+        try:
+            content_bytes = base64.b64decode(base64_content)
+        except Exception:
+            # If not valid base64, it might be plain text content (text/csv, text/plain, etc.)
+            # which is stored as UTF-8 strings, not base64
+            content_bytes = base64_content.encode("utf-8")
         return cls(
             content=content_bytes,
             id=id,
@@ -413,10 +425,14 @@ class File(BaseModel):
         import httpx
         if self.url:
-            response = httpx.get(self.url)
-            content = response.content
-            mime_type = response.headers.get("Content-Type", "").split(";")[0]
-            return content, mime_type
+            try:
+                response = httpx.get(self.url)
+                content = response.content
+                mime_type = response.headers.get("Content-Type", "").split(";")[0]
+                return content, mime_type
+            except Exception:
+                log_error(f"Failed to download file from {self.url}")
+                return None
         else:
             return None

agno/memory/__init__.py CHANGED Viewed

@@ -1,3 +1,16 @@
 from agno.memory.manager import MemoryManager, UserMemory
+from agno.memory.strategies import (
+    MemoryOptimizationStrategy,
+    MemoryOptimizationStrategyFactory,
+    MemoryOptimizationStrategyType,
+    SummarizeStrategy,
+)
-__all__ = ["MemoryManager", "UserMemory"]
+__all__ = [
+    "MemoryManager",
+    "UserMemory",
+    "MemoryOptimizationStrategy",
+    "MemoryOptimizationStrategyType",
+    "MemoryOptimizationStrategyFactory",
+    "SummarizeStrategy",
+]

agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl