PyPI - agno - Versions diffs - 2.0.11__py3-none-any.whl → 2.1.1__py3-none-any.whl - Mend

agno 2.0.11__py3-none-any.whl → 2.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93)

agno/agent/agent.py +607 -176
agno/db/in_memory/in_memory_db.py +42 -29
agno/db/mongo/mongo.py +65 -66
agno/db/postgres/postgres.py +6 -4
agno/db/utils.py +50 -22
agno/exceptions.py +62 -1
agno/guardrails/__init__.py +6 -0
agno/guardrails/base.py +19 -0
agno/guardrails/openai.py +144 -0
agno/guardrails/pii.py +94 -0
agno/guardrails/prompt_injection.py +51 -0
agno/knowledge/embedder/aws_bedrock.py +9 -4
agno/knowledge/embedder/azure_openai.py +54 -0
agno/knowledge/embedder/base.py +2 -0
agno/knowledge/embedder/cohere.py +184 -5
agno/knowledge/embedder/google.py +79 -1
agno/knowledge/embedder/huggingface.py +9 -4
agno/knowledge/embedder/jina.py +63 -0
agno/knowledge/embedder/mistral.py +78 -11
agno/knowledge/embedder/ollama.py +5 -0
agno/knowledge/embedder/openai.py +18 -54
agno/knowledge/embedder/voyageai.py +69 -16
agno/knowledge/knowledge.py +11 -4
agno/knowledge/reader/pdf_reader.py +4 -3
agno/knowledge/reader/website_reader.py +3 -2
agno/models/base.py +125 -32
agno/models/cerebras/cerebras.py +1 -0
agno/models/cerebras/cerebras_openai.py +1 -0
agno/models/dashscope/dashscope.py +1 -0
agno/models/google/gemini.py +27 -5
agno/models/openai/chat.py +13 -4
agno/models/openai/responses.py +1 -1
agno/models/perplexity/perplexity.py +2 -3
agno/models/requesty/__init__.py +5 -0
agno/models/requesty/requesty.py +49 -0
agno/models/vllm/vllm.py +1 -0
agno/models/xai/xai.py +1 -0
agno/os/app.py +98 -126
agno/os/interfaces/__init__.py +1 -0
agno/os/interfaces/agui/agui.py +21 -5
agno/os/interfaces/base.py +4 -2
agno/os/interfaces/slack/slack.py +13 -8
agno/os/interfaces/whatsapp/router.py +2 -0
agno/os/interfaces/whatsapp/whatsapp.py +12 -5
agno/os/mcp.py +2 -2
agno/os/middleware/__init__.py +7 -0
agno/os/middleware/jwt.py +233 -0
agno/os/router.py +182 -46
agno/os/routers/home.py +2 -2
agno/os/routers/memory/memory.py +23 -1
agno/os/routers/memory/schemas.py +1 -1
agno/os/routers/session/session.py +20 -3
agno/os/utils.py +74 -8
agno/run/agent.py +120 -77
agno/run/base.py +2 -13
agno/run/team.py +115 -72
agno/run/workflow.py +5 -15
agno/session/summary.py +9 -10
agno/session/team.py +2 -1
agno/team/team.py +721 -169
agno/tools/firecrawl.py +4 -4
agno/tools/function.py +42 -2
agno/tools/knowledge.py +3 -3
agno/tools/searxng.py +2 -2
agno/tools/serper.py +2 -2
agno/tools/spider.py +2 -2
agno/tools/workflow.py +4 -5
agno/utils/events.py +66 -1
agno/utils/hooks.py +57 -0
agno/utils/media.py +11 -9
agno/utils/print_response/agent.py +43 -5
agno/utils/print_response/team.py +48 -12
agno/utils/serialize.py +32 -0
agno/vectordb/cassandra/cassandra.py +44 -4
agno/vectordb/chroma/chromadb.py +79 -8
agno/vectordb/clickhouse/clickhousedb.py +43 -6
agno/vectordb/couchbase/couchbase.py +76 -5
agno/vectordb/lancedb/lance_db.py +38 -3
agno/vectordb/milvus/milvus.py +76 -4
agno/vectordb/mongodb/mongodb.py +76 -4
agno/vectordb/pgvector/pgvector.py +50 -6
agno/vectordb/pineconedb/pineconedb.py +39 -2
agno/vectordb/qdrant/qdrant.py +76 -26
agno/vectordb/singlestore/singlestore.py +77 -4
agno/vectordb/upstashdb/upstashdb.py +42 -2
agno/vectordb/weaviate/weaviate.py +39 -3
agno/workflow/types.py +5 -6
agno/workflow/workflow.py +58 -2
{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/METADATA +4 -3
{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/RECORD +93 -82
{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/WHEEL +0 -0
{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/licenses/LICENSE +0 -0
{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/top_level.txt +0 -0

agno/vectordb/upstashdb/upstashdb.py CHANGED Viewed

@@ -504,8 +504,48 @@ class UpstashVectorDb(VectorDb):
         _namespace = self.namespace if namespace is None else namespace
         vectors = []
-        embed_tasks = [document.async_embed(embedder=self.embedder) for document in documents]
-        await asyncio.gather(*embed_tasks, return_exceptions=True)
+        if (
+            self.embedder
+            and self.embedder.enable_batch
+            and hasattr(self.embedder, "async_get_embeddings_batch_and_usage")
+        ):
+            # Use batch embedding when enabled and supported
+            try:
+                # Extract content from all documents
+                doc_contents = [doc.content for doc in documents]
+                # Get batch embeddings and usage
+                embeddings, usages = await self.embedder.async_get_embeddings_batch_and_usage(doc_contents)
+                # Process documents with pre-computed embeddings
+                for j, doc in enumerate(documents):
+                    try:
+                        if j < len(embeddings):
+                            doc.embedding = embeddings[j]
+                            doc.usage = usages[j] if j < len(usages) else None
+                    except Exception as e:
+                        logger.error(f"Error assigning batch embedding to document '{doc.name}': {e}")
+            except Exception as e:
+                # Check if this is a rate limit error - don't fall back as it would make things worse
+                error_str = str(e).lower()
+                is_rate_limit = any(
+                    phrase in error_str
+                    for phrase in ["rate limit", "too many requests", "429", "trial key", "api calls / minute"]
+                )
+                if is_rate_limit:
+                    logger.error(f"Rate limit detected during batch embedding. {e}")
+                    raise e
+                else:
+                    logger.warning(f"Async batch embedding failed, falling back to individual embeddings: {e}")
+                    # Fall back to individual embedding
+                    embed_tasks = [doc.async_embed(embedder=self.embedder) for doc in documents]
+                    await asyncio.gather(*embed_tasks, return_exceptions=True)
+        else:
+            # Use individual embedding
+            embed_tasks = [document.async_embed(embedder=self.embedder) for document in documents]
+            await asyncio.gather(*embed_tasks, return_exceptions=True)
         for i, document in enumerate(documents):
             if document.id is None:

agno/vectordb/weaviate/weaviate.py CHANGED Viewed

@@ -270,9 +270,45 @@ class Weaviate(VectorDb):
         if not documents:
             return
-        # Embed document
-        embed_tasks = [document.async_embed(embedder=self.embedder) for document in documents]
-        await asyncio.gather(*embed_tasks, return_exceptions=True)
+        # Apply batch embedding logic
+        if self.embedder.enable_batch and hasattr(self.embedder, "async_get_embeddings_batch_and_usage"):
+            # Use batch embedding when enabled and supported
+            try:
+                # Extract content from all documents
+                doc_contents = [doc.content for doc in documents]
+                # Get batch embeddings and usage
+                embeddings, usages = await self.embedder.async_get_embeddings_batch_and_usage(doc_contents)
+                # Process documents with pre-computed embeddings
+                for j, doc in enumerate(documents):
+                    try:
+                        if j < len(embeddings):
+                            doc.embedding = embeddings[j]
+                            doc.usage = usages[j] if j < len(usages) else None
+                    except Exception as e:
+                        logger.error(f"Error assigning batch embedding to document '{doc.name}': {e}")
+            except Exception as e:
+                # Check if this is a rate limit error - don't fall back as it would make things worse
+                error_str = str(e).lower()
+                is_rate_limit = any(
+                    phrase in error_str
+                    for phrase in ["rate limit", "too many requests", "429", "trial key", "api calls / minute"]
+                )
+                if is_rate_limit:
+                    logger.error(f"Rate limit detected during batch embedding. {e}")
+                    raise e
+                else:
+                    logger.warning(f"Async batch embedding failed, falling back to individual embeddings: {e}")
+                    # Fall back to individual embedding
+                    embed_tasks = [doc.async_embed(embedder=self.embedder) for doc in documents]
+                    await asyncio.gather(*embed_tasks, return_exceptions=True)
+        else:
+            # Use individual embedding
+            embed_tasks = [document.async_embed(embedder=self.embedder) for document in documents]
+            await asyncio.gather(*embed_tasks, return_exceptions=True)
         client = await self.get_async_client()
         try:

agno/workflow/types.py CHANGED Viewed

@@ -1,3 +1,4 @@
+import json
 from dataclasses import dataclass
 from enum import Enum
 from typing import Any, Dict, List, Optional, Union
@@ -8,6 +9,7 @@ from pydantic import BaseModel
 from agno.media import Audio, File, Image, Video
 from agno.models.metrics import Metrics
 from agno.utils.log import log_warning
+from agno.utils.serialize import json_serializer
 @dataclass
@@ -57,6 +59,7 @@ class WorkflowExecutionInput:
             "images": [img.to_dict() for img in self.images] if self.images else None,
             "videos": [vid.to_dict() for vid in self.videos] if self.videos else None,
             "audio": [aud.to_dict() for aud in self.audio] if self.audio else None,
+            "files": [file.to_dict() for file in self.files] if self.files else None,
         }
@@ -442,9 +445,7 @@ class WebSocketHandler:
             else:
                 data = {"type": "message", "content": str(event)}
-            import json
-            await self.websocket.send_text(self.format_sse_event(json.dumps(data)))
+            await self.websocket.send_text(self.format_sse_event(json.dumps(data, default=json_serializer)))
         except Exception as e:
             log_warning(f"Failed to handle WebSocket event: {e}")
@@ -465,9 +466,7 @@ class WebSocketHandler:
             return
         try:
-            import json
-            await self.websocket.send_text(self.format_sse_event(json.dumps(data)))
+            await self.websocket.send_text(self.format_sse_event(json.dumps(data, default=json_serializer)))
         except Exception as e:
             log_warning(f"Failed to send WebSocket dict: {e}")

agno/workflow/workflow.py CHANGED Viewed

@@ -25,7 +25,7 @@ from pydantic import BaseModel
 from agno.agent.agent import Agent
 from agno.db.base import BaseDb, SessionType
-from agno.exceptions import RunCancelledException
+from agno.exceptions import InputCheckError, OutputCheckError, RunCancelledException
 from agno.media import Audio, File, Image, Video
 from agno.models.message import Message
 from agno.models.metrics import Metrics
@@ -54,6 +54,7 @@ from agno.team.team import Team
 from agno.utils.common import is_typed_dict, validate_typed_dict
 from agno.utils.log import (
     log_debug,
+    log_error,
     log_warning,
     logger,
     set_log_level_to_debug,
@@ -1000,8 +1001,14 @@ class Workflow:
                 workflow_run_response.audio = output_audio
                 workflow_run_response.status = RunStatus.completed
+            except (InputCheckError, OutputCheckError) as e:
+                log_error(f"Validation failed: {str(e)} | Check: {e.check_trigger}")
+                # Store error response
+                workflow_run_response.status = RunStatus.error
+                workflow_run_response.content = f"Validation failed: {str(e)} | Check: {e.check_trigger}"
+                raise e
             except RunCancelledException as e:
-                # Handle run cancellation
                 logger.info(f"Workflow run {workflow_run_response.run_id} was cancelled")
                 workflow_run_response.status = RunStatus.cancelled
                 workflow_run_response.content = str(e)
@@ -1013,6 +1020,7 @@ class Workflow:
                 # Store error response
                 workflow_run_response.status = RunStatus.error
                 workflow_run_response.content = f"Workflow execution failed: {e}"
+                raise e
             finally:
                 self._update_session_metrics(session=session, workflow_run_response=workflow_run_response)
@@ -1199,6 +1207,24 @@ class Workflow:
                 workflow_run_response.audio = output_audio
                 workflow_run_response.status = RunStatus.completed
+            except (InputCheckError, OutputCheckError) as e:
+                log_error(f"Validation failed: {str(e)} | Check: {e.check_trigger}")
+                from agno.run.workflow import WorkflowErrorEvent
+                error_event = WorkflowErrorEvent(
+                    run_id=workflow_run_response.run_id or "",
+                    workflow_id=self.id,
+                    workflow_name=self.name,
+                    session_id=session.session_id,
+                    error=str(e),
+                )
+                yield error_event
+                # Update workflow_run_response with error
+                workflow_run_response.content = error_event.error
+                workflow_run_response.status = RunStatus.error
             except RunCancelledException as e:
                 # Handle run cancellation during streaming
                 logger.info(f"Workflow run {workflow_run_response.run_id} was cancelled during streaming")
@@ -1230,6 +1256,7 @@ class Workflow:
                 # Update workflow_run_response with error
                 workflow_run_response.content = error_event.error
                 workflow_run_response.status = RunStatus.error
+                raise e
         # Yield workflow completed event
         workflow_completed_event = WorkflowCompletedEvent(
@@ -1436,6 +1463,13 @@ class Workflow:
                 workflow_run_response.audio = output_audio
                 workflow_run_response.status = RunStatus.completed
+            except (InputCheckError, OutputCheckError) as e:
+                log_error(f"Validation failed: {str(e)} | Check: {e.check_trigger}")
+                # Store error response
+                workflow_run_response.status = RunStatus.error
+                workflow_run_response.content = f"Validation failed: {str(e)} | Check: {e.check_trigger}"
+                raise e
             except RunCancelledException as e:
                 logger.info(f"Workflow run {workflow_run_response.run_id} was cancelled")
                 workflow_run_response.status = RunStatus.cancelled
@@ -1444,6 +1478,7 @@ class Workflow:
                 logger.error(f"Workflow execution failed: {e}")
                 workflow_run_response.status = RunStatus.error
                 workflow_run_response.content = f"Workflow execution failed: {e}"
+                raise e
         self._update_session_metrics(session=session, workflow_run_response=workflow_run_response)
         session.upsert_run(run=workflow_run_response)
@@ -1471,6 +1506,7 @@ class Workflow:
         from inspect import isasyncgenfunction, iscoroutinefunction, isgeneratorfunction
         workflow_run_response.status = RunStatus.running
         workflow_started_event = WorkflowStartedEvent(
             run_id=workflow_run_response.run_id or "",
             workflow_name=workflow_run_response.workflow_name,
@@ -1633,6 +1669,24 @@ class Workflow:
                 workflow_run_response.audio = output_audio
                 workflow_run_response.status = RunStatus.completed
+            except (InputCheckError, OutputCheckError) as e:
+                log_error(f"Validation failed: {str(e)} | Check: {e.check_trigger}")
+                from agno.run.workflow import WorkflowErrorEvent
+                error_event = WorkflowErrorEvent(
+                    run_id=workflow_run_response.run_id or "",
+                    workflow_id=self.id,
+                    workflow_name=self.name,
+                    session_id=session.session_id,
+                    error=str(e),
+                )
+                yield error_event
+                # Update workflow_run_response with error
+                workflow_run_response.content = error_event.error
+                workflow_run_response.status = RunStatus.error
             except RunCancelledException as e:
                 # Handle run cancellation during streaming
                 logger.info(f"Workflow run {workflow_run_response.run_id} was cancelled during streaming")
@@ -1668,6 +1722,7 @@ class Workflow:
                 # Update workflow_run_response with error
                 workflow_run_response.content = error_event.error
                 workflow_run_response.status = RunStatus.error
+                raise e
         # Yield workflow completed event
         workflow_completed_event = WorkflowCompletedEvent(
@@ -2175,6 +2230,7 @@ class Workflow:
             audio=audio,  # type: ignore
             images=images,  # type: ignore
             videos=videos,  # type: ignore
+            files=files,
         )
         log_debug(
             f"Created async pipeline input with session state keys: {list(session_state.keys()) if session_state else 'None'}"

{agno-2.0.11.dist-info → agno-2.1.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: agno
-Version: 2.0.11
+Version: 2.1.1
 Summary: Agno: a lightweight library for building Multi-Agent Systems
 Author-email: Ashpreet Bedi <ashpreet@agno.com>
 Project-URL: homepage, https://agno.com
@@ -48,6 +48,7 @@ Requires-Dist: uvicorn; extra == "dev"
 Provides-Extra: os
 Requires-Dist: fastapi; extra == "os"
 Requires-Dist: uvicorn; extra == "os"
+Requires-Dist: PyJWT; extra == "os"
 Provides-Extra: integration-tests
 Requires-Dist: exa_py; extra == "integration-tests"
 Requires-Dist: ddgs; extra == "integration-tests"
@@ -444,7 +445,7 @@ At Agno, we're obsessed with performance. Why? because even simple AI workflows
 - Agent instantiation: ~3μs on average
 - Memory footprint: ~6.5Kib on average
-> Tested on an Apple M4 Mackbook Pro.
+> Tested on an Apple M4 MacBook Pro.
 While an Agent's run-time is bottlenecked by inference, we must do everything possible to minimize execution time, reduce memory usage, and parallelize tool calls. These numbers may seem trivial at first, but our experience shows that they add up even at a reasonably small scale.
@@ -468,7 +469,7 @@ python evals/performance/instantiation_with_tool.py
 python evals/performance/other/langgraph_instantiation.py
 ```
-> The following evaluation is run on an Apple M4 Mackbook Pro. It also runs as a Github action on this repo.
+> The following evaluation is run on an Apple M4 MacBook Pro. It also runs as a Github action on this repo.
 LangGraph is on the right, **let's start it first and give it a head start**.

agno 2.0.11__py3-none-any.whl → 2.1.1__py3-none-any.whl

agno 2.0.11__py3-none-any.whl → 2.1.1__py3-none-any.whl