agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314)
  1. agno/agent/agent.py +5540 -2273
  2. agno/api/api.py +2 -0
  3. agno/api/os.py +1 -1
  4. agno/compression/__init__.py +3 -0
  5. agno/compression/manager.py +247 -0
  6. agno/culture/__init__.py +3 -0
  7. agno/culture/manager.py +956 -0
  8. agno/db/async_postgres/__init__.py +3 -0
  9. agno/db/base.py +689 -6
  10. agno/db/dynamo/dynamo.py +933 -37
  11. agno/db/dynamo/schemas.py +174 -10
  12. agno/db/dynamo/utils.py +63 -4
  13. agno/db/firestore/firestore.py +831 -9
  14. agno/db/firestore/schemas.py +51 -0
  15. agno/db/firestore/utils.py +102 -4
  16. agno/db/gcs_json/gcs_json_db.py +660 -12
  17. agno/db/gcs_json/utils.py +60 -26
  18. agno/db/in_memory/in_memory_db.py +287 -14
  19. agno/db/in_memory/utils.py +60 -2
  20. agno/db/json/json_db.py +590 -14
  21. agno/db/json/utils.py +60 -26
  22. agno/db/migrations/manager.py +199 -0
  23. agno/db/migrations/v1_to_v2.py +43 -13
  24. agno/db/migrations/versions/__init__.py +0 -0
  25. agno/db/migrations/versions/v2_3_0.py +938 -0
  26. agno/db/mongo/__init__.py +15 -1
  27. agno/db/mongo/async_mongo.py +2760 -0
  28. agno/db/mongo/mongo.py +879 -11
  29. agno/db/mongo/schemas.py +42 -0
  30. agno/db/mongo/utils.py +80 -8
  31. agno/db/mysql/__init__.py +2 -1
  32. agno/db/mysql/async_mysql.py +2912 -0
  33. agno/db/mysql/mysql.py +946 -68
  34. agno/db/mysql/schemas.py +72 -10
  35. agno/db/mysql/utils.py +198 -7
  36. agno/db/postgres/__init__.py +2 -1
  37. agno/db/postgres/async_postgres.py +2579 -0
  38. agno/db/postgres/postgres.py +942 -57
  39. agno/db/postgres/schemas.py +81 -18
  40. agno/db/postgres/utils.py +164 -2
  41. agno/db/redis/redis.py +671 -7
  42. agno/db/redis/schemas.py +50 -0
  43. agno/db/redis/utils.py +65 -7
  44. agno/db/schemas/__init__.py +2 -1
  45. agno/db/schemas/culture.py +120 -0
  46. agno/db/schemas/evals.py +1 -0
  47. agno/db/schemas/memory.py +17 -2
  48. agno/db/singlestore/schemas.py +63 -0
  49. agno/db/singlestore/singlestore.py +949 -83
  50. agno/db/singlestore/utils.py +60 -2
  51. agno/db/sqlite/__init__.py +2 -1
  52. agno/db/sqlite/async_sqlite.py +2911 -0
  53. agno/db/sqlite/schemas.py +62 -0
  54. agno/db/sqlite/sqlite.py +965 -46
  55. agno/db/sqlite/utils.py +169 -8
  56. agno/db/surrealdb/__init__.py +3 -0
  57. agno/db/surrealdb/metrics.py +292 -0
  58. agno/db/surrealdb/models.py +334 -0
  59. agno/db/surrealdb/queries.py +71 -0
  60. agno/db/surrealdb/surrealdb.py +1908 -0
  61. agno/db/surrealdb/utils.py +147 -0
  62. agno/db/utils.py +2 -0
  63. agno/eval/__init__.py +10 -0
  64. agno/eval/accuracy.py +75 -55
  65. agno/eval/agent_as_judge.py +861 -0
  66. agno/eval/base.py +29 -0
  67. agno/eval/performance.py +16 -7
  68. agno/eval/reliability.py +28 -16
  69. agno/eval/utils.py +35 -17
  70. agno/exceptions.py +27 -2
  71. agno/filters.py +354 -0
  72. agno/guardrails/prompt_injection.py +1 -0
  73. agno/hooks/__init__.py +3 -0
  74. agno/hooks/decorator.py +164 -0
  75. agno/integrations/discord/client.py +1 -1
  76. agno/knowledge/chunking/agentic.py +13 -10
  77. agno/knowledge/chunking/fixed.py +4 -1
  78. agno/knowledge/chunking/semantic.py +9 -4
  79. agno/knowledge/chunking/strategy.py +59 -15
  80. agno/knowledge/embedder/fastembed.py +1 -1
  81. agno/knowledge/embedder/nebius.py +1 -1
  82. agno/knowledge/embedder/ollama.py +8 -0
  83. agno/knowledge/embedder/openai.py +8 -8
  84. agno/knowledge/embedder/sentence_transformer.py +6 -2
  85. agno/knowledge/embedder/vllm.py +262 -0
  86. agno/knowledge/knowledge.py +1618 -318
  87. agno/knowledge/reader/base.py +6 -2
  88. agno/knowledge/reader/csv_reader.py +8 -10
  89. agno/knowledge/reader/docx_reader.py +5 -6
  90. agno/knowledge/reader/field_labeled_csv_reader.py +16 -20
  91. agno/knowledge/reader/json_reader.py +5 -4
  92. agno/knowledge/reader/markdown_reader.py +8 -8
  93. agno/knowledge/reader/pdf_reader.py +17 -19
  94. agno/knowledge/reader/pptx_reader.py +101 -0
  95. agno/knowledge/reader/reader_factory.py +32 -3
  96. agno/knowledge/reader/s3_reader.py +3 -3
  97. agno/knowledge/reader/tavily_reader.py +193 -0
  98. agno/knowledge/reader/text_reader.py +22 -10
  99. agno/knowledge/reader/web_search_reader.py +1 -48
  100. agno/knowledge/reader/website_reader.py +10 -10
  101. agno/knowledge/reader/wikipedia_reader.py +33 -1
  102. agno/knowledge/types.py +1 -0
  103. agno/knowledge/utils.py +72 -7
  104. agno/media.py +22 -6
  105. agno/memory/__init__.py +14 -1
  106. agno/memory/manager.py +544 -83
  107. agno/memory/strategies/__init__.py +15 -0
  108. agno/memory/strategies/base.py +66 -0
  109. agno/memory/strategies/summarize.py +196 -0
  110. agno/memory/strategies/types.py +37 -0
  111. agno/models/aimlapi/aimlapi.py +17 -0
  112. agno/models/anthropic/claude.py +515 -40
  113. agno/models/aws/bedrock.py +102 -21
  114. agno/models/aws/claude.py +131 -274
  115. agno/models/azure/ai_foundry.py +41 -19
  116. agno/models/azure/openai_chat.py +39 -8
  117. agno/models/base.py +1249 -525
  118. agno/models/cerebras/cerebras.py +91 -21
  119. agno/models/cerebras/cerebras_openai.py +21 -2
  120. agno/models/cohere/chat.py +40 -6
  121. agno/models/cometapi/cometapi.py +18 -1
  122. agno/models/dashscope/dashscope.py +2 -3
  123. agno/models/deepinfra/deepinfra.py +18 -1
  124. agno/models/deepseek/deepseek.py +69 -3
  125. agno/models/fireworks/fireworks.py +18 -1
  126. agno/models/google/gemini.py +877 -80
  127. agno/models/google/utils.py +22 -0
  128. agno/models/groq/groq.py +51 -18
  129. agno/models/huggingface/huggingface.py +17 -6
  130. agno/models/ibm/watsonx.py +16 -6
  131. agno/models/internlm/internlm.py +18 -1
  132. agno/models/langdb/langdb.py +13 -1
  133. agno/models/litellm/chat.py +44 -9
  134. agno/models/litellm/litellm_openai.py +18 -1
  135. agno/models/message.py +28 -5
  136. agno/models/meta/llama.py +47 -14
  137. agno/models/meta/llama_openai.py +22 -17
  138. agno/models/mistral/mistral.py +8 -4
  139. agno/models/nebius/nebius.py +6 -7
  140. agno/models/nvidia/nvidia.py +20 -3
  141. agno/models/ollama/chat.py +24 -8
  142. agno/models/openai/chat.py +104 -29
  143. agno/models/openai/responses.py +101 -81
  144. agno/models/openrouter/openrouter.py +60 -3
  145. agno/models/perplexity/perplexity.py +17 -1
  146. agno/models/portkey/portkey.py +7 -6
  147. agno/models/requesty/requesty.py +24 -4
  148. agno/models/response.py +73 -2
  149. agno/models/sambanova/sambanova.py +20 -3
  150. agno/models/siliconflow/siliconflow.py +19 -2
  151. agno/models/together/together.py +20 -3
  152. agno/models/utils.py +254 -8
  153. agno/models/vercel/v0.py +20 -3
  154. agno/models/vertexai/__init__.py +0 -0
  155. agno/models/vertexai/claude.py +190 -0
  156. agno/models/vllm/vllm.py +19 -14
  157. agno/models/xai/xai.py +19 -2
  158. agno/os/app.py +549 -152
  159. agno/os/auth.py +190 -3
  160. agno/os/config.py +23 -0
  161. agno/os/interfaces/a2a/router.py +8 -11
  162. agno/os/interfaces/a2a/utils.py +1 -1
  163. agno/os/interfaces/agui/router.py +18 -3
  164. agno/os/interfaces/agui/utils.py +152 -39
  165. agno/os/interfaces/slack/router.py +55 -37
  166. agno/os/interfaces/slack/slack.py +9 -1
  167. agno/os/interfaces/whatsapp/router.py +0 -1
  168. agno/os/interfaces/whatsapp/security.py +3 -1
  169. agno/os/mcp.py +110 -52
  170. agno/os/middleware/__init__.py +2 -0
  171. agno/os/middleware/jwt.py +676 -112
  172. agno/os/router.py +40 -1478
  173. agno/os/routers/agents/__init__.py +3 -0
  174. agno/os/routers/agents/router.py +599 -0
  175. agno/os/routers/agents/schema.py +261 -0
  176. agno/os/routers/evals/evals.py +96 -39
  177. agno/os/routers/evals/schemas.py +65 -33
  178. agno/os/routers/evals/utils.py +80 -10
  179. agno/os/routers/health.py +10 -4
  180. agno/os/routers/knowledge/knowledge.py +196 -38
  181. agno/os/routers/knowledge/schemas.py +82 -22
  182. agno/os/routers/memory/memory.py +279 -52
  183. agno/os/routers/memory/schemas.py +46 -17
  184. agno/os/routers/metrics/metrics.py +20 -8
  185. agno/os/routers/metrics/schemas.py +16 -16
  186. agno/os/routers/session/session.py +462 -34
  187. agno/os/routers/teams/__init__.py +3 -0
  188. agno/os/routers/teams/router.py +512 -0
  189. agno/os/routers/teams/schema.py +257 -0
  190. agno/os/routers/traces/__init__.py +3 -0
  191. agno/os/routers/traces/schemas.py +414 -0
  192. agno/os/routers/traces/traces.py +499 -0
  193. agno/os/routers/workflows/__init__.py +3 -0
  194. agno/os/routers/workflows/router.py +624 -0
  195. agno/os/routers/workflows/schema.py +75 -0
  196. agno/os/schema.py +256 -693
  197. agno/os/scopes.py +469 -0
  198. agno/os/utils.py +514 -36
  199. agno/reasoning/anthropic.py +80 -0
  200. agno/reasoning/gemini.py +73 -0
  201. agno/reasoning/openai.py +5 -0
  202. agno/reasoning/vertexai.py +76 -0
  203. agno/run/__init__.py +6 -0
  204. agno/run/agent.py +155 -32
  205. agno/run/base.py +55 -3
  206. agno/run/requirement.py +181 -0
  207. agno/run/team.py +125 -38
  208. agno/run/workflow.py +72 -18
  209. agno/session/agent.py +102 -89
  210. agno/session/summary.py +56 -15
  211. agno/session/team.py +164 -90
  212. agno/session/workflow.py +405 -40
  213. agno/table.py +10 -0
  214. agno/team/team.py +3974 -1903
  215. agno/tools/dalle.py +2 -4
  216. agno/tools/eleven_labs.py +23 -25
  217. agno/tools/exa.py +21 -16
  218. agno/tools/file.py +153 -23
  219. agno/tools/file_generation.py +16 -10
  220. agno/tools/firecrawl.py +15 -7
  221. agno/tools/function.py +193 -38
  222. agno/tools/gmail.py +238 -14
  223. agno/tools/google_drive.py +271 -0
  224. agno/tools/googlecalendar.py +36 -8
  225. agno/tools/googlesheets.py +20 -5
  226. agno/tools/jira.py +20 -0
  227. agno/tools/mcp/__init__.py +10 -0
  228. agno/tools/mcp/mcp.py +331 -0
  229. agno/tools/mcp/multi_mcp.py +347 -0
  230. agno/tools/mcp/params.py +24 -0
  231. agno/tools/mcp_toolbox.py +3 -3
  232. agno/tools/models/nebius.py +5 -5
  233. agno/tools/models_labs.py +20 -10
  234. agno/tools/nano_banana.py +151 -0
  235. agno/tools/notion.py +204 -0
  236. agno/tools/parallel.py +314 -0
  237. agno/tools/postgres.py +76 -36
  238. agno/tools/redshift.py +406 -0
  239. agno/tools/scrapegraph.py +1 -1
  240. agno/tools/shopify.py +1519 -0
  241. agno/tools/slack.py +18 -3
  242. agno/tools/spotify.py +919 -0
  243. agno/tools/tavily.py +146 -0
  244. agno/tools/toolkit.py +25 -0
  245. agno/tools/workflow.py +8 -1
  246. agno/tools/yfinance.py +12 -11
  247. agno/tracing/__init__.py +12 -0
  248. agno/tracing/exporter.py +157 -0
  249. agno/tracing/schemas.py +276 -0
  250. agno/tracing/setup.py +111 -0
  251. agno/utils/agent.py +938 -0
  252. agno/utils/cryptography.py +22 -0
  253. agno/utils/dttm.py +33 -0
  254. agno/utils/events.py +151 -3
  255. agno/utils/gemini.py +15 -5
  256. agno/utils/hooks.py +118 -4
  257. agno/utils/http.py +113 -2
  258. agno/utils/knowledge.py +12 -5
  259. agno/utils/log.py +1 -0
  260. agno/utils/mcp.py +92 -2
  261. agno/utils/media.py +187 -1
  262. agno/utils/merge_dict.py +3 -3
  263. agno/utils/message.py +60 -0
  264. agno/utils/models/ai_foundry.py +9 -2
  265. agno/utils/models/claude.py +49 -14
  266. agno/utils/models/cohere.py +9 -2
  267. agno/utils/models/llama.py +9 -2
  268. agno/utils/models/mistral.py +4 -2
  269. agno/utils/print_response/agent.py +109 -16
  270. agno/utils/print_response/team.py +223 -30
  271. agno/utils/print_response/workflow.py +251 -34
  272. agno/utils/streamlit.py +1 -1
  273. agno/utils/team.py +98 -9
  274. agno/utils/tokens.py +657 -0
  275. agno/vectordb/base.py +39 -7
  276. agno/vectordb/cassandra/cassandra.py +21 -5
  277. agno/vectordb/chroma/chromadb.py +43 -12
  278. agno/vectordb/clickhouse/clickhousedb.py +21 -5
  279. agno/vectordb/couchbase/couchbase.py +29 -5
  280. agno/vectordb/lancedb/lance_db.py +92 -181
  281. agno/vectordb/langchaindb/langchaindb.py +24 -4
  282. agno/vectordb/lightrag/lightrag.py +17 -3
  283. agno/vectordb/llamaindex/llamaindexdb.py +25 -5
  284. agno/vectordb/milvus/milvus.py +50 -37
  285. agno/vectordb/mongodb/__init__.py +7 -1
  286. agno/vectordb/mongodb/mongodb.py +36 -30
  287. agno/vectordb/pgvector/pgvector.py +201 -77
  288. agno/vectordb/pineconedb/pineconedb.py +41 -23
  289. agno/vectordb/qdrant/qdrant.py +67 -54
  290. agno/vectordb/redis/__init__.py +9 -0
  291. agno/vectordb/redis/redisdb.py +682 -0
  292. agno/vectordb/singlestore/singlestore.py +50 -29
  293. agno/vectordb/surrealdb/surrealdb.py +31 -41
  294. agno/vectordb/upstashdb/upstashdb.py +34 -6
  295. agno/vectordb/weaviate/weaviate.py +53 -14
  296. agno/workflow/__init__.py +2 -0
  297. agno/workflow/agent.py +299 -0
  298. agno/workflow/condition.py +120 -18
  299. agno/workflow/loop.py +77 -10
  300. agno/workflow/parallel.py +231 -143
  301. agno/workflow/router.py +118 -17
  302. agno/workflow/step.py +609 -170
  303. agno/workflow/steps.py +73 -6
  304. agno/workflow/types.py +96 -21
  305. agno/workflow/workflow.py +2039 -262
  306. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/METADATA +201 -66
  307. agno-2.3.13.dist-info/RECORD +613 -0
  308. agno/tools/googlesearch.py +0 -98
  309. agno/tools/mcp.py +0 -679
  310. agno/tools/memori.py +0 -339
  311. agno-2.1.2.dist-info/RECORD +0 -543
  312. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +0 -0
  313. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/licenses/LICENSE +0 -0
  314. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
@@ -6,16 +6,18 @@ import httpx
6
6
  from pydantic import BaseModel
7
7
  from typing_extensions import Literal
8
8
 
9
- from agno.exceptions import ModelProviderError
9
+ from agno.exceptions import ModelAuthenticationError, ModelProviderError
10
10
  from agno.media import File
11
- from agno.models.base import MessageData, Model
11
+ from agno.models.base import Model
12
12
  from agno.models.message import Citations, Message, UrlCitation
13
13
  from agno.models.metrics import Metrics
14
14
  from agno.models.response import ModelResponse
15
15
  from agno.run.agent import RunOutput
16
+ from agno.utils.http import get_default_async_client, get_default_sync_client
16
17
  from agno.utils.log import log_debug, log_error, log_warning
17
18
  from agno.utils.models.openai_responses import images_to_message
18
19
  from agno.utils.models.schema_utils import get_response_schema_for_provider
20
+ from agno.utils.tokens import count_schema_tokens
19
21
 
20
22
  try:
21
23
  from openai import APIConnectionError, APIStatusError, AsyncOpenAI, OpenAI, RateLimitError
@@ -53,6 +55,7 @@ class OpenAIResponses(Model):
53
55
  truncation: Optional[Literal["auto", "disabled"]] = None
54
56
  user: Optional[str] = None
55
57
  service_tier: Optional[Literal["auto", "default", "flex", "priority"]] = None
58
+ strict_output: bool = True # When True, guarantees schema adherence for structured outputs. When False, attempts to follow schema as a guide but may occasionally deviate
56
59
  extra_headers: Optional[Any] = None
57
60
  extra_query: Optional[Any] = None
58
61
  extra_body: Optional[Any] = None
@@ -66,7 +69,7 @@ class OpenAIResponses(Model):
66
69
  max_retries: Optional[int] = None
67
70
  default_headers: Optional[Dict[str, str]] = None
68
71
  default_query: Optional[Dict[str, str]] = None
69
- http_client: Optional[httpx.Client] = None
72
+ http_client: Optional[Union[httpx.Client, httpx.AsyncClient]] = None
70
73
  client_params: Optional[Dict[str, Any]] = None
71
74
 
72
75
  # Parameters affecting built-in tools
@@ -115,7 +118,10 @@ class OpenAIResponses(Model):
115
118
  if not self.api_key:
116
119
  self.api_key = getenv("OPENAI_API_KEY")
117
120
  if not self.api_key:
118
- log_error("OPENAI_API_KEY not set. Please set the OPENAI_API_KEY environment variable.")
121
+ raise ModelAuthenticationError(
122
+ message="OPENAI_API_KEY not set. Please set the OPENAI_API_KEY environment variable.",
123
+ model_name=self.name,
124
+ )
119
125
 
120
126
  # Define base client params
121
127
  base_params = {
@@ -139,7 +145,7 @@ class OpenAIResponses(Model):
139
145
 
140
146
  def get_client(self) -> OpenAI:
141
147
  """
142
- Returns an OpenAI client.
148
+ Returns an OpenAI client. Caches the client to avoid recreating it on every request.
143
149
 
144
150
  Returns:
145
151
  OpenAI: An instance of the OpenAI client.
@@ -150,28 +156,29 @@ class OpenAIResponses(Model):
150
156
  client_params: Dict[str, Any] = self._get_client_params()
151
157
  if self.http_client is not None:
152
158
  client_params["http_client"] = self.http_client
159
+ else:
160
+ # Use global sync client when no custom http_client is provided
161
+ client_params["http_client"] = get_default_sync_client()
153
162
 
154
163
  self.client = OpenAI(**client_params)
155
164
  return self.client
156
165
 
157
166
  def get_async_client(self) -> AsyncOpenAI:
158
167
  """
159
- Returns an asynchronous OpenAI client.
168
+ Returns an asynchronous OpenAI client. Caches the client to avoid recreating it on every request.
160
169
 
161
170
  Returns:
162
171
  AsyncOpenAI: An instance of the asynchronous OpenAI client.
163
172
  """
164
- if self.async_client:
173
+ if self.async_client and not self.async_client.is_closed():
165
174
  return self.async_client
166
175
 
167
176
  client_params: Dict[str, Any] = self._get_client_params()
168
- if self.http_client:
177
+ if self.http_client and isinstance(self.http_client, httpx.AsyncClient):
169
178
  client_params["http_client"] = self.http_client
170
179
  else:
171
- # Create a new async HTTP client with custom limits
172
- client_params["http_client"] = httpx.AsyncClient(
173
- limits=httpx.Limits(max_connections=1000, max_keepalive_connections=100)
174
- )
180
+ # Use global async client when no custom http_client is provided
181
+ client_params["http_client"] = get_default_async_client()
175
182
 
176
183
  self.async_client = AsyncOpenAI(**client_params)
177
184
  return self.async_client
@@ -224,7 +231,7 @@ class OpenAIResponses(Model):
224
231
  "type": "json_schema",
225
232
  "name": response_format.__name__,
226
233
  "schema": schema,
227
- "strict": True,
234
+ "strict": self.strict_output,
228
235
  }
229
236
  else:
230
237
  # JSON mode
@@ -301,6 +308,8 @@ class OpenAIResponses(Model):
301
308
 
302
309
  def _upload_file(self, file: File) -> Optional[str]:
303
310
  """Upload a file to the OpenAI vector database."""
311
+ from pathlib import Path
312
+ from urllib.parse import urlparse
304
313
 
305
314
  if file.url is not None:
306
315
  file_content_tuple = file.file_url_content
@@ -308,13 +317,12 @@ class OpenAIResponses(Model):
308
317
  file_content = file_content_tuple[0]
309
318
  else:
310
319
  return None
311
- file_name = file.url.split("/")[-1]
320
+ file_name = Path(urlparse(file.url).path).name or "file"
312
321
  file_tuple = (file_name, file_content)
313
322
  result = self.get_client().files.create(file=file_tuple, purpose="assistants")
314
323
  return result.id
315
324
  elif file.filepath is not None:
316
325
  import mimetypes
317
- from pathlib import Path
318
326
 
319
327
  file_path = file.filepath if isinstance(file.filepath, Path) else Path(file.filepath)
320
328
  if file_path.exists() and file_path.is_file():
@@ -392,12 +400,15 @@ class OpenAIResponses(Model):
392
400
 
393
401
  return formatted_tools
394
402
 
395
- def _format_messages(self, messages: List[Message]) -> List[Union[Dict[str, Any], ResponseReasoningItem]]:
403
+ def _format_messages(
404
+ self, messages: List[Message], compress_tool_results: bool = False
405
+ ) -> List[Union[Dict[str, Any], ResponseReasoningItem]]:
396
406
  """
397
407
  Format a message into the format expected by OpenAI.
398
408
 
399
409
  Args:
400
410
  messages (List[Message]): The message to format.
411
+ compress_tool_results: Whether to compress tool results.
401
412
 
402
413
  Returns:
403
414
  Dict[str, Any]: The formatted message.
@@ -442,7 +453,7 @@ class OpenAIResponses(Model):
442
453
  if message.role in ["user", "system"]:
443
454
  message_dict: Dict[str, Any] = {
444
455
  "role": self.role_map[message.role],
445
- "content": message.content,
456
+ "content": message.get_content(use_compressed_content=compress_tool_results),
446
457
  }
447
458
  message_dict = {k: v for k, v in message_dict.items() if v is not None}
448
459
 
@@ -466,7 +477,9 @@ class OpenAIResponses(Model):
466
477
 
467
478
  # Tool call result
468
479
  elif message.role == "tool":
469
- if message.tool_call_id and message.content is not None:
480
+ tool_result = message.get_content(use_compressed_content=compress_tool_results)
481
+
482
+ if message.tool_call_id and tool_result is not None:
470
483
  function_call_id = message.tool_call_id
471
484
  # Normalize: if a fc_* id was provided, translate to its corresponding call_* id
472
485
  if isinstance(function_call_id, str) and function_call_id in fc_id_to_call_id:
@@ -474,7 +487,7 @@ class OpenAIResponses(Model):
474
487
  else:
475
488
  call_id_value = function_call_id
476
489
  formatted_messages.append(
477
- {"type": "function_call_output", "call_id": call_id_value, "output": message.content}
490
+ {"type": "function_call_output", "call_id": call_id_value, "output": tool_result}
478
491
  )
479
492
  # Tool Calls
480
493
  elif message.tool_calls is not None and len(message.tool_calls) > 0:
@@ -508,6 +521,49 @@ class OpenAIResponses(Model):
508
521
  formatted_messages.append(reasoning_output)
509
522
  return formatted_messages
510
523
 
524
+ def count_tokens(
525
+ self,
526
+ messages: List[Message],
527
+ tools: Optional[List[Dict[str, Any]]] = None,
528
+ output_schema: Optional[Union[Dict, Type[BaseModel]]] = None,
529
+ ) -> int:
530
+ try:
531
+ formatted_input = self._format_messages(messages, compress_tool_results=True)
532
+ formatted_tools = self._format_tool_params(messages, tools) if tools else None
533
+
534
+ response = self.get_client().responses.input_tokens.count(
535
+ model=self.id,
536
+ input=formatted_input, # type: ignore
537
+ instructions=self.instructions, # type: ignore
538
+ tools=formatted_tools, # type: ignore
539
+ )
540
+ return response.input_tokens + count_schema_tokens(output_schema, self.id)
541
+ except Exception as e:
542
+ log_warning(f"Failed to count tokens via API: {e}")
543
+ return super().count_tokens(messages, tools, output_schema)
544
+
545
+ async def acount_tokens(
546
+ self,
547
+ messages: List[Message],
548
+ tools: Optional[List[Dict[str, Any]]] = None,
549
+ output_schema: Optional[Union[Dict, Type[BaseModel]]] = None,
550
+ ) -> int:
551
+ """Async version of count_tokens using the async client."""
552
+ try:
553
+ formatted_input = self._format_messages(messages, compress_tool_results=True)
554
+ formatted_tools = self._format_tool_params(messages, tools) if tools else None
555
+
556
+ response = await self.get_async_client().responses.input_tokens.count(
557
+ model=self.id,
558
+ input=formatted_input, # type: ignore
559
+ instructions=self.instructions, # type: ignore
560
+ tools=formatted_tools, # type: ignore
561
+ )
562
+ return response.input_tokens + count_schema_tokens(output_schema, self.id)
563
+ except Exception as e:
564
+ log_warning(f"Failed to count tokens via API: {e}")
565
+ return await super().acount_tokens(messages, tools, output_schema)
566
+
511
567
  def invoke(
512
568
  self,
513
569
  messages: List[Message],
@@ -516,6 +572,7 @@ class OpenAIResponses(Model):
516
572
  tools: Optional[List[Dict[str, Any]]] = None,
517
573
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
518
574
  run_response: Optional[RunOutput] = None,
575
+ compress_tool_results: bool = False,
519
576
  ) -> ModelResponse:
520
577
  """
521
578
  Send a request to the OpenAI Responses API.
@@ -532,7 +589,7 @@ class OpenAIResponses(Model):
532
589
 
533
590
  provider_response = self.get_client().responses.create(
534
591
  model=self.id,
535
- input=self._format_messages(messages), # type: ignore
592
+ input=self._format_messages(messages, compress_tool_results), # type: ignore
536
593
  **request_params,
537
594
  )
538
595
 
@@ -573,6 +630,9 @@ class OpenAIResponses(Model):
573
630
  model_name=self.name,
574
631
  model_id=self.id,
575
632
  ) from exc
633
+ except ModelAuthenticationError as exc:
634
+ log_error(f"Model authentication error from OpenAI API: {exc}")
635
+ raise exc
576
636
  except Exception as exc:
577
637
  log_error(f"Error from OpenAI API: {exc}")
578
638
  raise ModelProviderError(message=str(exc), model_name=self.name, model_id=self.id) from exc
@@ -585,6 +645,7 @@ class OpenAIResponses(Model):
585
645
  tools: Optional[List[Dict[str, Any]]] = None,
586
646
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
587
647
  run_response: Optional[RunOutput] = None,
648
+ compress_tool_results: bool = False,
588
649
  ) -> ModelResponse:
589
650
  """
590
651
  Sends an asynchronous request to the OpenAI Responses API.
@@ -601,7 +662,7 @@ class OpenAIResponses(Model):
601
662
 
602
663
  provider_response = await self.get_async_client().responses.create(
603
664
  model=self.id,
604
- input=self._format_messages(messages), # type: ignore
665
+ input=self._format_messages(messages, compress_tool_results), # type: ignore
605
666
  **request_params,
606
667
  )
607
668
 
@@ -642,6 +703,9 @@ class OpenAIResponses(Model):
642
703
  model_name=self.name,
643
704
  model_id=self.id,
644
705
  ) from exc
706
+ except ModelAuthenticationError as exc:
707
+ log_error(f"Model authentication error from OpenAI API: {exc}")
708
+ raise exc
645
709
  except Exception as exc:
646
710
  log_error(f"Error from OpenAI API: {exc}")
647
711
  raise ModelProviderError(message=str(exc), model_name=self.name, model_id=self.id) from exc
@@ -654,6 +718,7 @@ class OpenAIResponses(Model):
654
718
  tools: Optional[List[Dict[str, Any]]] = None,
655
719
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
656
720
  run_response: Optional[RunOutput] = None,
721
+ compress_tool_results: bool = False,
657
722
  ) -> Iterator[ModelResponse]:
658
723
  """
659
724
  Send a streaming request to the OpenAI Responses API.
@@ -671,7 +736,7 @@ class OpenAIResponses(Model):
671
736
 
672
737
  for chunk in self.get_client().responses.create(
673
738
  model=self.id,
674
- input=self._format_messages(messages), # type: ignore
739
+ input=self._format_messages(messages, compress_tool_results), # type: ignore
675
740
  stream=True,
676
741
  **request_params,
677
742
  ):
@@ -715,6 +780,9 @@ class OpenAIResponses(Model):
715
780
  model_name=self.name,
716
781
  model_id=self.id,
717
782
  ) from exc
783
+ except ModelAuthenticationError as exc:
784
+ log_error(f"Model authentication error from OpenAI API: {exc}")
785
+ raise exc
718
786
  except Exception as exc:
719
787
  log_error(f"Error from OpenAI API: {exc}")
720
788
  raise ModelProviderError(message=str(exc), model_name=self.name, model_id=self.id) from exc
@@ -727,6 +795,7 @@ class OpenAIResponses(Model):
727
795
  tools: Optional[List[Dict[str, Any]]] = None,
728
796
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
729
797
  run_response: Optional[RunOutput] = None,
798
+ compress_tool_results: bool = False,
730
799
  ) -> AsyncIterator[ModelResponse]:
731
800
  """
732
801
  Sends an asynchronous streaming request to the OpenAI Responses API.
@@ -744,7 +813,7 @@ class OpenAIResponses(Model):
744
813
 
745
814
  async_stream = await self.get_async_client().responses.create(
746
815
  model=self.id,
747
- input=self._format_messages(messages), # type: ignore
816
+ input=self._format_messages(messages, compress_tool_results), # type: ignore
748
817
  stream=True,
749
818
  **request_params,
750
819
  )
@@ -785,12 +854,19 @@ class OpenAIResponses(Model):
785
854
  model_name=self.name,
786
855
  model_id=self.id,
787
856
  ) from exc
857
+ except ModelAuthenticationError as exc:
858
+ log_error(f"Model authentication error from OpenAI API: {exc}")
859
+ raise exc
788
860
  except Exception as exc:
789
861
  log_error(f"Error from OpenAI API: {exc}")
790
862
  raise ModelProviderError(message=str(exc), model_name=self.name, model_id=self.id) from exc
791
863
 
792
864
  def format_function_call_results(
793
- self, messages: List[Message], function_call_results: List[Message], tool_call_ids: List[str]
865
+ self,
866
+ messages: List[Message],
867
+ function_call_results: List[Message],
868
+ tool_call_ids: List[str],
869
+ compress_tool_results: bool = False,
794
870
  ) -> None:
795
871
  """
796
872
  Handle the results of function calls.
@@ -799,69 +875,13 @@ class OpenAIResponses(Model):
799
875
  messages (List[Message]): The list of conversation messages.
800
876
  function_call_results (List[Message]): The results of the function calls.
801
877
  tool_ids (List[str]): The tool ids.
878
+ compress_tool_results (bool): Whether to compress tool results.
802
879
  """
803
880
  if len(function_call_results) > 0:
804
881
  for _fc_message_index, _fc_message in enumerate(function_call_results):
805
882
  _fc_message.tool_call_id = tool_call_ids[_fc_message_index]
806
883
  messages.append(_fc_message)
807
884
 
808
- def process_response_stream(
809
- self,
810
- messages: List[Message],
811
- assistant_message: Message,
812
- stream_data: MessageData,
813
- response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
814
- tools: Optional[List[Dict[str, Any]]] = None,
815
- tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
816
- run_response: Optional[RunOutput] = None,
817
- ) -> Iterator[ModelResponse]:
818
- """Process the synchronous response stream."""
819
- for model_response_delta in self.invoke_stream(
820
- messages=messages,
821
- assistant_message=assistant_message,
822
- tools=tools,
823
- response_format=response_format,
824
- tool_choice=tool_choice,
825
- run_response=run_response,
826
- ):
827
- yield from self._populate_stream_data_and_assistant_message(
828
- stream_data=stream_data,
829
- assistant_message=assistant_message,
830
- model_response_delta=model_response_delta,
831
- )
832
-
833
- # Add final metrics to assistant message
834
- self._populate_assistant_message(assistant_message=assistant_message, provider_response=model_response_delta)
835
-
836
- async def aprocess_response_stream(
837
- self,
838
- messages: List[Message],
839
- assistant_message: Message,
840
- stream_data: MessageData,
841
- response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
842
- tools: Optional[List[Dict[str, Any]]] = None,
843
- tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
844
- run_response: Optional[RunOutput] = None,
845
- ) -> AsyncIterator[ModelResponse]:
846
- """Process the asynchronous response stream."""
847
- async for model_response_delta in self.ainvoke_stream(
848
- messages=messages,
849
- assistant_message=assistant_message,
850
- tools=tools,
851
- response_format=response_format,
852
- tool_choice=tool_choice,
853
- run_response=run_response,
854
- ):
855
- for model_response in self._populate_stream_data_and_assistant_message(
856
- stream_data=stream_data,
857
- assistant_message=assistant_message,
858
- model_response_delta=model_response_delta,
859
- ):
860
- yield model_response
861
-
862
- # Add final metrics to assistant message
863
- self._populate_assistant_message(assistant_message=assistant_message, provider_response=model_response_delta)
864
-
865
885
  def _parse_provider_response(self, response: Response, **kwargs) -> ModelResponse:
866
886
  """
867
887
  Parse the OpenAI response into a ModelResponse.
@@ -1,8 +1,12 @@
1
- from dataclasses import dataclass, field
1
+ from dataclasses import dataclass
2
2
  from os import getenv
3
- from typing import Optional
3
+ from typing import Any, Dict, List, Optional, Type, Union
4
4
 
5
+ from pydantic import BaseModel
6
+
7
+ from agno.exceptions import ModelAuthenticationError
5
8
  from agno.models.openai.like import OpenAILike
9
+ from agno.run.agent import RunOutput
6
10
 
7
11
 
8
12
  @dataclass
@@ -17,12 +21,65 @@ class OpenRouter(OpenAILike):
17
21
  api_key (Optional[str]): The API key.
18
22
  base_url (str): The base URL. Defaults to "https://openrouter.ai/api/v1".
19
23
  max_tokens (int): The maximum number of tokens. Defaults to 1024.
24
+ fallback_models (Optional[List[str]]): List of fallback model IDs to use if the primary model
25
+ fails due to rate limits, timeouts, or unavailability. OpenRouter will automatically try
26
+ these models in order. Example: ["anthropic/claude-sonnet-4", "deepseek/deepseek-r1"]
20
27
  """
21
28
 
22
29
  id: str = "gpt-4o"
23
30
  name: str = "OpenRouter"
24
31
  provider: str = "OpenRouter"
25
32
 
26
- api_key: Optional[str] = field(default_factory=lambda: getenv("OPENROUTER_API_KEY"))
33
+ api_key: Optional[str] = None
27
34
  base_url: str = "https://openrouter.ai/api/v1"
28
35
  max_tokens: int = 1024
36
+ models: Optional[List[str]] = None # Dynamic model routing https://openrouter.ai/docs/features/model-routing
37
+
38
+ def _get_client_params(self) -> Dict[str, Any]:
39
+ """
40
+ Returns client parameters for API requests, checking for OPENROUTER_API_KEY.
41
+
42
+ Returns:
43
+ Dict[str, Any]: A dictionary of client parameters for API requests.
44
+ """
45
+ # Fetch API key from env if not already set
46
+ if not self.api_key:
47
+ self.api_key = getenv("OPENROUTER_API_KEY")
48
+ if not self.api_key:
49
+ raise ModelAuthenticationError(
50
+ message="OPENROUTER_API_KEY not set. Please set the OPENROUTER_API_KEY environment variable.",
51
+ model_name=self.name,
52
+ )
53
+
54
+ return super()._get_client_params()
55
+
56
+ def get_request_params(
57
+ self,
58
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
59
+ tools: Optional[List[Dict[str, Any]]] = None,
60
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
61
+ run_response: Optional[RunOutput] = None,
62
+ ) -> Dict[str, Any]:
63
+ """
64
+ Returns keyword arguments for API requests, including fallback models configuration.
65
+
66
+ Returns:
67
+ Dict[str, Any]: A dictionary of keyword arguments for API requests.
68
+ """
69
+ # Get base request params from parent class
70
+ request_params = super().get_request_params(
71
+ response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
72
+ )
73
+
74
+ # Add fallback models to extra_body if specified
75
+ if self.models:
76
+ # Get existing extra_body or create new dict
77
+ extra_body = request_params.get("extra_body") or {}
78
+
79
+ # Merge fallback models into extra_body
80
+ extra_body["models"] = self.models
81
+
82
+ # Update request params
83
+ request_params["extra_body"] = extra_body
84
+
85
+ return request_params
@@ -4,7 +4,7 @@ from typing import Any, Dict, Optional, Type, Union
4
4
 
5
5
  from pydantic import BaseModel
6
6
 
7
- from agno.exceptions import ModelProviderError
7
+ from agno.exceptions import ModelAuthenticationError, ModelProviderError
8
8
  from agno.models.message import Citations, UrlCitation
9
9
  from agno.models.metrics import Metrics
10
10
  from agno.models.response import ModelResponse
@@ -50,6 +50,22 @@ class Perplexity(OpenAILike):
50
50
  supports_native_structured_outputs: bool = False
51
51
  supports_json_schema_outputs: bool = True
52
52
 
53
+ def _get_client_params(self) -> Dict[str, Any]:
54
+ """
55
+ Returns client parameters for API requests, checking for PERPLEXITY_API_KEY.
56
+
57
+ Returns:
58
+ Dict[str, Any]: A dictionary of client parameters for API requests.
59
+ """
60
+ if not self.api_key:
61
+ self.api_key = getenv("PERPLEXITY_API_KEY")
62
+ if not self.api_key:
63
+ raise ModelAuthenticationError(
64
+ message="PERPLEXITY_API_KEY not set. Please set the PERPLEXITY_API_KEY environment variable.",
65
+ model_name=self.name,
66
+ )
67
+ return super()._get_client_params()
68
+
53
69
  def get_request_params(
54
70
  self,
55
71
  response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
@@ -1,8 +1,8 @@
1
- from dataclasses import dataclass, field
1
+ from dataclasses import dataclass
2
2
  from os import getenv
3
3
  from typing import Any, Dict, Optional, cast
4
4
 
5
- from agno.exceptions import ModelProviderError
5
+ from agno.exceptions import ModelAuthenticationError
6
6
  from agno.models.openai.like import OpenAILike
7
7
 
8
8
  try:
@@ -30,20 +30,21 @@ class Portkey(OpenAILike):
30
30
  name: str = "Portkey"
31
31
  provider: str = "Portkey"
32
32
 
33
- portkey_api_key: Optional[str] = field(default_factory=lambda: getenv("PORTKEY_API_KEY"))
34
- virtual_key: Optional[str] = field(default_factory=lambda: getenv("PORTKEY_VIRTUAL_KEY"))
33
+ portkey_api_key: Optional[str] = None
34
+ virtual_key: Optional[str] = None
35
35
  config: Optional[Dict[str, Any]] = None
36
36
  base_url: str = PORTKEY_GATEWAY_URL
37
37
 
38
38
  def _get_client_params(self) -> Dict[str, Any]:
39
39
  # Check for required keys
40
40
  if not self.portkey_api_key:
41
- raise ModelProviderError(
41
+ raise ModelAuthenticationError(
42
42
  message="PORTKEY_API_KEY not set. Please set the PORTKEY_API_KEY environment variable.",
43
43
  model_name=self.name,
44
- model_id=self.id,
45
44
  )
46
45
 
46
+ self.virtual_key = self.virtual_key or getenv("PORTKEY_VIRTUAL_KEY")
47
+
47
48
  # Create headers using Portkey's createHeaders function
48
49
  header_params: Dict[str, Any] = {
49
50
  "api_key": self.portkey_api_key,
@@ -1,11 +1,13 @@
1
- from dataclasses import dataclass, field
1
+ from dataclasses import dataclass
2
2
  from os import getenv
3
3
  from typing import Any, Dict, List, Optional, Type, Union
4
4
 
5
5
  from pydantic import BaseModel
6
6
 
7
+ from agno.exceptions import ModelAuthenticationError
7
8
  from agno.models.openai.like import OpenAILike
8
9
  from agno.run.agent import RunOutput
10
+ from agno.run.team import TeamRunOutput
9
11
 
10
12
 
11
13
  @dataclass
@@ -25,18 +27,36 @@ class Requesty(OpenAILike):
25
27
  name: str = "Requesty"
26
28
  provider: str = "Requesty"
27
29
 
28
- api_key: Optional[str] = field(default_factory=lambda: getenv("REQUESTY_API_KEY"))
30
+ api_key: Optional[str] = None
29
31
  base_url: str = "https://router.requesty.ai/v1"
30
32
  max_tokens: int = 1024
31
33
 
34
+ def _get_client_params(self) -> Dict[str, Any]:
35
+ """
36
+ Returns client parameters for API requests, checking for REQUESTY_API_KEY.
37
+
38
+ Returns:
39
+ Dict[str, Any]: A dictionary of client parameters for API requests.
40
+ """
41
+ if not self.api_key:
42
+ self.api_key = getenv("REQUESTY_API_KEY")
43
+ if not self.api_key:
44
+ raise ModelAuthenticationError(
45
+ message="REQUESTY_API_KEY not set. Please set the REQUESTY_API_KEY environment variable.",
46
+ model_name=self.name,
47
+ )
48
+ return super()._get_client_params()
49
+
32
50
  def get_request_params(
33
51
  self,
34
52
  response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
35
53
  tools: Optional[List[Dict[str, Any]]] = None,
36
54
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
37
- run_response: Optional[RunOutput] = None,
55
+ run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
38
56
  ) -> Dict[str, Any]:
39
- params = super().get_request_params(response_format=response_format, tools=tools, tool_choice=tool_choice)
57
+ params = super().get_request_params(
58
+ response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
59
+ )
40
60
 
41
61
  if "extra_body" not in params:
42
62
  params["extra_body"] = {}