agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314)
  1. agno/agent/agent.py +5540 -2273
  2. agno/api/api.py +2 -0
  3. agno/api/os.py +1 -1
  4. agno/compression/__init__.py +3 -0
  5. agno/compression/manager.py +247 -0
  6. agno/culture/__init__.py +3 -0
  7. agno/culture/manager.py +956 -0
  8. agno/db/async_postgres/__init__.py +3 -0
  9. agno/db/base.py +689 -6
  10. agno/db/dynamo/dynamo.py +933 -37
  11. agno/db/dynamo/schemas.py +174 -10
  12. agno/db/dynamo/utils.py +63 -4
  13. agno/db/firestore/firestore.py +831 -9
  14. agno/db/firestore/schemas.py +51 -0
  15. agno/db/firestore/utils.py +102 -4
  16. agno/db/gcs_json/gcs_json_db.py +660 -12
  17. agno/db/gcs_json/utils.py +60 -26
  18. agno/db/in_memory/in_memory_db.py +287 -14
  19. agno/db/in_memory/utils.py +60 -2
  20. agno/db/json/json_db.py +590 -14
  21. agno/db/json/utils.py +60 -26
  22. agno/db/migrations/manager.py +199 -0
  23. agno/db/migrations/v1_to_v2.py +43 -13
  24. agno/db/migrations/versions/__init__.py +0 -0
  25. agno/db/migrations/versions/v2_3_0.py +938 -0
  26. agno/db/mongo/__init__.py +15 -1
  27. agno/db/mongo/async_mongo.py +2760 -0
  28. agno/db/mongo/mongo.py +879 -11
  29. agno/db/mongo/schemas.py +42 -0
  30. agno/db/mongo/utils.py +80 -8
  31. agno/db/mysql/__init__.py +2 -1
  32. agno/db/mysql/async_mysql.py +2912 -0
  33. agno/db/mysql/mysql.py +946 -68
  34. agno/db/mysql/schemas.py +72 -10
  35. agno/db/mysql/utils.py +198 -7
  36. agno/db/postgres/__init__.py +2 -1
  37. agno/db/postgres/async_postgres.py +2579 -0
  38. agno/db/postgres/postgres.py +942 -57
  39. agno/db/postgres/schemas.py +81 -18
  40. agno/db/postgres/utils.py +164 -2
  41. agno/db/redis/redis.py +671 -7
  42. agno/db/redis/schemas.py +50 -0
  43. agno/db/redis/utils.py +65 -7
  44. agno/db/schemas/__init__.py +2 -1
  45. agno/db/schemas/culture.py +120 -0
  46. agno/db/schemas/evals.py +1 -0
  47. agno/db/schemas/memory.py +17 -2
  48. agno/db/singlestore/schemas.py +63 -0
  49. agno/db/singlestore/singlestore.py +949 -83
  50. agno/db/singlestore/utils.py +60 -2
  51. agno/db/sqlite/__init__.py +2 -1
  52. agno/db/sqlite/async_sqlite.py +2911 -0
  53. agno/db/sqlite/schemas.py +62 -0
  54. agno/db/sqlite/sqlite.py +965 -46
  55. agno/db/sqlite/utils.py +169 -8
  56. agno/db/surrealdb/__init__.py +3 -0
  57. agno/db/surrealdb/metrics.py +292 -0
  58. agno/db/surrealdb/models.py +334 -0
  59. agno/db/surrealdb/queries.py +71 -0
  60. agno/db/surrealdb/surrealdb.py +1908 -0
  61. agno/db/surrealdb/utils.py +147 -0
  62. agno/db/utils.py +2 -0
  63. agno/eval/__init__.py +10 -0
  64. agno/eval/accuracy.py +75 -55
  65. agno/eval/agent_as_judge.py +861 -0
  66. agno/eval/base.py +29 -0
  67. agno/eval/performance.py +16 -7
  68. agno/eval/reliability.py +28 -16
  69. agno/eval/utils.py +35 -17
  70. agno/exceptions.py +27 -2
  71. agno/filters.py +354 -0
  72. agno/guardrails/prompt_injection.py +1 -0
  73. agno/hooks/__init__.py +3 -0
  74. agno/hooks/decorator.py +164 -0
  75. agno/integrations/discord/client.py +1 -1
  76. agno/knowledge/chunking/agentic.py +13 -10
  77. agno/knowledge/chunking/fixed.py +4 -1
  78. agno/knowledge/chunking/semantic.py +9 -4
  79. agno/knowledge/chunking/strategy.py +59 -15
  80. agno/knowledge/embedder/fastembed.py +1 -1
  81. agno/knowledge/embedder/nebius.py +1 -1
  82. agno/knowledge/embedder/ollama.py +8 -0
  83. agno/knowledge/embedder/openai.py +8 -8
  84. agno/knowledge/embedder/sentence_transformer.py +6 -2
  85. agno/knowledge/embedder/vllm.py +262 -0
  86. agno/knowledge/knowledge.py +1618 -318
  87. agno/knowledge/reader/base.py +6 -2
  88. agno/knowledge/reader/csv_reader.py +8 -10
  89. agno/knowledge/reader/docx_reader.py +5 -6
  90. agno/knowledge/reader/field_labeled_csv_reader.py +16 -20
  91. agno/knowledge/reader/json_reader.py +5 -4
  92. agno/knowledge/reader/markdown_reader.py +8 -8
  93. agno/knowledge/reader/pdf_reader.py +17 -19
  94. agno/knowledge/reader/pptx_reader.py +101 -0
  95. agno/knowledge/reader/reader_factory.py +32 -3
  96. agno/knowledge/reader/s3_reader.py +3 -3
  97. agno/knowledge/reader/tavily_reader.py +193 -0
  98. agno/knowledge/reader/text_reader.py +22 -10
  99. agno/knowledge/reader/web_search_reader.py +1 -48
  100. agno/knowledge/reader/website_reader.py +10 -10
  101. agno/knowledge/reader/wikipedia_reader.py +33 -1
  102. agno/knowledge/types.py +1 -0
  103. agno/knowledge/utils.py +72 -7
  104. agno/media.py +22 -6
  105. agno/memory/__init__.py +14 -1
  106. agno/memory/manager.py +544 -83
  107. agno/memory/strategies/__init__.py +15 -0
  108. agno/memory/strategies/base.py +66 -0
  109. agno/memory/strategies/summarize.py +196 -0
  110. agno/memory/strategies/types.py +37 -0
  111. agno/models/aimlapi/aimlapi.py +17 -0
  112. agno/models/anthropic/claude.py +515 -40
  113. agno/models/aws/bedrock.py +102 -21
  114. agno/models/aws/claude.py +131 -274
  115. agno/models/azure/ai_foundry.py +41 -19
  116. agno/models/azure/openai_chat.py +39 -8
  117. agno/models/base.py +1249 -525
  118. agno/models/cerebras/cerebras.py +91 -21
  119. agno/models/cerebras/cerebras_openai.py +21 -2
  120. agno/models/cohere/chat.py +40 -6
  121. agno/models/cometapi/cometapi.py +18 -1
  122. agno/models/dashscope/dashscope.py +2 -3
  123. agno/models/deepinfra/deepinfra.py +18 -1
  124. agno/models/deepseek/deepseek.py +69 -3
  125. agno/models/fireworks/fireworks.py +18 -1
  126. agno/models/google/gemini.py +877 -80
  127. agno/models/google/utils.py +22 -0
  128. agno/models/groq/groq.py +51 -18
  129. agno/models/huggingface/huggingface.py +17 -6
  130. agno/models/ibm/watsonx.py +16 -6
  131. agno/models/internlm/internlm.py +18 -1
  132. agno/models/langdb/langdb.py +13 -1
  133. agno/models/litellm/chat.py +44 -9
  134. agno/models/litellm/litellm_openai.py +18 -1
  135. agno/models/message.py +28 -5
  136. agno/models/meta/llama.py +47 -14
  137. agno/models/meta/llama_openai.py +22 -17
  138. agno/models/mistral/mistral.py +8 -4
  139. agno/models/nebius/nebius.py +6 -7
  140. agno/models/nvidia/nvidia.py +20 -3
  141. agno/models/ollama/chat.py +24 -8
  142. agno/models/openai/chat.py +104 -29
  143. agno/models/openai/responses.py +101 -81
  144. agno/models/openrouter/openrouter.py +60 -3
  145. agno/models/perplexity/perplexity.py +17 -1
  146. agno/models/portkey/portkey.py +7 -6
  147. agno/models/requesty/requesty.py +24 -4
  148. agno/models/response.py +73 -2
  149. agno/models/sambanova/sambanova.py +20 -3
  150. agno/models/siliconflow/siliconflow.py +19 -2
  151. agno/models/together/together.py +20 -3
  152. agno/models/utils.py +254 -8
  153. agno/models/vercel/v0.py +20 -3
  154. agno/models/vertexai/__init__.py +0 -0
  155. agno/models/vertexai/claude.py +190 -0
  156. agno/models/vllm/vllm.py +19 -14
  157. agno/models/xai/xai.py +19 -2
  158. agno/os/app.py +549 -152
  159. agno/os/auth.py +190 -3
  160. agno/os/config.py +23 -0
  161. agno/os/interfaces/a2a/router.py +8 -11
  162. agno/os/interfaces/a2a/utils.py +1 -1
  163. agno/os/interfaces/agui/router.py +18 -3
  164. agno/os/interfaces/agui/utils.py +152 -39
  165. agno/os/interfaces/slack/router.py +55 -37
  166. agno/os/interfaces/slack/slack.py +9 -1
  167. agno/os/interfaces/whatsapp/router.py +0 -1
  168. agno/os/interfaces/whatsapp/security.py +3 -1
  169. agno/os/mcp.py +110 -52
  170. agno/os/middleware/__init__.py +2 -0
  171. agno/os/middleware/jwt.py +676 -112
  172. agno/os/router.py +40 -1478
  173. agno/os/routers/agents/__init__.py +3 -0
  174. agno/os/routers/agents/router.py +599 -0
  175. agno/os/routers/agents/schema.py +261 -0
  176. agno/os/routers/evals/evals.py +96 -39
  177. agno/os/routers/evals/schemas.py +65 -33
  178. agno/os/routers/evals/utils.py +80 -10
  179. agno/os/routers/health.py +10 -4
  180. agno/os/routers/knowledge/knowledge.py +196 -38
  181. agno/os/routers/knowledge/schemas.py +82 -22
  182. agno/os/routers/memory/memory.py +279 -52
  183. agno/os/routers/memory/schemas.py +46 -17
  184. agno/os/routers/metrics/metrics.py +20 -8
  185. agno/os/routers/metrics/schemas.py +16 -16
  186. agno/os/routers/session/session.py +462 -34
  187. agno/os/routers/teams/__init__.py +3 -0
  188. agno/os/routers/teams/router.py +512 -0
  189. agno/os/routers/teams/schema.py +257 -0
  190. agno/os/routers/traces/__init__.py +3 -0
  191. agno/os/routers/traces/schemas.py +414 -0
  192. agno/os/routers/traces/traces.py +499 -0
  193. agno/os/routers/workflows/__init__.py +3 -0
  194. agno/os/routers/workflows/router.py +624 -0
  195. agno/os/routers/workflows/schema.py +75 -0
  196. agno/os/schema.py +256 -693
  197. agno/os/scopes.py +469 -0
  198. agno/os/utils.py +514 -36
  199. agno/reasoning/anthropic.py +80 -0
  200. agno/reasoning/gemini.py +73 -0
  201. agno/reasoning/openai.py +5 -0
  202. agno/reasoning/vertexai.py +76 -0
  203. agno/run/__init__.py +6 -0
  204. agno/run/agent.py +155 -32
  205. agno/run/base.py +55 -3
  206. agno/run/requirement.py +181 -0
  207. agno/run/team.py +125 -38
  208. agno/run/workflow.py +72 -18
  209. agno/session/agent.py +102 -89
  210. agno/session/summary.py +56 -15
  211. agno/session/team.py +164 -90
  212. agno/session/workflow.py +405 -40
  213. agno/table.py +10 -0
  214. agno/team/team.py +3974 -1903
  215. agno/tools/dalle.py +2 -4
  216. agno/tools/eleven_labs.py +23 -25
  217. agno/tools/exa.py +21 -16
  218. agno/tools/file.py +153 -23
  219. agno/tools/file_generation.py +16 -10
  220. agno/tools/firecrawl.py +15 -7
  221. agno/tools/function.py +193 -38
  222. agno/tools/gmail.py +238 -14
  223. agno/tools/google_drive.py +271 -0
  224. agno/tools/googlecalendar.py +36 -8
  225. agno/tools/googlesheets.py +20 -5
  226. agno/tools/jira.py +20 -0
  227. agno/tools/mcp/__init__.py +10 -0
  228. agno/tools/mcp/mcp.py +331 -0
  229. agno/tools/mcp/multi_mcp.py +347 -0
  230. agno/tools/mcp/params.py +24 -0
  231. agno/tools/mcp_toolbox.py +3 -3
  232. agno/tools/models/nebius.py +5 -5
  233. agno/tools/models_labs.py +20 -10
  234. agno/tools/nano_banana.py +151 -0
  235. agno/tools/notion.py +204 -0
  236. agno/tools/parallel.py +314 -0
  237. agno/tools/postgres.py +76 -36
  238. agno/tools/redshift.py +406 -0
  239. agno/tools/scrapegraph.py +1 -1
  240. agno/tools/shopify.py +1519 -0
  241. agno/tools/slack.py +18 -3
  242. agno/tools/spotify.py +919 -0
  243. agno/tools/tavily.py +146 -0
  244. agno/tools/toolkit.py +25 -0
  245. agno/tools/workflow.py +8 -1
  246. agno/tools/yfinance.py +12 -11
  247. agno/tracing/__init__.py +12 -0
  248. agno/tracing/exporter.py +157 -0
  249. agno/tracing/schemas.py +276 -0
  250. agno/tracing/setup.py +111 -0
  251. agno/utils/agent.py +938 -0
  252. agno/utils/cryptography.py +22 -0
  253. agno/utils/dttm.py +33 -0
  254. agno/utils/events.py +151 -3
  255. agno/utils/gemini.py +15 -5
  256. agno/utils/hooks.py +118 -4
  257. agno/utils/http.py +113 -2
  258. agno/utils/knowledge.py +12 -5
  259. agno/utils/log.py +1 -0
  260. agno/utils/mcp.py +92 -2
  261. agno/utils/media.py +187 -1
  262. agno/utils/merge_dict.py +3 -3
  263. agno/utils/message.py +60 -0
  264. agno/utils/models/ai_foundry.py +9 -2
  265. agno/utils/models/claude.py +49 -14
  266. agno/utils/models/cohere.py +9 -2
  267. agno/utils/models/llama.py +9 -2
  268. agno/utils/models/mistral.py +4 -2
  269. agno/utils/print_response/agent.py +109 -16
  270. agno/utils/print_response/team.py +223 -30
  271. agno/utils/print_response/workflow.py +251 -34
  272. agno/utils/streamlit.py +1 -1
  273. agno/utils/team.py +98 -9
  274. agno/utils/tokens.py +657 -0
  275. agno/vectordb/base.py +39 -7
  276. agno/vectordb/cassandra/cassandra.py +21 -5
  277. agno/vectordb/chroma/chromadb.py +43 -12
  278. agno/vectordb/clickhouse/clickhousedb.py +21 -5
  279. agno/vectordb/couchbase/couchbase.py +29 -5
  280. agno/vectordb/lancedb/lance_db.py +92 -181
  281. agno/vectordb/langchaindb/langchaindb.py +24 -4
  282. agno/vectordb/lightrag/lightrag.py +17 -3
  283. agno/vectordb/llamaindex/llamaindexdb.py +25 -5
  284. agno/vectordb/milvus/milvus.py +50 -37
  285. agno/vectordb/mongodb/__init__.py +7 -1
  286. agno/vectordb/mongodb/mongodb.py +36 -30
  287. agno/vectordb/pgvector/pgvector.py +201 -77
  288. agno/vectordb/pineconedb/pineconedb.py +41 -23
  289. agno/vectordb/qdrant/qdrant.py +67 -54
  290. agno/vectordb/redis/__init__.py +9 -0
  291. agno/vectordb/redis/redisdb.py +682 -0
  292. agno/vectordb/singlestore/singlestore.py +50 -29
  293. agno/vectordb/surrealdb/surrealdb.py +31 -41
  294. agno/vectordb/upstashdb/upstashdb.py +34 -6
  295. agno/vectordb/weaviate/weaviate.py +53 -14
  296. agno/workflow/__init__.py +2 -0
  297. agno/workflow/agent.py +299 -0
  298. agno/workflow/condition.py +120 -18
  299. agno/workflow/loop.py +77 -10
  300. agno/workflow/parallel.py +231 -143
  301. agno/workflow/router.py +118 -17
  302. agno/workflow/step.py +609 -170
  303. agno/workflow/steps.py +73 -6
  304. agno/workflow/types.py +96 -21
  305. agno/workflow/workflow.py +2039 -262
  306. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/METADATA +201 -66
  307. agno-2.3.13.dist-info/RECORD +613 -0
  308. agno/tools/googlesearch.py +0 -98
  309. agno/tools/mcp.py +0 -679
  310. agno/tools/memori.py +0 -339
  311. agno-2.1.2.dist-info/RECORD +0 -543
  312. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +0 -0
  313. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/licenses/LICENSE +0 -0
  314. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
@@ -12,6 +12,7 @@ from agno.models.message import Message
12
12
  from agno.models.metrics import Metrics
13
13
  from agno.models.response import ModelResponse
14
14
  from agno.run.agent import RunOutput
15
+ from agno.utils.http import get_default_async_client, get_default_sync_client
15
16
  from agno.utils.log import log_debug, log_error, log_warning
16
17
 
17
18
  try:
@@ -51,6 +52,7 @@ class Cerebras(Model):
51
52
  temperature: Optional[float] = None
52
53
  top_p: Optional[float] = None
53
54
  top_k: Optional[int] = None
55
+ strict_output: bool = True # When True, guarantees schema adherence for structured outputs. When False, attempts to follow schema as a guide but may occasionally deviate
54
56
  extra_headers: Optional[Any] = None
55
57
  extra_query: Optional[Any] = None
56
58
  extra_body: Optional[Any] = None
@@ -63,7 +65,7 @@ class Cerebras(Model):
63
65
  max_retries: Optional[int] = None
64
66
  default_headers: Optional[Any] = None
65
67
  default_query: Optional[Any] = None
66
- http_client: Optional[httpx.Client] = None
68
+ http_client: Optional[Union[httpx.Client, httpx.AsyncClient]] = None
67
69
  client_params: Optional[Dict[str, Any]] = None
68
70
 
69
71
  # Cerebras clients
@@ -102,12 +104,15 @@ class Cerebras(Model):
102
104
  Returns:
103
105
  CerebrasClient: An instance of the Cerebras client.
104
106
  """
105
- if self.client:
107
+ if self.client and not self.client.is_closed():
106
108
  return self.client
107
109
 
108
110
  client_params: Dict[str, Any] = self._get_client_params()
109
111
  if self.http_client is not None:
110
112
  client_params["http_client"] = self.http_client
113
+ else:
114
+ # Use global sync client when no custom http_client is provided
115
+ client_params["http_client"] = get_default_sync_client()
111
116
  self.client = CerebrasClient(**client_params)
112
117
  return self.client
113
118
 
@@ -118,17 +123,15 @@ class Cerebras(Model):
118
123
  Returns:
119
124
  AsyncCerebras: An instance of the asynchronous Cerebras client.
120
125
  """
121
- if self.async_client:
126
+ if self.async_client and not self.async_client.is_closed():
122
127
  return self.async_client
123
128
 
124
129
  client_params: Dict[str, Any] = self._get_client_params()
125
- if self.http_client:
130
+ if self.http_client and isinstance(self.http_client, httpx.AsyncClient):
126
131
  client_params["http_client"] = self.http_client
127
132
  else:
128
- # Create a new async HTTP client with custom limits
129
- client_params["http_client"] = httpx.AsyncClient(
130
- limits=httpx.Limits(max_connections=1000, max_keepalive_connections=100)
131
- )
133
+ # Use global async client when no custom http_client is provided
134
+ client_params["http_client"] = get_default_async_client()
132
135
  self.async_client = AsyncCerebrasClient(**client_params)
133
136
  return self.async_client
134
137
 
@@ -186,10 +189,10 @@ class Cerebras(Model):
186
189
  and response_format.get("type") == "json_schema"
187
190
  and isinstance(response_format.get("json_schema"), dict)
188
191
  ):
189
- # Ensure json_schema has strict=True as required by Cerebras API
192
+ # Ensure json_schema has strict parameter set
190
193
  schema = response_format["json_schema"]
191
194
  if isinstance(schema.get("schema"), dict) and "strict" not in schema:
192
- schema["strict"] = True
195
+ schema["strict"] = self.strict_output
193
196
 
194
197
  request_params["response_format"] = response_format
195
198
 
@@ -209,6 +212,7 @@ class Cerebras(Model):
209
212
  tools: Optional[List[Dict[str, Any]]] = None,
210
213
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
211
214
  run_response: Optional[RunOutput] = None,
215
+ compress_tool_results: bool = False,
212
216
  ) -> ModelResponse:
213
217
  """
214
218
  Send a chat completion request to the Cerebras API.
@@ -225,7 +229,7 @@ class Cerebras(Model):
225
229
  assistant_message.metrics.start_timer()
226
230
  provider_response = self.get_client().chat.completions.create(
227
231
  model=self.id,
228
- messages=[self._format_message(m) for m in messages], # type: ignore
232
+ messages=[self._format_message(m, compress_tool_results) for m in messages], # type: ignore
229
233
  **self.get_request_params(response_format=response_format, tools=tools),
230
234
  )
231
235
  assistant_message.metrics.stop_timer()
@@ -242,6 +246,7 @@ class Cerebras(Model):
242
246
  tools: Optional[List[Dict[str, Any]]] = None,
243
247
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
244
248
  run_response: Optional[RunOutput] = None,
249
+ compress_tool_results: bool = False,
245
250
  ) -> ModelResponse:
246
251
  """
247
252
  Sends an asynchronous chat completion request to the Cerebras API.
@@ -258,7 +263,7 @@ class Cerebras(Model):
258
263
  assistant_message.metrics.start_timer()
259
264
  provider_response = await self.get_async_client().chat.completions.create(
260
265
  model=self.id,
261
- messages=[self._format_message(m) for m in messages], # type: ignore
266
+ messages=[self._format_message(m, compress_tool_results) for m in messages], # type: ignore
262
267
  **self.get_request_params(response_format=response_format, tools=tools),
263
268
  )
264
269
  assistant_message.metrics.stop_timer()
@@ -275,6 +280,7 @@ class Cerebras(Model):
275
280
  tools: Optional[List[Dict[str, Any]]] = None,
276
281
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
277
282
  run_response: Optional[RunOutput] = None,
283
+ compress_tool_results: bool = False,
278
284
  ) -> Iterator[ModelResponse]:
279
285
  """
280
286
  Send a streaming chat completion request to the Cerebras API.
@@ -292,7 +298,7 @@ class Cerebras(Model):
292
298
 
293
299
  for chunk in self.get_client().chat.completions.create(
294
300
  model=self.id,
295
- messages=[self._format_message(m) for m in messages], # type: ignore
301
+ messages=[self._format_message(m, compress_tool_results) for m in messages], # type: ignore
296
302
  stream=True,
297
303
  **self.get_request_params(response_format=response_format, tools=tools),
298
304
  ):
@@ -308,6 +314,7 @@ class Cerebras(Model):
308
314
  tools: Optional[List[Dict[str, Any]]] = None,
309
315
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
310
316
  run_response: Optional[RunOutput] = None,
317
+ compress_tool_results: bool = False,
311
318
  ) -> AsyncIterator[ModelResponse]:
312
319
  """
313
320
  Sends an asynchronous streaming chat completion request to the Cerebras API.
@@ -325,7 +332,7 @@ class Cerebras(Model):
325
332
 
326
333
  async_stream = await self.get_async_client().chat.completions.create(
327
334
  model=self.id,
328
- messages=[self._format_message(m) for m in messages], # type: ignore
335
+ messages=[self._format_message(m, compress_tool_results) for m in messages], # type: ignore
329
336
  stream=True,
330
337
  **self.get_request_params(response_format=response_format, tools=tools),
331
338
  )
@@ -335,20 +342,27 @@ class Cerebras(Model):
335
342
 
336
343
  assistant_message.metrics.stop_timer()
337
344
 
338
- def _format_message(self, message: Message) -> Dict[str, Any]:
345
+ def _format_message(self, message: Message, compress_tool_results: bool = False) -> Dict[str, Any]:
339
346
  """
340
347
  Format a message into the format expected by the Cerebras API.
341
348
 
342
349
  Args:
343
350
  message (Message): The message to format.
351
+ compress_tool_results: Whether to compress tool results.
344
352
 
345
353
  Returns:
346
354
  Dict[str, Any]: The formatted message.
347
355
  """
356
+ # Use compressed content for tool messages if compression is active
357
+ if message.role == "tool":
358
+ content = message.get_content(use_compressed_content=compress_tool_results)
359
+ else:
360
+ content = message.content if message.content is not None else ""
361
+
348
362
  # Basic message content
349
363
  message_dict: Dict[str, Any] = {
350
364
  "role": message.role,
351
- "content": message.content if message.content is not None else "",
365
+ "content": content,
352
366
  }
353
367
 
354
368
  # Add name if present
@@ -377,7 +391,7 @@ class Cerebras(Model):
377
391
  message_dict = {
378
392
  "role": "tool",
379
393
  "tool_call_id": message.tool_call_id,
380
- "content": message.content if message.content is not None else "",
394
+ "content": content,
381
395
  }
382
396
 
383
397
  # Ensure no None values in the message
@@ -456,18 +470,19 @@ class Cerebras(Model):
456
470
  if choice_delta.content:
457
471
  model_response.content = choice_delta.content
458
472
 
459
- # Add tool calls
473
+ # Add tool calls - preserve index for proper aggregation in parse_tool_calls
460
474
  if choice_delta.tool_calls:
461
475
  model_response.tool_calls = [
462
476
  {
477
+ "index": tool_call.index if hasattr(tool_call, "index") else idx,
463
478
  "id": tool_call.id,
464
479
  "type": tool_call.type,
465
480
  "function": {
466
- "name": tool_call.function.name,
467
- "arguments": tool_call.function.arguments,
481
+ "name": tool_call.function.name if tool_call.function else None,
482
+ "arguments": tool_call.function.arguments if tool_call.function else None,
468
483
  },
469
484
  }
470
- for tool_call in choice_delta.tool_calls
485
+ for idx, tool_call in enumerate(choice_delta.tool_calls)
471
486
  ]
472
487
 
473
488
  # Add usage metrics
@@ -476,6 +491,61 @@ class Cerebras(Model):
476
491
 
477
492
  return model_response
478
493
 
494
+ def parse_tool_calls(self, tool_calls_data: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
495
+ """
496
+ Build complete tool calls from streamed tool call delta data.
497
+
498
+ Cerebras streams tool calls incrementally with partial data in each chunk.
499
+ This method aggregates those chunks by index to produce complete tool calls.
500
+
501
+ Args:
502
+ tool_calls_data: List of tool call deltas from streaming chunks.
503
+
504
+ Returns:
505
+ List[Dict[str, Any]]: List of fully-formed tool call dicts.
506
+ """
507
+ tool_calls: List[Dict[str, Any]] = []
508
+
509
+ for tool_call_delta in tool_calls_data:
510
+ # Get the index for this tool call (default to 0 if not present)
511
+ index = tool_call_delta.get("index", 0)
512
+
513
+ # Extend the list if needed
514
+ while len(tool_calls) <= index:
515
+ tool_calls.append(
516
+ {
517
+ "id": None,
518
+ "type": None,
519
+ "function": {
520
+ "name": "",
521
+ "arguments": "",
522
+ },
523
+ }
524
+ )
525
+
526
+ tool_call_entry = tool_calls[index]
527
+
528
+ # Update id if present
529
+ if tool_call_delta.get("id"):
530
+ tool_call_entry["id"] = tool_call_delta["id"]
531
+
532
+ # Update type if present
533
+ if tool_call_delta.get("type"):
534
+ tool_call_entry["type"] = tool_call_delta["type"]
535
+
536
+ # Update function name and arguments (concatenate for streaming)
537
+ if tool_call_delta.get("function"):
538
+ func_delta = tool_call_delta["function"]
539
+ if func_delta.get("name"):
540
+ tool_call_entry["function"]["name"] += func_delta["name"]
541
+ if func_delta.get("arguments"):
542
+ tool_call_entry["function"]["arguments"] += func_delta["arguments"]
543
+
544
+ # Filter out any incomplete tool calls (missing id or function name)
545
+ complete_tool_calls = [tc for tc in tool_calls if tc.get("id") and tc.get("function", {}).get("name")]
546
+
547
+ return complete_tool_calls
548
+
479
549
  def _get_metrics(self, response_usage: Union[ChatCompletionResponseUsage, ChatChunkResponseUsage]) -> Metrics:
480
550
  """
481
551
  Parse the given Cerebras usage into an Agno Metrics object.
@@ -5,6 +5,7 @@ from typing import Any, Dict, List, Optional, Type, Union
5
5
 
6
6
  from pydantic import BaseModel
7
7
 
8
+ from agno.exceptions import ModelAuthenticationError
8
9
  from agno.models.message import Message
9
10
  from agno.models.openai.like import OpenAILike
10
11
  from agno.utils.log import log_debug
@@ -20,6 +21,22 @@ class CerebrasOpenAI(OpenAILike):
20
21
  base_url: str = "https://api.cerebras.ai/v1"
21
22
  api_key: Optional[str] = field(default_factory=lambda: getenv("CEREBRAS_API_KEY", None))
22
23
 
24
+ def _get_client_params(self) -> Dict[str, Any]:
25
+ """
26
+ Returns client parameters for API requests, checking for CEREBRAS_API_KEY.
27
+
28
+ Returns:
29
+ Dict[str, Any]: A dictionary of client parameters for API requests.
30
+ """
31
+ if not self.api_key:
32
+ self.api_key = getenv("CEREBRAS_API_KEY")
33
+ if not self.api_key:
34
+ raise ModelAuthenticationError(
35
+ message="CEREBRAS_API_KEY not set. Please set the CEREBRAS_API_KEY environment variable.",
36
+ model_name=self.name,
37
+ )
38
+ return super()._get_client_params()
39
+
23
40
  def get_request_params(
24
41
  self,
25
42
  response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
@@ -61,7 +78,7 @@ class CerebrasOpenAI(OpenAILike):
61
78
  log_debug(f"Calling {self.provider} with request parameters: {request_params}", log_level=2)
62
79
  return request_params
63
80
 
64
- def _format_message(self, message: Message) -> Dict[str, Any]:
81
+ def _format_message(self, message: Message, compress_tool_results: bool = False) -> Dict[str, Any]:
65
82
  """
66
83
  Format a message into the format expected by the Cerebras API.
67
84
 
@@ -71,6 +88,7 @@ class CerebrasOpenAI(OpenAILike):
71
88
  Returns:
72
89
  Dict[str, Any]: The formatted message.
73
90
  """
91
+
74
92
  # Basic message content
75
93
  message_dict: Dict[str, Any] = {
76
94
  "role": message.role,
@@ -100,10 +118,11 @@ class CerebrasOpenAI(OpenAILike):
100
118
 
101
119
  # Handle tool responses
102
120
  if message.role == "tool" and message.tool_call_id:
121
+ content = message.get_content(use_compressed_content=compress_tool_results)
103
122
  message_dict = {
104
123
  "role": "tool",
105
124
  "tool_call_id": message.tool_call_id,
106
- "content": message.content if message.content is not None else "",
125
+ "content": content if message.content is not None else "",
107
126
  }
108
127
 
109
128
  # Ensure no None values in the message
@@ -2,6 +2,7 @@ from dataclasses import dataclass
2
2
  from os import getenv
3
3
  from typing import Any, AsyncIterator, Dict, Iterator, List, Optional, Tuple, Type, Union
4
4
 
5
+ import httpx
5
6
  from pydantic import BaseModel
6
7
 
7
8
  from agno.exceptions import ModelProviderError
@@ -10,7 +11,8 @@ from agno.models.message import Message
10
11
  from agno.models.metrics import Metrics
11
12
  from agno.models.response import ModelResponse
12
13
  from agno.run.agent import RunOutput
13
- from agno.utils.log import log_debug, log_error
14
+ from agno.utils.http import get_default_async_client, get_default_sync_client
15
+ from agno.utils.log import log_debug, log_error, log_warning
14
16
  from agno.utils.models.cohere import format_messages
15
17
 
16
18
  try:
@@ -50,6 +52,7 @@ class Cohere(Model):
50
52
  # -*- Client parameters
51
53
  api_key: Optional[str] = None
52
54
  client_params: Optional[Dict[str, Any]] = None
55
+ http_client: Optional[Union[httpx.Client, httpx.AsyncClient]] = None
53
56
  # -*- Provide the Cohere client manually
54
57
  client: Optional[CohereClient] = None
55
58
  async_client: Optional[CohereAsyncClient] = None
@@ -66,6 +69,17 @@ class Cohere(Model):
66
69
 
67
70
  _client_params["api_key"] = self.api_key
68
71
 
72
+ if self.http_client:
73
+ if isinstance(self.http_client, httpx.Client):
74
+ _client_params["httpx_client"] = self.http_client
75
+ else:
76
+ log_warning("http_client is not an instance of httpx.Client. Using default global httpx.Client.")
77
+ # Use global sync client when user http_client is invalid
78
+ _client_params["httpx_client"] = get_default_sync_client()
79
+ else:
80
+ # Use global sync client when no custom http_client is provided
81
+ _client_params["httpx_client"] = get_default_sync_client()
82
+
69
83
  self.client = CohereClient(**_client_params)
70
84
  return self.client # type: ignore
71
85
 
@@ -78,10 +92,26 @@ class Cohere(Model):
78
92
  self.api_key = self.api_key or getenv("CO_API_KEY")
79
93
 
80
94
  if not self.api_key:
81
- log_error("CO_API_KEY not set. Please set the CO_API_KEY environment variable.")
95
+ raise ModelProviderError(
96
+ message="CO_API_KEY not set. Please set the CO_API_KEY environment variable.",
97
+ model_name=self.name,
98
+ model_id=self.id,
99
+ )
82
100
 
83
101
  _client_params["api_key"] = self.api_key
84
102
 
103
+ if self.http_client:
104
+ if isinstance(self.http_client, httpx.AsyncClient):
105
+ _client_params["httpx_client"] = self.http_client
106
+ else:
107
+ log_warning(
108
+ "http_client is not an instance of httpx.AsyncClient. Using default global httpx.AsyncClient."
109
+ )
110
+ # Use global async client when user http_client is invalid
111
+ _client_params["httpx_client"] = get_default_async_client()
112
+ else:
113
+ # Use global async client when no custom http_client is provided
114
+ _client_params["httpx_client"] = get_default_async_client()
85
115
  self.async_client = CohereAsyncClient(**_client_params)
86
116
  return self.async_client # type: ignore
87
117
 
@@ -155,6 +185,7 @@ class Cohere(Model):
155
185
  tools: Optional[List[Dict[str, Any]]] = None,
156
186
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
157
187
  run_response: Optional[RunOutput] = None,
188
+ compress_tool_results: bool = False,
158
189
  ) -> ModelResponse:
159
190
  """
160
191
  Invoke a non-streamed chat response from the Cohere API.
@@ -168,7 +199,7 @@ class Cohere(Model):
168
199
  assistant_message.metrics.start_timer()
169
200
  provider_response = self.get_client().chat(
170
201
  model=self.id,
171
- messages=format_messages(messages), # type: ignore
202
+ messages=format_messages(messages, compress_tool_results), # type: ignore
172
203
  **request_kwargs,
173
204
  ) # type: ignore
174
205
  assistant_message.metrics.stop_timer()
@@ -189,6 +220,7 @@ class Cohere(Model):
189
220
  tools: Optional[List[Dict[str, Any]]] = None,
190
221
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
191
222
  run_response: Optional[RunOutput] = None,
223
+ compress_tool_results: bool = False,
192
224
  ) -> Iterator[ModelResponse]:
193
225
  """
194
226
  Invoke a streamed chat response from the Cohere API.
@@ -205,7 +237,7 @@ class Cohere(Model):
205
237
 
206
238
  for response in self.get_client().chat_stream(
207
239
  model=self.id,
208
- messages=format_messages(messages), # type: ignore
240
+ messages=format_messages(messages, compress_tool_results), # type: ignore
209
241
  **request_kwargs,
210
242
  ):
211
243
  model_response, tool_use = self._parse_provider_response_delta(response, tool_use=tool_use)
@@ -225,6 +257,7 @@ class Cohere(Model):
225
257
  tools: Optional[List[Dict[str, Any]]] = None,
226
258
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
227
259
  run_response: Optional[RunOutput] = None,
260
+ compress_tool_results: bool = False,
228
261
  ) -> ModelResponse:
229
262
  """
230
263
  Asynchronously invoke a non-streamed chat response from the Cohere API.
@@ -238,7 +271,7 @@ class Cohere(Model):
238
271
  assistant_message.metrics.start_timer()
239
272
  provider_response = await self.get_async_client().chat(
240
273
  model=self.id,
241
- messages=format_messages(messages), # type: ignore
274
+ messages=format_messages(messages, compress_tool_results), # type: ignore
242
275
  **request_kwargs,
243
276
  )
244
277
  assistant_message.metrics.stop_timer()
@@ -259,6 +292,7 @@ class Cohere(Model):
259
292
  tools: Optional[List[Dict[str, Any]]] = None,
260
293
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
261
294
  run_response: Optional[RunOutput] = None,
295
+ compress_tool_results: bool = False,
262
296
  ) -> AsyncIterator[ModelResponse]:
263
297
  """
264
298
  Asynchronously invoke a streamed chat response from the Cohere API.
@@ -275,7 +309,7 @@ class Cohere(Model):
275
309
 
276
310
  async for response in self.get_async_client().chat_stream(
277
311
  model=self.id,
278
- messages=format_messages(messages), # type: ignore
312
+ messages=format_messages(messages, compress_tool_results), # type: ignore
279
313
  **request_kwargs,
280
314
  ):
281
315
  model_response, tool_use = self._parse_provider_response_delta(response, tool_use=tool_use)
@@ -1,9 +1,10 @@
1
1
  from dataclasses import dataclass, field
2
2
  from os import getenv
3
- from typing import List, Optional
3
+ from typing import Any, Dict, List, Optional
4
4
 
5
5
  import httpx
6
6
 
7
+ from agno.exceptions import ModelAuthenticationError
7
8
  from agno.models.openai.like import OpenAILike
8
9
  from agno.utils.log import log_debug
9
10
 
@@ -26,6 +27,22 @@ class CometAPI(OpenAILike):
26
27
  api_key: Optional[str] = field(default_factory=lambda: getenv("COMETAPI_KEY"))
27
28
  base_url: str = "https://api.cometapi.com/v1"
28
29
 
30
+ def _get_client_params(self) -> Dict[str, Any]:
31
+ """
32
+ Returns client parameters for API requests, checking for COMETAPI_KEY.
33
+
34
+ Returns:
35
+ Dict[str, Any]: A dictionary of client parameters for API requests.
36
+ """
37
+ if not self.api_key:
38
+ self.api_key = getenv("COMETAPI_KEY")
39
+ if not self.api_key:
40
+ raise ModelAuthenticationError(
41
+ message="COMETAPI_KEY not set. Please set the COMETAPI_KEY environment variable.",
42
+ model_name=self.name,
43
+ )
44
+ return super()._get_client_params()
45
+
29
46
  def get_available_models(self) -> List[str]:
30
47
  """
31
48
  Fetch available chat models from CometAPI, filtering out non-chat models.
@@ -4,7 +4,7 @@ from typing import Any, Dict, List, Optional, Type, Union
4
4
 
5
5
  from pydantic import BaseModel
6
6
 
7
- from agno.exceptions import ModelProviderError
7
+ from agno.exceptions import ModelAuthenticationError
8
8
  from agno.models.openai.like import OpenAILike
9
9
 
10
10
 
@@ -43,10 +43,9 @@ class DashScope(OpenAILike):
43
43
  if not self.api_key:
44
44
  self.api_key = getenv("DASHSCOPE_API_KEY")
45
45
  if not self.api_key:
46
- raise ModelProviderError(
46
+ raise ModelAuthenticationError(
47
47
  message="DASHSCOPE_API_KEY not set. Please set the DASHSCOPE_API_KEY environment variable.",
48
48
  model_name=self.name,
49
- model_id=self.id,
50
49
  )
51
50
 
52
51
  # Define base client params
@@ -1,7 +1,8 @@
1
1
  from dataclasses import dataclass, field
2
2
  from os import getenv
3
- from typing import Optional
3
+ from typing import Any, Dict, Optional
4
4
 
5
+ from agno.exceptions import ModelAuthenticationError
5
6
  from agno.models.openai.like import OpenAILike
6
7
 
7
8
 
@@ -26,3 +27,19 @@ class DeepInfra(OpenAILike):
26
27
  base_url: str = "https://api.deepinfra.com/v1/openai"
27
28
 
28
29
  supports_native_structured_outputs: bool = False
30
+
31
+ def _get_client_params(self) -> Dict[str, Any]:
32
+ """
33
+ Returns client parameters for API requests, checking for DEEPINFRA_API_KEY.
34
+
35
+ Returns:
36
+ Dict[str, Any]: A dictionary of client parameters for API requests.
37
+ """
38
+ if not self.api_key:
39
+ self.api_key = getenv("DEEPINFRA_API_KEY")
40
+ if not self.api_key:
41
+ raise ModelAuthenticationError(
42
+ message="DEEPINFRA_API_KEY not set. Please set the DEEPINFRA_API_KEY environment variable.",
43
+ model_name=self.name,
44
+ )
45
+ return super()._get_client_params()
@@ -2,8 +2,11 @@ from dataclasses import dataclass, field
2
2
  from os import getenv
3
3
  from typing import Any, Dict, Optional
4
4
 
5
- from agno.exceptions import ModelProviderError
5
+ from agno.exceptions import ModelAuthenticationError
6
+ from agno.models.message import Message
6
7
  from agno.models.openai.like import OpenAILike
8
+ from agno.utils.log import log_warning
9
+ from agno.utils.openai import _format_file_for_message, audio_to_message, images_to_message
7
10
 
8
11
 
9
12
  @dataclass
@@ -35,10 +38,9 @@ class DeepSeek(OpenAILike):
35
38
  self.api_key = getenv("DEEPSEEK_API_KEY")
36
39
  if not self.api_key:
37
40
  # Raise error immediately if key is missing
38
- raise ModelProviderError(
41
+ raise ModelAuthenticationError(
39
42
  message="DEEPSEEK_API_KEY not set. Please set the DEEPSEEK_API_KEY environment variable.",
40
43
  model_name=self.name,
41
- model_id=self.id,
42
44
  )
43
45
 
44
46
  # Define base client params
@@ -59,3 +61,67 @@ class DeepSeek(OpenAILike):
59
61
  if self.client_params:
60
62
  client_params.update(self.client_params)
61
63
  return client_params
64
+
65
+ def _format_message(self, message: Message, compress_tool_results: bool = False) -> Dict[str, Any]:
66
+ """
67
+ Format a message into the format expected by OpenAI.
68
+
69
+ Args:
70
+ message (Message): The message to format.
71
+ compress_tool_results: Whether to compress tool results.
72
+
73
+ Returns:
74
+ Dict[str, Any]: The formatted message.
75
+ """
76
+ tool_result = message.get_content(use_compressed_content=compress_tool_results)
77
+
78
+ message_dict: Dict[str, Any] = {
79
+ "role": self.role_map[message.role] if self.role_map else self.default_role_map[message.role],
80
+ "content": tool_result,
81
+ "name": message.name,
82
+ "tool_call_id": message.tool_call_id,
83
+ "tool_calls": message.tool_calls,
84
+ "reasoning_content": message.reasoning_content,
85
+ }
86
+ message_dict = {k: v for k, v in message_dict.items() if v is not None}
87
+
88
+ # Ignore non-string message content
89
+ # because we assume that the images/audio are already added to the message
90
+ if (message.images is not None and len(message.images) > 0) or (
91
+ message.audio is not None and len(message.audio) > 0
92
+ ):
93
+ # Ignore non-string message content
94
+ # because we assume that the images/audio are already added to the message
95
+ if isinstance(message.content, str):
96
+ message_dict["content"] = [{"type": "text", "text": message.content}]
97
+ if message.images is not None:
98
+ message_dict["content"].extend(images_to_message(images=message.images))
99
+
100
+ if message.audio is not None:
101
+ message_dict["content"].extend(audio_to_message(audio=message.audio))
102
+
103
+ if message.audio_output is not None:
104
+ message_dict["content"] = ""
105
+ message_dict["audio"] = {"id": message.audio_output.id}
106
+
107
+ if message.videos is not None and len(message.videos) > 0:
108
+ log_warning("Video input is currently unsupported.")
109
+
110
+ if message.files is not None:
111
+ # Ensure content is a list of parts
112
+ content = message_dict.get("content")
113
+ if isinstance(content, str): # wrap existing text
114
+ text = content
115
+ message_dict["content"] = [{"type": "text", "text": text}]
116
+ elif content is None:
117
+ message_dict["content"] = []
118
+ # Insert each file part before text parts
119
+ for file in message.files:
120
+ file_part = _format_file_for_message(file)
121
+ if file_part:
122
+ message_dict["content"].insert(0, file_part)
123
+
124
+ # Manually add the content field even if it is None
125
+ if message.content is None:
126
+ message_dict["content"] = ""
127
+ return message_dict
@@ -1,7 +1,8 @@
1
1
  from dataclasses import dataclass, field
2
2
  from os import getenv
3
- from typing import Optional
3
+ from typing import Any, Dict, Optional
4
4
 
5
+ from agno.exceptions import ModelAuthenticationError
5
6
  from agno.models.openai import OpenAILike
6
7
 
7
8
 
@@ -24,3 +25,19 @@ class Fireworks(OpenAILike):
24
25
 
25
26
  api_key: Optional[str] = field(default_factory=lambda: getenv("FIREWORKS_API_KEY"))
26
27
  base_url: str = "https://api.fireworks.ai/inference/v1"
28
+
29
+ def _get_client_params(self) -> Dict[str, Any]:
30
+ """
31
+ Returns client parameters for API requests, checking for FIREWORKS_API_KEY.
32
+
33
+ Returns:
34
+ Dict[str, Any]: A dictionary of client parameters for API requests.
35
+ """
36
+ if not self.api_key:
37
+ self.api_key = getenv("FIREWORKS_API_KEY")
38
+ if not self.api_key:
39
+ raise ModelAuthenticationError(
40
+ message="FIREWORKS_API_KEY not set. Please set the FIREWORKS_API_KEY environment variable.",
41
+ model_name=self.name,
42
+ )
43
+ return super()._get_client_params()