agno 2.3.7__py3-none-any.whl → 2.3.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information in this diff is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (71)
  1. agno/agent/agent.py +391 -335
  2. agno/db/mongo/async_mongo.py +0 -24
  3. agno/db/mongo/mongo.py +0 -16
  4. agno/db/mysql/__init__.py +2 -1
  5. agno/db/mysql/async_mysql.py +2888 -0
  6. agno/db/mysql/mysql.py +17 -27
  7. agno/db/mysql/utils.py +139 -6
  8. agno/db/postgres/async_postgres.py +10 -26
  9. agno/db/postgres/postgres.py +7 -25
  10. agno/db/redis/redis.py +0 -4
  11. agno/db/schemas/evals.py +1 -0
  12. agno/db/singlestore/singlestore.py +5 -12
  13. agno/db/sqlite/async_sqlite.py +2 -26
  14. agno/db/sqlite/sqlite.py +0 -20
  15. agno/eval/__init__.py +10 -0
  16. agno/eval/agent_as_judge.py +860 -0
  17. agno/eval/base.py +29 -0
  18. agno/eval/utils.py +2 -1
  19. agno/exceptions.py +7 -0
  20. agno/knowledge/embedder/openai.py +8 -8
  21. agno/knowledge/knowledge.py +1142 -176
  22. agno/media.py +22 -6
  23. agno/models/aws/claude.py +8 -7
  24. agno/models/base.py +160 -11
  25. agno/models/deepseek/deepseek.py +67 -0
  26. agno/models/google/gemini.py +65 -11
  27. agno/models/google/utils.py +22 -0
  28. agno/models/message.py +2 -0
  29. agno/models/openai/chat.py +4 -0
  30. agno/models/openai/responses.py +3 -2
  31. agno/os/app.py +64 -74
  32. agno/os/interfaces/a2a/router.py +3 -4
  33. agno/os/interfaces/a2a/utils.py +1 -1
  34. agno/os/interfaces/agui/router.py +2 -0
  35. agno/os/middleware/jwt.py +8 -6
  36. agno/os/router.py +3 -1607
  37. agno/os/routers/agents/__init__.py +3 -0
  38. agno/os/routers/agents/router.py +581 -0
  39. agno/os/routers/agents/schema.py +261 -0
  40. agno/os/routers/evals/evals.py +26 -6
  41. agno/os/routers/evals/schemas.py +34 -2
  42. agno/os/routers/evals/utils.py +101 -20
  43. agno/os/routers/knowledge/knowledge.py +1 -1
  44. agno/os/routers/teams/__init__.py +3 -0
  45. agno/os/routers/teams/router.py +496 -0
  46. agno/os/routers/teams/schema.py +257 -0
  47. agno/os/routers/workflows/__init__.py +3 -0
  48. agno/os/routers/workflows/router.py +545 -0
  49. agno/os/routers/workflows/schema.py +75 -0
  50. agno/os/schema.py +1 -559
  51. agno/os/utils.py +139 -2
  52. agno/team/team.py +159 -100
  53. agno/tools/file_generation.py +12 -6
  54. agno/tools/firecrawl.py +15 -7
  55. agno/tools/workflow.py +8 -1
  56. agno/utils/hooks.py +64 -5
  57. agno/utils/http.py +2 -2
  58. agno/utils/media.py +11 -1
  59. agno/utils/print_response/agent.py +8 -0
  60. agno/utils/print_response/team.py +8 -0
  61. agno/vectordb/pgvector/pgvector.py +88 -51
  62. agno/workflow/parallel.py +11 -5
  63. agno/workflow/step.py +17 -5
  64. agno/workflow/types.py +38 -2
  65. agno/workflow/workflow.py +12 -4
  66. {agno-2.3.7.dist-info → agno-2.3.9.dist-info}/METADATA +8 -3
  67. {agno-2.3.7.dist-info → agno-2.3.9.dist-info}/RECORD +70 -58
  68. agno/tools/memori.py +0 -339
  69. {agno-2.3.7.dist-info → agno-2.3.9.dist-info}/WHEEL +0 -0
  70. {agno-2.3.7.dist-info → agno-2.3.9.dist-info}/licenses/LICENSE +0 -0
  71. {agno-2.3.7.dist-info → agno-2.3.9.dist-info}/top_level.txt +0 -0
agno/media.py CHANGED
@@ -4,6 +4,8 @@ from uuid import uuid4
4
4
 
5
5
  from pydantic import BaseModel, field_validator, model_validator
6
6
 
7
+ from agno.utils.log import log_error
8
+
7
9
 
8
10
  class Image(BaseModel):
9
11
  """Unified Image class for all use cases (input, output, artifacts)"""
@@ -395,10 +397,20 @@ class File(BaseModel):
395
397
  name: Optional[str] = None,
396
398
  format: Optional[str] = None,
397
399
  ) -> "File":
398
- """Create File from base64 encoded content"""
400
+ """Create File from base64 encoded content or plain text.
401
+
402
+ Handles both base64-encoded binary content and plain text content
403
+ (which is stored as UTF-8 strings for text/* MIME types).
404
+ """
399
405
  import base64
400
406
 
401
- content_bytes = base64.b64decode(base64_content)
407
+ try:
408
+ content_bytes = base64.b64decode(base64_content)
409
+ except Exception:
410
+ # If not valid base64, it might be plain text content (text/csv, text/plain, etc.)
411
+ # which is stored as UTF-8 strings, not base64
412
+ content_bytes = base64_content.encode("utf-8")
413
+
402
414
  return cls(
403
415
  content=content_bytes,
404
416
  id=id,
@@ -413,10 +425,14 @@ class File(BaseModel):
413
425
  import httpx
414
426
 
415
427
  if self.url:
416
- response = httpx.get(self.url)
417
- content = response.content
418
- mime_type = response.headers.get("Content-Type", "").split(";")[0]
419
- return content, mime_type
428
+ try:
429
+ response = httpx.get(self.url)
430
+ content = response.content
431
+ mime_type = response.headers.get("Content-Type", "").split(";")[0]
432
+ return content, mime_type
433
+ except Exception:
434
+ log_error(f"Failed to download file from {self.url}")
435
+ return None
420
436
  else:
421
437
  return None
422
438
 
agno/models/aws/claude.py CHANGED
@@ -7,7 +7,7 @@ from pydantic import BaseModel
7
7
 
8
8
  from agno.models.anthropic import Claude as AnthropicClaude
9
9
  from agno.utils.http import get_default_async_client, get_default_sync_client
10
- from agno.utils.log import log_debug, log_error, log_warning
10
+ from agno.utils.log import log_debug, log_warning
11
11
  from agno.utils.models.claude import format_tools_for_model
12
12
 
13
13
  try:
@@ -70,8 +70,8 @@ class Claude(AnthropicClaude):
70
70
  if self.aws_region:
71
71
  client_params["aws_region"] = self.aws_region
72
72
  else:
73
- self.aws_access_key = self.aws_access_key or getenv("AWS_ACCESS_KEY")
74
- self.aws_secret_key = self.aws_secret_key or getenv("AWS_SECRET_KEY")
73
+ self.aws_access_key = self.aws_access_key or getenv("AWS_ACCESS_KEY_ID") or getenv("AWS_ACCESS_KEY")
74
+ self.aws_secret_key = self.aws_secret_key or getenv("AWS_SECRET_ACCESS_KEY") or getenv("AWS_SECRET_KEY")
75
75
  self.aws_region = self.aws_region or getenv("AWS_REGION")
76
76
 
77
77
  client_params = {
@@ -79,10 +79,11 @@ class Claude(AnthropicClaude):
79
79
  "aws_access_key": self.aws_access_key,
80
80
  "aws_region": self.aws_region,
81
81
  }
82
- if not (self.aws_access_key or (self.aws_access_key and self.aws_secret_key)):
83
- log_error(
84
- "AWS credentials not found. Please either set the AWS_BEDROCK_API_KEY or AWS_ACCESS_KEY and AWS_SECRET_KEY environment variables."
85
- )
82
+
83
+ if not (self.api_key or (self.aws_access_key and self.aws_secret_key)):
84
+ log_warning(
85
+ "AWS credentials not found. Please set AWS_BEDROCK_API_KEY or AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY environment variables or provide a boto3 session."
86
+ )
86
87
 
87
88
  if self.timeout is not None:
88
89
  client_params["timeout"] = self.timeout
agno/models/base.py CHANGED
@@ -5,7 +5,7 @@ from abc import ABC, abstractmethod
5
5
  from dataclasses import dataclass, field
6
6
  from hashlib import md5
7
7
  from pathlib import Path
8
- from time import time
8
+ from time import sleep, time
9
9
  from types import AsyncGeneratorType, GeneratorType
10
10
  from typing import (
11
11
  Any,
@@ -24,7 +24,7 @@ from uuid import uuid4
24
24
 
25
25
  from pydantic import BaseModel
26
26
 
27
- from agno.exceptions import AgentRunException
27
+ from agno.exceptions import AgentRunException, ModelProviderError, RetryableModelProviderError
28
28
  from agno.media import Audio, File, Image, Video
29
29
  from agno.models.message import Citations, Message
30
30
  from agno.models.metrics import Metrics
@@ -146,15 +146,164 @@ class Model(ABC):
146
146
  cache_ttl: Optional[int] = None
147
147
  cache_dir: Optional[str] = None
148
148
 
149
+ # Retry configuration for model provider errors
150
+ # Number of retries to attempt when a ModelProviderError occurs
151
+ retries: int = 0
152
+ # Delay between retries (in seconds)
153
+ delay_between_retries: int = 1
154
+ # Exponential backoff: if True, the delay between retries is doubled each time
155
+ exponential_backoff: bool = False
156
+ # Enable retrying a model invocation once with a guidance message.
157
+ # This is useful for known errors avoidable with extra instructions.
158
+ retry_with_guidance: bool = True
159
+
149
160
  def __post_init__(self):
150
161
  if self.provider is None and self.name is not None:
151
162
  self.provider = f"{self.name} ({self.id})"
152
163
 
164
+ def _get_retry_delay(self, attempt: int) -> float:
165
+ """Calculate the delay before the next retry attempt."""
166
+ if self.exponential_backoff:
167
+ return self.delay_between_retries * (2**attempt)
168
+ return self.delay_between_retries
169
+
170
+ def _invoke_with_retry(self, **kwargs) -> ModelResponse:
171
+ """
172
+ Invoke the model with retry logic for ModelProviderError.
173
+
174
+ This method wraps the invoke() call and retries on ModelProviderError
175
+ with optional exponential backoff.
176
+ """
177
+ last_exception: Optional[ModelProviderError] = None
178
+
179
+ for attempt in range(self.retries + 1):
180
+ try:
181
+ return self.invoke(**kwargs)
182
+ except ModelProviderError as e:
183
+ last_exception = e
184
+ if attempt < self.retries:
185
+ delay = self._get_retry_delay(attempt)
186
+ log_warning(
187
+ f"Model provider error (attempt {attempt + 1}/{self.retries + 1}): {e}. Retrying in {delay}s..."
188
+ )
189
+ sleep(delay)
190
+ else:
191
+ log_error(f"Model provider error after {self.retries + 1} attempts: {e}")
192
+ except RetryableModelProviderError as e:
193
+ kwargs["messages"].append(Message(role="user", content=e.retry_guidance_message, temporary=True))
194
+ return self._invoke_with_retry(**kwargs, retrying_with_guidance=True)
195
+
196
+ # If we've exhausted all retries, raise the last exception
197
+ raise last_exception # type: ignore
198
+
199
+ async def _ainvoke_with_retry(self, **kwargs) -> ModelResponse:
200
+ """
201
+ Asynchronously invoke the model with retry logic for ModelProviderError.
202
+
203
+ This method wraps the ainvoke() call and retries on ModelProviderError
204
+ with optional exponential backoff.
205
+ """
206
+ last_exception: Optional[ModelProviderError] = None
207
+
208
+ for attempt in range(self.retries + 1):
209
+ try:
210
+ return await self.ainvoke(**kwargs)
211
+ except ModelProviderError as e:
212
+ last_exception = e
213
+ if attempt < self.retries:
214
+ delay = self._get_retry_delay(attempt)
215
+ log_warning(
216
+ f"Model provider error (attempt {attempt + 1}/{self.retries + 1}): {e}. Retrying in {delay}s..."
217
+ )
218
+ await asyncio.sleep(delay)
219
+ else:
220
+ log_error(f"Model provider error after {self.retries + 1} attempts: {e}")
221
+ except RetryableModelProviderError as e:
222
+ kwargs["messages"].append(Message(role="user", content=e.retry_guidance_message, temporary=True))
223
+ return await self._ainvoke_with_retry(**kwargs, retrying_with_guidance=True)
224
+
225
+ # If we've exhausted all retries, raise the last exception
226
+ raise last_exception # type: ignore
227
+
228
+ def _invoke_stream_with_retry(self, **kwargs) -> Iterator[ModelResponse]:
229
+ """
230
+ Invoke the model stream with retry logic for ModelProviderError.
231
+
232
+ This method wraps the invoke_stream() call and retries on ModelProviderError
233
+ with optional exponential backoff. Note that retries restart the entire stream.
234
+ """
235
+ last_exception: Optional[ModelProviderError] = None
236
+
237
+ for attempt in range(self.retries + 1):
238
+ try:
239
+ yield from self.invoke_stream(**kwargs)
240
+ return # Success, exit the retry loop
241
+ except ModelProviderError as e:
242
+ last_exception = e
243
+ if attempt < self.retries:
244
+ delay = self._get_retry_delay(attempt)
245
+ log_warning(
246
+ f"Model provider error during stream (attempt {attempt + 1}/{self.retries + 1}): {e}. "
247
+ f"Retrying in {delay}s..."
248
+ )
249
+ sleep(delay)
250
+ else:
251
+ log_error(f"Model provider error after {self.retries + 1} attempts: {e}")
252
+ except RetryableModelProviderError as e:
253
+ kwargs["messages"].append(Message(role="user", content=e.retry_guidance_message, temporary=True))
254
+ yield from self._invoke_stream_with_retry(**kwargs, retrying_with_guidance=True)
255
+ return # Success, exit after regeneration
256
+
257
+ # If we've exhausted all retries, raise the last exception
258
+ raise last_exception # type: ignore
259
+
260
+ async def _ainvoke_stream_with_retry(self, **kwargs) -> AsyncIterator[ModelResponse]:
261
+ """
262
+ Asynchronously invoke the model stream with retry logic for ModelProviderError.
263
+
264
+ This method wraps the ainvoke_stream() call and retries on ModelProviderError
265
+ with optional exponential backoff. Note that retries restart the entire stream.
266
+ """
267
+ last_exception: Optional[ModelProviderError] = None
268
+
269
+ for attempt in range(self.retries + 1):
270
+ try:
271
+ async for response in self.ainvoke_stream(**kwargs):
272
+ yield response
273
+ return # Success, exit the retry loop
274
+ except ModelProviderError as e:
275
+ last_exception = e
276
+ if attempt < self.retries:
277
+ delay = self._get_retry_delay(attempt)
278
+ log_warning(
279
+ f"Model provider error during stream (attempt {attempt + 1}/{self.retries + 1}): {e}. "
280
+ f"Retrying in {delay}s..."
281
+ )
282
+ await asyncio.sleep(delay)
283
+ else:
284
+ log_error(f"Model provider error after {self.retries + 1} attempts: {e}")
285
+ except RetryableModelProviderError as e:
286
+ kwargs["messages"].append(Message(role="user", content=e.retry_guidance_message, temporary=True))
287
+ async for response in self._ainvoke_stream_with_retry(**kwargs, retrying_with_guidance=True):
288
+ yield response
289
+ return # Success, exit after regeneration
290
+
291
+ # If we've exhausted all retries, raise the last exception
292
+ raise last_exception # type: ignore
293
+
153
294
  def to_dict(self) -> Dict[str, Any]:
154
295
  fields = {"name", "id", "provider"}
155
296
  _dict = {field: getattr(self, field) for field in fields if getattr(self, field) is not None}
156
297
  return _dict
157
298
 
299
+ def _remove_temporarys(self, messages: List[Message]) -> None:
300
+ """Remove temporal messages from the given list.
301
+
302
+ Args:
303
+ messages: The list of messages to filter (modified in place).
304
+ """
305
+ messages[:] = [m for m in messages if not m.temporary]
306
+
158
307
  def get_provider(self) -> str:
159
308
  return self.provider or self.name or self.__class__.__name__
160
309
 
@@ -734,8 +883,8 @@ class Model(ABC):
734
883
  Returns:
735
884
  Tuple[Message, bool]: (assistant_message, should_continue)
736
885
  """
737
- # Generate response
738
- provider_response = self.invoke(
886
+ # Generate response with retry logic for ModelProviderError
887
+ provider_response = self._invoke_with_retry(
739
888
  assistant_message=assistant_message,
740
889
  messages=messages,
741
890
  response_format=response_format,
@@ -791,8 +940,8 @@ class Model(ABC):
791
940
  Returns:
792
941
  Tuple[Message, bool]: (assistant_message, should_continue)
793
942
  """
794
- # Generate response
795
- provider_response = await self.ainvoke(
943
+ # Generate response with retry logic for ModelProviderError
944
+ provider_response = await self._ainvoke_with_retry(
796
945
  messages=messages,
797
946
  response_format=response_format,
798
947
  tools=tools,
@@ -913,10 +1062,10 @@ class Model(ABC):
913
1062
  compress_tool_results: bool = False,
914
1063
  ) -> Iterator[ModelResponse]:
915
1064
  """
916
- Process a streaming response from the model.
1065
+ Process a streaming response from the model with retry logic for ModelProviderError.
917
1066
  """
918
1067
 
919
- for response_delta in self.invoke_stream(
1068
+ for response_delta in self._invoke_stream_with_retry(
920
1069
  messages=messages,
921
1070
  assistant_message=assistant_message,
922
1071
  response_format=response_format,
@@ -1132,9 +1281,9 @@ class Model(ABC):
1132
1281
  compress_tool_results: bool = False,
1133
1282
  ) -> AsyncIterator[ModelResponse]:
1134
1283
  """
1135
- Process a streaming response from the model.
1284
+ Process a streaming response from the model with retry logic for ModelProviderError.
1136
1285
  """
1137
- async for response_delta in self.ainvoke_stream(
1286
+ async for response_delta in self._ainvoke_stream_with_retry(
1138
1287
  messages=messages,
1139
1288
  assistant_message=assistant_message,
1140
1289
  response_format=response_format,
@@ -1142,7 +1291,7 @@ class Model(ABC):
1142
1291
  tool_choice=tool_choice or self._tool_choice,
1143
1292
  run_response=run_response,
1144
1293
  compress_tool_results=compress_tool_results,
1145
- ): # type: ignore
1294
+ ):
1146
1295
  for model_response_delta in self._populate_stream_data(
1147
1296
  stream_data=stream_data,
1148
1297
  model_response_delta=response_delta,
@@ -3,7 +3,10 @@ from os import getenv
3
3
  from typing import Any, Dict, Optional
4
4
 
5
5
  from agno.exceptions import ModelAuthenticationError
6
+ from agno.models.message import Message
6
7
  from agno.models.openai.like import OpenAILike
8
+ from agno.utils.log import log_warning
9
+ from agno.utils.openai import _format_file_for_message, audio_to_message, images_to_message
7
10
 
8
11
 
9
12
  @dataclass
@@ -58,3 +61,67 @@ class DeepSeek(OpenAILike):
58
61
  if self.client_params:
59
62
  client_params.update(self.client_params)
60
63
  return client_params
64
+
65
+ def _format_message(self, message: Message, compress_tool_results: bool = False) -> Dict[str, Any]:
66
+ """
67
+ Format a message into the format expected by OpenAI.
68
+
69
+ Args:
70
+ message (Message): The message to format.
71
+ compress_tool_results: Whether to compress tool results.
72
+
73
+ Returns:
74
+ Dict[str, Any]: The formatted message.
75
+ """
76
+ tool_result = message.get_content(use_compressed_content=compress_tool_results)
77
+
78
+ message_dict: Dict[str, Any] = {
79
+ "role": self.role_map[message.role] if self.role_map else self.default_role_map[message.role],
80
+ "content": tool_result,
81
+ "name": message.name,
82
+ "tool_call_id": message.tool_call_id,
83
+ "tool_calls": message.tool_calls,
84
+ "reasoning_content": message.reasoning_content,
85
+ }
86
+ message_dict = {k: v for k, v in message_dict.items() if v is not None}
87
+
88
+ # Ignore non-string message content
89
+ # because we assume that the images/audio are already added to the message
90
+ if (message.images is not None and len(message.images) > 0) or (
91
+ message.audio is not None and len(message.audio) > 0
92
+ ):
93
+ # Ignore non-string message content
94
+ # because we assume that the images/audio are already added to the message
95
+ if isinstance(message.content, str):
96
+ message_dict["content"] = [{"type": "text", "text": message.content}]
97
+ if message.images is not None:
98
+ message_dict["content"].extend(images_to_message(images=message.images))
99
+
100
+ if message.audio is not None:
101
+ message_dict["content"].extend(audio_to_message(audio=message.audio))
102
+
103
+ if message.audio_output is not None:
104
+ message_dict["content"] = ""
105
+ message_dict["audio"] = {"id": message.audio_output.id}
106
+
107
+ if message.videos is not None and len(message.videos) > 0:
108
+ log_warning("Video input is currently unsupported.")
109
+
110
+ if message.files is not None:
111
+ # Ensure content is a list of parts
112
+ content = message_dict.get("content")
113
+ if isinstance(content, str): # wrap existing text
114
+ text = content
115
+ message_dict["content"] = [{"type": "text", "text": text}]
116
+ elif content is None:
117
+ message_dict["content"] = []
118
+ # Insert each file part before text parts
119
+ for file in message.files:
120
+ file_part = _format_file_for_message(file)
121
+ if file_part:
122
+ message_dict["content"].insert(0, file_part)
123
+
124
+ # Manually add the content field even if it is None
125
+ if message.content is None:
126
+ message_dict["content"] = ""
127
+ return message_dict
@@ -13,7 +13,8 @@ from pydantic import BaseModel
13
13
 
14
14
  from agno.exceptions import ModelProviderError
15
15
  from agno.media import Audio, File, Image, Video
16
- from agno.models.base import Model
16
+ from agno.models.base import Model, RetryableModelProviderError
17
+ from agno.models.google.utils import MALFORMED_FUNCTION_CALL_GUIDANCE, GeminiFinishReason
17
18
  from agno.models.message import Citations, Message, UrlCitation
18
19
  from agno.models.metrics import Metrics
19
20
  from agno.models.response import ModelResponse
@@ -317,6 +318,7 @@ class Gemini(Model):
317
318
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
318
319
  run_response: Optional[RunOutput] = None,
319
320
  compress_tool_results: bool = False,
321
+ retrying_with_guidance: bool = False,
320
322
  ) -> ModelResponse:
321
323
  """
322
324
  Invokes the model with a list of messages and returns the response.
@@ -337,7 +339,13 @@ class Gemini(Model):
337
339
  )
338
340
  assistant_message.metrics.stop_timer()
339
341
 
340
- model_response = self._parse_provider_response(provider_response, response_format=response_format)
342
+ model_response = self._parse_provider_response(
343
+ provider_response, response_format=response_format, retrying_with_guidance=retrying_with_guidance
344
+ )
345
+
346
+ # If we were retrying the invoke with guidance, remove the guidance message
347
+ if retrying_with_guidance is True:
348
+ self._remove_temporarys(messages)
341
349
 
342
350
  return model_response
343
351
 
@@ -350,6 +358,8 @@ class Gemini(Model):
350
358
  model_name=self.name,
351
359
  model_id=self.id,
352
360
  ) from e
361
+ except RetryableModelProviderError:
362
+ raise
353
363
  except Exception as e:
354
364
  log_error(f"Unknown error from Gemini API: {e}")
355
365
  raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
@@ -363,6 +373,7 @@ class Gemini(Model):
363
373
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
364
374
  run_response: Optional[RunOutput] = None,
365
375
  compress_tool_results: bool = False,
376
+ retrying_with_guidance: bool = False,
366
377
  ) -> Iterator[ModelResponse]:
367
378
  """
368
379
  Invokes the model with a list of messages and returns the response as a stream.
@@ -382,7 +393,11 @@ class Gemini(Model):
382
393
  contents=formatted_messages,
383
394
  **request_kwargs,
384
395
  ):
385
- yield self._parse_provider_response_delta(response)
396
+ yield self._parse_provider_response_delta(response, retrying_with_guidance=retrying_with_guidance)
397
+
398
+ # If we were retrying the invoke with guidance, remove the guidance message
399
+ if retrying_with_guidance is True:
400
+ self._remove_temporarys(messages)
386
401
 
387
402
  assistant_message.metrics.stop_timer()
388
403
 
@@ -394,6 +409,8 @@ class Gemini(Model):
394
409
  model_name=self.name,
395
410
  model_id=self.id,
396
411
  ) from e
412
+ except RetryableModelProviderError:
413
+ raise
397
414
  except Exception as e:
398
415
  log_error(f"Unknown error from Gemini API: {e}")
399
416
  raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
@@ -407,6 +424,7 @@ class Gemini(Model):
407
424
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
408
425
  run_response: Optional[RunOutput] = None,
409
426
  compress_tool_results: bool = False,
427
+ retrying_with_guidance: bool = False,
410
428
  ) -> ModelResponse:
411
429
  """
412
430
  Invokes the model with a list of messages and returns the response.
@@ -429,7 +447,13 @@ class Gemini(Model):
429
447
  )
430
448
  assistant_message.metrics.stop_timer()
431
449
 
432
- model_response = self._parse_provider_response(provider_response, response_format=response_format)
450
+ model_response = self._parse_provider_response(
451
+ provider_response, response_format=response_format, retrying_with_guidance=retrying_with_guidance
452
+ )
453
+
454
+ # If we were retrying the invoke with guidance, remove the guidance message
455
+ if retrying_with_guidance is True:
456
+ self._remove_temporarys(messages)
433
457
 
434
458
  return model_response
435
459
 
@@ -441,6 +465,8 @@ class Gemini(Model):
441
465
  model_name=self.name,
442
466
  model_id=self.id,
443
467
  ) from e
468
+ except RetryableModelProviderError:
469
+ raise
444
470
  except Exception as e:
445
471
  log_error(f"Unknown error from Gemini API: {e}")
446
472
  raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
@@ -454,6 +480,7 @@ class Gemini(Model):
454
480
  tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
455
481
  run_response: Optional[RunOutput] = None,
456
482
  compress_tool_results: bool = False,
483
+ retrying_with_guidance: bool = False,
457
484
  ) -> AsyncIterator[ModelResponse]:
458
485
  """
459
486
  Invokes the model with a list of messages and returns the response as a stream.
@@ -476,7 +503,11 @@ class Gemini(Model):
476
503
  **request_kwargs,
477
504
  )
478
505
  async for chunk in async_stream:
479
- yield self._parse_provider_response_delta(chunk)
506
+ yield self._parse_provider_response_delta(chunk, retrying_with_guidance=retrying_with_guidance)
507
+
508
+ # If we were retrying the invoke with guidance, remove the guidance message
509
+ if retrying_with_guidance is True:
510
+ self._remove_temporarys(messages)
480
511
 
481
512
  assistant_message.metrics.stop_timer()
482
513
 
@@ -488,6 +519,8 @@ class Gemini(Model):
488
519
  model_name=self.name,
489
520
  model_id=self.id,
490
521
  ) from e
522
+ except RetryableModelProviderError:
523
+ raise
491
524
  except Exception as e:
492
525
  log_error(f"Unknown error from Gemini API: {e}")
493
526
  raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
@@ -863,10 +896,10 @@ class Gemini(Model):
863
896
 
864
897
  def _parse_provider_response(self, response: GenerateContentResponse, **kwargs) -> ModelResponse:
865
898
  """
866
- Parse the OpenAI response into a ModelResponse.
899
+ Parse the Gemini response into a ModelResponse.
867
900
 
868
901
  Args:
869
- response: Raw response from OpenAI
902
+ response: Raw response from Gemini
870
903
 
871
904
  Returns:
872
905
  ModelResponse: Parsed response data
@@ -875,8 +908,20 @@ class Gemini(Model):
875
908
 
876
909
  # Get response message
877
910
  response_message = Content(role="model", parts=[])
878
- if response.candidates and response.candidates[0].content:
879
- response_message = response.candidates[0].content
911
+ if response.candidates and len(response.candidates) > 0:
912
+ candidate = response.candidates[0]
913
+
914
+ # Raise if the request failed because of a malformed function call
915
+ if hasattr(candidate, "finish_reason") and candidate.finish_reason:
916
+ if candidate.finish_reason == GeminiFinishReason.MALFORMED_FUNCTION_CALL.value:
917
+ # We only want to raise errors that trigger regeneration attempts once
918
+ if kwargs.get("retrying_with_guidance") is True:
919
+ pass
920
+ if self.retry_with_guidance:
921
+ raise RetryableModelProviderError(retry_guidance_message=MALFORMED_FUNCTION_CALL_GUIDANCE)
922
+
923
+ if candidate.content:
924
+ response_message = candidate.content
880
925
 
881
926
  # Add role
882
927
  if response_message.role is not None:
@@ -1019,11 +1064,20 @@ class Gemini(Model):
1019
1064
 
1020
1065
  return model_response
1021
1066
 
1022
- def _parse_provider_response_delta(self, response_delta: GenerateContentResponse) -> ModelResponse:
1067
+ def _parse_provider_response_delta(self, response_delta: GenerateContentResponse, **kwargs) -> ModelResponse:
1023
1068
  model_response = ModelResponse()
1024
1069
 
1025
1070
  if response_delta.candidates and len(response_delta.candidates) > 0:
1026
- candidate_content = response_delta.candidates[0].content
1071
+ candidate = response_delta.candidates[0]
1072
+ candidate_content = candidate.content
1073
+
1074
+ # Raise if the request failed because of a malformed function call
1075
+ if hasattr(candidate, "finish_reason") and candidate.finish_reason:
1076
+ if candidate.finish_reason == GeminiFinishReason.MALFORMED_FUNCTION_CALL.value:
1077
+ if kwargs.get("retrying_with_guidance") is True:
1078
+ pass
1079
+ raise RetryableModelProviderError(retry_guidance_message=MALFORMED_FUNCTION_CALL_GUIDANCE)
1080
+
1027
1081
  response_message: Content = Content(role="model", parts=[])
1028
1082
  if candidate_content is not None:
1029
1083
  response_message = candidate_content
@@ -0,0 +1,22 @@
1
+ from enum import Enum
2
+
3
+
4
+ class GeminiFinishReason(Enum):
5
+ """Gemini API finish reasons"""
6
+
7
+ STOP = "STOP"
8
+ MAX_TOKENS = "MAX_TOKENS"
9
+ SAFETY = "SAFETY"
10
+ RECITATION = "RECITATION"
11
+ MALFORMED_FUNCTION_CALL = "MALFORMED_FUNCTION_CALL"
12
+ OTHER = "OTHER"
13
+
14
+
15
+ # Guidance message used to retry a Gemini invocation after a MALFORMED_FUNCTION_CALL error
16
+ MALFORMED_FUNCTION_CALL_GUIDANCE = """The previous function call was malformed. Please try again with a valid function call.
17
+
18
+ Guidelines:
19
+ - Generate the function call JSON directly, do not generate code
20
+ - Use the function name exactly as defined (no namespace prefixes like 'default_api.')
21
+ - Ensure all required parameters are provided with correct types
22
+ """
agno/models/message.py CHANGED
@@ -112,6 +112,8 @@ class Message(BaseModel):
112
112
  references: Optional[MessageReferences] = None
113
113
  # The Unix timestamp the message was created.
114
114
  created_at: int = Field(default_factory=lambda: int(time()))
115
+ # When True, the message will be sent to the Model but not persisted afterwards.
116
+ temporary: bool = False
115
117
 
116
118
  model_config = ConfigDict(extra="allow", populate_by_name=True, arbitrary_types_allowed=True)
117
119
 
@@ -814,6 +814,8 @@ class OpenAIChat(Model):
814
814
 
815
815
  if hasattr(response_message, "reasoning_content") and response_message.reasoning_content is not None: # type: ignore
816
816
  model_response.reasoning_content = response_message.reasoning_content # type: ignore
817
+ elif hasattr(response_message, "reasoning") and response_message.reasoning is not None: # type: ignore
818
+ model_response.reasoning_content = response_message.reasoning # type: ignore
817
819
 
818
820
  if response.usage is not None:
819
821
  model_response.response_usage = self._get_metrics(response.usage)
@@ -846,6 +848,8 @@ class OpenAIChat(Model):
846
848
 
847
849
  if hasattr(choice_delta, "reasoning_content") and choice_delta.reasoning_content is not None:
848
850
  model_response.reasoning_content = choice_delta.reasoning_content
851
+ elif hasattr(choice_delta, "reasoning") and choice_delta.reasoning is not None:
852
+ model_response.reasoning_content = choice_delta.reasoning
849
853
 
850
854
  # Add audio if present
851
855
  if hasattr(choice_delta, "audio") and choice_delta.audio is not None:
@@ -307,6 +307,8 @@ class OpenAIResponses(Model):
307
307
 
308
308
  def _upload_file(self, file: File) -> Optional[str]:
309
309
  """Upload a file to the OpenAI vector database."""
310
+ from pathlib import Path
311
+ from urllib.parse import urlparse
310
312
 
311
313
  if file.url is not None:
312
314
  file_content_tuple = file.file_url_content
@@ -314,13 +316,12 @@ class OpenAIResponses(Model):
314
316
  file_content = file_content_tuple[0]
315
317
  else:
316
318
  return None
317
- file_name = file.url.split("/")[-1]
319
+ file_name = Path(urlparse(file.url).path).name or "file"
318
320
  file_tuple = (file_name, file_content)
319
321
  result = self.get_client().files.create(file=file_tuple, purpose="assistants")
320
322
  return result.id
321
323
  elif file.filepath is not None:
322
324
  import mimetypes
323
- from pathlib import Path
324
325
 
325
326
  file_path = file.filepath if isinstance(file.filepath, Path) else Path(file.filepath)
326
327
  if file_path.exists() and file_path.is_file():