PyPI - agno - Versions diffs - 2.3.12__py3-none-any.whl → 2.3.14__py3-none-any.whl - Mend

agno 2.3.12__py3-none-any.whl → 2.3.14__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

agno/agent/agent.py +1125 -1401
agno/eval/__init__.py +21 -8
agno/knowledge/embedder/azure_openai.py +0 -1
agno/knowledge/embedder/google.py +1 -1
agno/models/anthropic/claude.py +4 -1
agno/models/azure/openai_chat.py +11 -5
agno/models/base.py +8 -4
agno/models/openai/chat.py +0 -2
agno/models/openai/responses.py +2 -2
agno/os/app.py +112 -5
agno/os/auth.py +190 -3
agno/os/config.py +9 -0
agno/os/interfaces/a2a/router.py +619 -9
agno/os/interfaces/a2a/utils.py +31 -32
agno/os/middleware/__init__.py +2 -0
agno/os/middleware/jwt.py +670 -108
agno/os/router.py +0 -1
agno/os/routers/agents/router.py +22 -4
agno/os/routers/agents/schema.py +14 -1
agno/os/routers/teams/router.py +20 -4
agno/os/routers/teams/schema.py +14 -1
agno/os/routers/workflows/router.py +88 -9
agno/os/scopes.py +469 -0
agno/os/utils.py +86 -53
agno/reasoning/anthropic.py +85 -1
agno/reasoning/azure_ai_foundry.py +93 -1
agno/reasoning/deepseek.py +91 -1
agno/reasoning/gemini.py +81 -1
agno/reasoning/groq.py +103 -1
agno/reasoning/manager.py +1244 -0
agno/reasoning/ollama.py +93 -1
agno/reasoning/openai.py +113 -1
agno/reasoning/vertexai.py +85 -1
agno/run/agent.py +11 -0
agno/run/base.py +1 -1
agno/run/team.py +11 -0
agno/session/team.py +0 -3
agno/team/team.py +1204 -1452
agno/tools/postgres.py +1 -1
agno/utils/cryptography.py +22 -0
agno/utils/events.py +69 -2
agno/utils/hooks.py +4 -10
agno/utils/print_response/agent.py +52 -2
agno/utils/print_response/team.py +141 -10
agno/utils/prompts.py +8 -6
agno/utils/string.py +46 -0
agno/utils/team.py +1 -1
agno/vectordb/chroma/chromadb.py +1 -0
agno/vectordb/milvus/milvus.py +32 -3
agno/vectordb/redis/redisdb.py +16 -2
{agno-2.3.12.dist-info → agno-2.3.14.dist-info}/METADATA +3 -2
{agno-2.3.12.dist-info → agno-2.3.14.dist-info}/RECORD +55 -52
{agno-2.3.12.dist-info → agno-2.3.14.dist-info}/WHEEL +0 -0
{agno-2.3.12.dist-info → agno-2.3.14.dist-info}/licenses/LICENSE +0 -0
{agno-2.3.12.dist-info → agno-2.3.14.dist-info}/top_level.txt +0 -0

agno/reasoning/ollama.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from __future__ import annotations
-from typing import List, Optional
+from typing import AsyncIterator, Iterator, List, Optional, Tuple
 from agno.models.base import Model
 from agno.models.message import Message
@@ -65,3 +65,95 @@ async def aget_ollama_reasoning(reasoning_agent: "Agent", messages: List[Message
     return Message(
         role="assistant", content=f"<thinking>\n{reasoning_content}\n</thinking>", reasoning_content=reasoning_content
     )
+def get_ollama_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> Iterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from Ollama model.
+    For reasoning models on Ollama (qwq, deepseek-r1, etc.), we use the main content output as reasoning content.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    reasoning_content: str = ""
+    try:
+        for event in reasoning_agent.run(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Check for reasoning_content attribute first (native reasoning)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                    # Use the main content as reasoning content
+                    elif hasattr(event, "content") and event.content:
+                        reasoning_content += event.content
+                        yield (event.content, None)
+                elif event.event == RunEvent.run_completed:
+                    pass
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+        )
+        yield (None, final_message)
+async def aget_ollama_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> AsyncIterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from Ollama model asynchronously.
+    For reasoning models on Ollama (qwq, deepseek-r1, etc.), we use the main content output as reasoning content.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    reasoning_content: str = ""
+    try:
+        async for event in reasoning_agent.arun(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Check for reasoning_content attribute first (native reasoning)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                    # Use the main content as reasoning content
+                    elif hasattr(event, "content") and event.content:
+                        reasoning_content += event.content
+                        yield (event.content, None)
+                elif event.event == RunEvent.run_completed:
+                    pass
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+        )
+        yield (None, final_message)

agno/reasoning/openai.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from __future__ import annotations
-from typing import List, Optional
+from typing import AsyncIterator, Iterator, List, Optional, Tuple
 from agno.models.base import Model
 from agno.models.message import Message
@@ -84,3 +84,115 @@ async def aget_openai_reasoning(reasoning_agent: "Agent", messages: List[Message
     return Message(
         role="assistant", content=f"<thinking>\n{reasoning_content}\n</thinking>", reasoning_content=reasoning_content
     )
+def get_openai_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> Iterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from OpenAI model.
+    For OpenAI reasoning models, we use the main content output as reasoning content.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    # Update system message role to "system"
+    for message in messages:
+        if message.role == "developer":
+            message.role = "system"
+    reasoning_content: str = ""
+    try:
+        for event in reasoning_agent.run(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Check for reasoning_content attribute first (native reasoning)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                    # Use the main content as reasoning content
+                    elif hasattr(event, "content") and event.content:
+                        reasoning_content += event.content
+                        yield (event.content, None)
+                elif event.event == RunEvent.run_completed:
+                    # Check for reasoning_content at completion (OpenAIResponses with reasoning_summary)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        # If we haven't accumulated any reasoning content yet, use this
+                        if not reasoning_content:
+                            reasoning_content = event.reasoning_content
+                            yield (event.reasoning_content, None)
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+        )
+        yield (None, final_message)
+async def aget_openai_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> AsyncIterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from OpenAI model asynchronously.
+    For OpenAI reasoning models, we use the main content output as reasoning content.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    # Update system message role to "system"
+    for message in messages:
+        if message.role == "developer":
+            message.role = "system"
+    reasoning_content: str = ""
+    try:
+        async for event in reasoning_agent.arun(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Check for reasoning_content attribute first (native reasoning)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                    # Use the main content as reasoning content
+                    elif hasattr(event, "content") and event.content:
+                        reasoning_content += event.content
+                        yield (event.content, None)
+                elif event.event == RunEvent.run_completed:
+                    # Check for reasoning_content at completion (OpenAIResponses with reasoning_summary)
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        # If we haven't accumulated any reasoning content yet, use this
+                        if not reasoning_content:
+                            reasoning_content = event.reasoning_content
+                            yield (event.reasoning_content, None)
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+        )
+        yield (None, final_message)

agno/reasoning/vertexai.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from __future__ import annotations
-from typing import List, Optional
+from typing import AsyncIterator, Iterator, List, Optional, Tuple
 from agno.models.base import Model
 from agno.models.message import Message
@@ -74,3 +74,87 @@ async def aget_vertexai_reasoning(reasoning_agent: "Agent", messages: List[Messa
         reasoning_content=reasoning_content,
         redacted_reasoning_content=redacted_reasoning_content,
     )
+def get_vertexai_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> Iterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from VertexAI Claude model.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    reasoning_content: str = ""
+    redacted_reasoning_content: Optional[str] = None
+    try:
+        for event in reasoning_agent.run(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Stream reasoning content as it arrives
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                elif event.event == RunEvent.run_completed:
+                    pass
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+            redacted_reasoning_content=redacted_reasoning_content,
+        )
+        yield (None, final_message)
+async def aget_vertexai_reasoning_stream(
+    reasoning_agent: "Agent",  # type: ignore  # noqa: F821
+    messages: List[Message],
+) -> AsyncIterator[Tuple[Optional[str], Optional[Message]]]:
+    """
+    Stream reasoning content from VertexAI Claude model asynchronously.
+    Yields:
+        Tuple of (reasoning_content_delta, final_message)
+        - During streaming: (reasoning_content_delta, None)
+        - At the end: (None, final_message)
+    """
+    from agno.run.agent import RunEvent
+    reasoning_content: str = ""
+    redacted_reasoning_content: Optional[str] = None
+    try:
+        async for event in reasoning_agent.arun(input=messages, stream=True, stream_intermediate_steps=True):
+            if hasattr(event, "event"):
+                if event.event == RunEvent.run_content:
+                    # Stream reasoning content as it arrives
+                    if hasattr(event, "reasoning_content") and event.reasoning_content:
+                        reasoning_content += event.reasoning_content
+                        yield (event.reasoning_content, None)
+                elif event.event == RunEvent.run_completed:
+                    pass
+    except Exception as e:
+        logger.warning(f"Reasoning error: {e}")
+        return
+    # Yield final message
+    if reasoning_content:
+        final_message = Message(
+            role="assistant",
+            content=f"<thinking>\n{reasoning_content}\n</thinking>",
+            reasoning_content=reasoning_content,
+            redacted_reasoning_content=redacted_reasoning_content,
+        )
+        yield (None, final_message)

agno/run/agent.py CHANGED Viewed

@@ -156,6 +156,7 @@ class RunEvent(str, Enum):
     reasoning_started = "ReasoningStarted"
     reasoning_step = "ReasoningStep"
+    reasoning_content_delta = "ReasoningContentDelta"
     reasoning_completed = "ReasoningCompleted"
     memory_update_started = "MemoryUpdateStarted"
@@ -373,6 +374,14 @@ class ReasoningStepEvent(BaseAgentRunEvent):
     reasoning_content: str = ""
+@dataclass
+class ReasoningContentDeltaEvent(BaseAgentRunEvent):
+    """Event for streaming reasoning content chunks as they arrive."""
+    event: str = RunEvent.reasoning_content_delta.value
+    reasoning_content: str = ""  # The delta/chunk of reasoning content
 @dataclass
 class ReasoningCompletedEvent(BaseAgentRunEvent):
     event: str = RunEvent.reasoning_completed.value
@@ -442,6 +451,7 @@ RunOutputEvent = Union[
     PostHookCompletedEvent,
     ReasoningStartedEvent,
     ReasoningStepEvent,
+    ReasoningContentDeltaEvent,
     ReasoningCompletedEvent,
     MemoryUpdateStartedEvent,
     MemoryUpdateCompletedEvent,
@@ -474,6 +484,7 @@ RUN_EVENT_TYPE_REGISTRY = {
     RunEvent.post_hook_completed.value: PostHookCompletedEvent,
     RunEvent.reasoning_started.value: ReasoningStartedEvent,
     RunEvent.reasoning_step.value: ReasoningStepEvent,
+    RunEvent.reasoning_content_delta.value: ReasoningContentDeltaEvent,
     RunEvent.reasoning_completed.value: ReasoningCompletedEvent,
     RunEvent.memory_update_started.value: MemoryUpdateStartedEvent,
     RunEvent.memory_update_completed.value: MemoryUpdateCompletedEvent,

agno/run/base.py CHANGED Viewed

@@ -22,7 +22,7 @@ class RunContext:
     knowledge_filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None
     metadata: Optional[Dict[str, Any]] = None
     session_state: Optional[Dict[str, Any]] = None
-    output_schema: Optional[Type[BaseModel]] = None
+    output_schema: Optional[Union[Type[BaseModel], Dict[str, Any]]] = None
 @dataclass

agno/run/team.py CHANGED Viewed

@@ -149,6 +149,7 @@ class TeamRunEvent(str, Enum):
     reasoning_started = "TeamReasoningStarted"
     reasoning_step = "TeamReasoningStep"
+    reasoning_content_delta = "TeamReasoningContentDelta"
     reasoning_completed = "TeamReasoningCompleted"
     memory_update_started = "TeamMemoryUpdateStarted"
@@ -346,6 +347,14 @@ class ReasoningStepEvent(BaseTeamRunEvent):
     reasoning_content: str = ""
+@dataclass
+class ReasoningContentDeltaEvent(BaseTeamRunEvent):
+    """Event for streaming reasoning content chunks as they arrive."""
+    event: str = TeamRunEvent.reasoning_content_delta.value
+    reasoning_content: str = ""  # The delta/chunk of reasoning content
 @dataclass
 class ReasoningCompletedEvent(BaseTeamRunEvent):
     event: str = TeamRunEvent.reasoning_completed.value
@@ -411,6 +420,7 @@ TeamRunOutputEvent = Union[
     PreHookCompletedEvent,
     ReasoningStartedEvent,
     ReasoningStepEvent,
+    ReasoningContentDeltaEvent,
     ReasoningCompletedEvent,
     MemoryUpdateStartedEvent,
     MemoryUpdateCompletedEvent,
@@ -440,6 +450,7 @@ TEAM_RUN_EVENT_TYPE_REGISTRY = {
     TeamRunEvent.post_hook_completed.value: PostHookCompletedEvent,
     TeamRunEvent.reasoning_started.value: ReasoningStartedEvent,
     TeamRunEvent.reasoning_step.value: ReasoningStepEvent,
+    TeamRunEvent.reasoning_content_delta.value: ReasoningContentDeltaEvent,
     TeamRunEvent.reasoning_completed.value: ReasoningCompletedEvent,
     TeamRunEvent.memory_update_started.value: MemoryUpdateStartedEvent,
     TeamRunEvent.memory_update_completed.value: MemoryUpdateCompletedEvent,

agno/session/team.py CHANGED Viewed

@@ -91,10 +91,7 @@ class TeamSession:
     def upsert_run(self, run_response: Union[TeamRunOutput, RunOutput]):
         """Adds a RunOutput, together with some calculated data, to the runs list."""
         messages = run_response.messages
-        if messages is None:
-            return
         # Make message duration None
         for m in messages or []:

agno 2.3.12__py3-none-any.whl → 2.3.14__py3-none-any.whl

agno 2.3.12__py3-none-any.whl → 2.3.14__py3-none-any.whl