agno 2.2.13__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agno/__init__.py +8 -0
- agno/agent/__init__.py +51 -0
- agno/agent/agent.py +10405 -0
- agno/api/__init__.py +0 -0
- agno/api/agent.py +28 -0
- agno/api/api.py +40 -0
- agno/api/evals.py +22 -0
- agno/api/os.py +17 -0
- agno/api/routes.py +13 -0
- agno/api/schemas/__init__.py +9 -0
- agno/api/schemas/agent.py +16 -0
- agno/api/schemas/evals.py +16 -0
- agno/api/schemas/os.py +14 -0
- agno/api/schemas/response.py +6 -0
- agno/api/schemas/team.py +16 -0
- agno/api/schemas/utils.py +21 -0
- agno/api/schemas/workflows.py +16 -0
- agno/api/settings.py +53 -0
- agno/api/team.py +30 -0
- agno/api/workflow.py +28 -0
- agno/cloud/aws/base.py +214 -0
- agno/cloud/aws/s3/__init__.py +2 -0
- agno/cloud/aws/s3/api_client.py +43 -0
- agno/cloud/aws/s3/bucket.py +195 -0
- agno/cloud/aws/s3/object.py +57 -0
- agno/culture/__init__.py +3 -0
- agno/culture/manager.py +956 -0
- agno/db/__init__.py +24 -0
- agno/db/async_postgres/__init__.py +3 -0
- agno/db/base.py +598 -0
- agno/db/dynamo/__init__.py +3 -0
- agno/db/dynamo/dynamo.py +2042 -0
- agno/db/dynamo/schemas.py +314 -0
- agno/db/dynamo/utils.py +743 -0
- agno/db/firestore/__init__.py +3 -0
- agno/db/firestore/firestore.py +1795 -0
- agno/db/firestore/schemas.py +140 -0
- agno/db/firestore/utils.py +376 -0
- agno/db/gcs_json/__init__.py +3 -0
- agno/db/gcs_json/gcs_json_db.py +1335 -0
- agno/db/gcs_json/utils.py +228 -0
- agno/db/in_memory/__init__.py +3 -0
- agno/db/in_memory/in_memory_db.py +1160 -0
- agno/db/in_memory/utils.py +230 -0
- agno/db/json/__init__.py +3 -0
- agno/db/json/json_db.py +1328 -0
- agno/db/json/utils.py +230 -0
- agno/db/migrations/__init__.py +0 -0
- agno/db/migrations/v1_to_v2.py +635 -0
- agno/db/mongo/__init__.py +17 -0
- agno/db/mongo/async_mongo.py +2026 -0
- agno/db/mongo/mongo.py +1982 -0
- agno/db/mongo/schemas.py +87 -0
- agno/db/mongo/utils.py +259 -0
- agno/db/mysql/__init__.py +3 -0
- agno/db/mysql/mysql.py +2308 -0
- agno/db/mysql/schemas.py +138 -0
- agno/db/mysql/utils.py +355 -0
- agno/db/postgres/__init__.py +4 -0
- agno/db/postgres/async_postgres.py +1927 -0
- agno/db/postgres/postgres.py +2260 -0
- agno/db/postgres/schemas.py +139 -0
- agno/db/postgres/utils.py +442 -0
- agno/db/redis/__init__.py +3 -0
- agno/db/redis/redis.py +1660 -0
- agno/db/redis/schemas.py +123 -0
- agno/db/redis/utils.py +346 -0
- agno/db/schemas/__init__.py +4 -0
- agno/db/schemas/culture.py +120 -0
- agno/db/schemas/evals.py +33 -0
- agno/db/schemas/knowledge.py +40 -0
- agno/db/schemas/memory.py +46 -0
- agno/db/schemas/metrics.py +0 -0
- agno/db/singlestore/__init__.py +3 -0
- agno/db/singlestore/schemas.py +130 -0
- agno/db/singlestore/singlestore.py +2272 -0
- agno/db/singlestore/utils.py +384 -0
- agno/db/sqlite/__init__.py +4 -0
- agno/db/sqlite/async_sqlite.py +2293 -0
- agno/db/sqlite/schemas.py +133 -0
- agno/db/sqlite/sqlite.py +2288 -0
- agno/db/sqlite/utils.py +431 -0
- agno/db/surrealdb/__init__.py +3 -0
- agno/db/surrealdb/metrics.py +292 -0
- agno/db/surrealdb/models.py +309 -0
- agno/db/surrealdb/queries.py +71 -0
- agno/db/surrealdb/surrealdb.py +1353 -0
- agno/db/surrealdb/utils.py +147 -0
- agno/db/utils.py +116 -0
- agno/debug.py +18 -0
- agno/eval/__init__.py +14 -0
- agno/eval/accuracy.py +834 -0
- agno/eval/performance.py +773 -0
- agno/eval/reliability.py +306 -0
- agno/eval/utils.py +119 -0
- agno/exceptions.py +161 -0
- agno/filters.py +354 -0
- agno/guardrails/__init__.py +6 -0
- agno/guardrails/base.py +19 -0
- agno/guardrails/openai.py +144 -0
- agno/guardrails/pii.py +94 -0
- agno/guardrails/prompt_injection.py +52 -0
- agno/integrations/__init__.py +0 -0
- agno/integrations/discord/__init__.py +3 -0
- agno/integrations/discord/client.py +203 -0
- agno/knowledge/__init__.py +5 -0
- agno/knowledge/chunking/__init__.py +0 -0
- agno/knowledge/chunking/agentic.py +79 -0
- agno/knowledge/chunking/document.py +91 -0
- agno/knowledge/chunking/fixed.py +57 -0
- agno/knowledge/chunking/markdown.py +151 -0
- agno/knowledge/chunking/recursive.py +63 -0
- agno/knowledge/chunking/row.py +39 -0
- agno/knowledge/chunking/semantic.py +86 -0
- agno/knowledge/chunking/strategy.py +165 -0
- agno/knowledge/content.py +74 -0
- agno/knowledge/document/__init__.py +5 -0
- agno/knowledge/document/base.py +58 -0
- agno/knowledge/embedder/__init__.py +5 -0
- agno/knowledge/embedder/aws_bedrock.py +343 -0
- agno/knowledge/embedder/azure_openai.py +210 -0
- agno/knowledge/embedder/base.py +23 -0
- agno/knowledge/embedder/cohere.py +323 -0
- agno/knowledge/embedder/fastembed.py +62 -0
- agno/knowledge/embedder/fireworks.py +13 -0
- agno/knowledge/embedder/google.py +258 -0
- agno/knowledge/embedder/huggingface.py +94 -0
- agno/knowledge/embedder/jina.py +182 -0
- agno/knowledge/embedder/langdb.py +22 -0
- agno/knowledge/embedder/mistral.py +206 -0
- agno/knowledge/embedder/nebius.py +13 -0
- agno/knowledge/embedder/ollama.py +154 -0
- agno/knowledge/embedder/openai.py +195 -0
- agno/knowledge/embedder/sentence_transformer.py +63 -0
- agno/knowledge/embedder/together.py +13 -0
- agno/knowledge/embedder/vllm.py +262 -0
- agno/knowledge/embedder/voyageai.py +165 -0
- agno/knowledge/knowledge.py +1988 -0
- agno/knowledge/reader/__init__.py +7 -0
- agno/knowledge/reader/arxiv_reader.py +81 -0
- agno/knowledge/reader/base.py +95 -0
- agno/knowledge/reader/csv_reader.py +166 -0
- agno/knowledge/reader/docx_reader.py +82 -0
- agno/knowledge/reader/field_labeled_csv_reader.py +292 -0
- agno/knowledge/reader/firecrawl_reader.py +201 -0
- agno/knowledge/reader/json_reader.py +87 -0
- agno/knowledge/reader/markdown_reader.py +137 -0
- agno/knowledge/reader/pdf_reader.py +431 -0
- agno/knowledge/reader/pptx_reader.py +101 -0
- agno/knowledge/reader/reader_factory.py +313 -0
- agno/knowledge/reader/s3_reader.py +89 -0
- agno/knowledge/reader/tavily_reader.py +194 -0
- agno/knowledge/reader/text_reader.py +115 -0
- agno/knowledge/reader/web_search_reader.py +372 -0
- agno/knowledge/reader/website_reader.py +455 -0
- agno/knowledge/reader/wikipedia_reader.py +59 -0
- agno/knowledge/reader/youtube_reader.py +78 -0
- agno/knowledge/remote_content/__init__.py +0 -0
- agno/knowledge/remote_content/remote_content.py +88 -0
- agno/knowledge/reranker/__init__.py +3 -0
- agno/knowledge/reranker/base.py +14 -0
- agno/knowledge/reranker/cohere.py +64 -0
- agno/knowledge/reranker/infinity.py +195 -0
- agno/knowledge/reranker/sentence_transformer.py +54 -0
- agno/knowledge/types.py +39 -0
- agno/knowledge/utils.py +189 -0
- agno/media.py +462 -0
- agno/memory/__init__.py +3 -0
- agno/memory/manager.py +1327 -0
- agno/models/__init__.py +0 -0
- agno/models/aimlapi/__init__.py +5 -0
- agno/models/aimlapi/aimlapi.py +45 -0
- agno/models/anthropic/__init__.py +5 -0
- agno/models/anthropic/claude.py +757 -0
- agno/models/aws/__init__.py +15 -0
- agno/models/aws/bedrock.py +701 -0
- agno/models/aws/claude.py +378 -0
- agno/models/azure/__init__.py +18 -0
- agno/models/azure/ai_foundry.py +485 -0
- agno/models/azure/openai_chat.py +131 -0
- agno/models/base.py +2175 -0
- agno/models/cerebras/__init__.py +12 -0
- agno/models/cerebras/cerebras.py +501 -0
- agno/models/cerebras/cerebras_openai.py +112 -0
- agno/models/cohere/__init__.py +5 -0
- agno/models/cohere/chat.py +389 -0
- agno/models/cometapi/__init__.py +5 -0
- agno/models/cometapi/cometapi.py +57 -0
- agno/models/dashscope/__init__.py +5 -0
- agno/models/dashscope/dashscope.py +91 -0
- agno/models/deepinfra/__init__.py +5 -0
- agno/models/deepinfra/deepinfra.py +28 -0
- agno/models/deepseek/__init__.py +5 -0
- agno/models/deepseek/deepseek.py +61 -0
- agno/models/defaults.py +1 -0
- agno/models/fireworks/__init__.py +5 -0
- agno/models/fireworks/fireworks.py +26 -0
- agno/models/google/__init__.py +5 -0
- agno/models/google/gemini.py +1085 -0
- agno/models/groq/__init__.py +5 -0
- agno/models/groq/groq.py +556 -0
- agno/models/huggingface/__init__.py +5 -0
- agno/models/huggingface/huggingface.py +491 -0
- agno/models/ibm/__init__.py +5 -0
- agno/models/ibm/watsonx.py +422 -0
- agno/models/internlm/__init__.py +3 -0
- agno/models/internlm/internlm.py +26 -0
- agno/models/langdb/__init__.py +1 -0
- agno/models/langdb/langdb.py +48 -0
- agno/models/litellm/__init__.py +14 -0
- agno/models/litellm/chat.py +468 -0
- agno/models/litellm/litellm_openai.py +25 -0
- agno/models/llama_cpp/__init__.py +5 -0
- agno/models/llama_cpp/llama_cpp.py +22 -0
- agno/models/lmstudio/__init__.py +5 -0
- agno/models/lmstudio/lmstudio.py +25 -0
- agno/models/message.py +434 -0
- agno/models/meta/__init__.py +12 -0
- agno/models/meta/llama.py +475 -0
- agno/models/meta/llama_openai.py +78 -0
- agno/models/metrics.py +120 -0
- agno/models/mistral/__init__.py +5 -0
- agno/models/mistral/mistral.py +432 -0
- agno/models/nebius/__init__.py +3 -0
- agno/models/nebius/nebius.py +54 -0
- agno/models/nexus/__init__.py +3 -0
- agno/models/nexus/nexus.py +22 -0
- agno/models/nvidia/__init__.py +5 -0
- agno/models/nvidia/nvidia.py +28 -0
- agno/models/ollama/__init__.py +5 -0
- agno/models/ollama/chat.py +441 -0
- agno/models/openai/__init__.py +9 -0
- agno/models/openai/chat.py +883 -0
- agno/models/openai/like.py +27 -0
- agno/models/openai/responses.py +1050 -0
- agno/models/openrouter/__init__.py +5 -0
- agno/models/openrouter/openrouter.py +66 -0
- agno/models/perplexity/__init__.py +5 -0
- agno/models/perplexity/perplexity.py +187 -0
- agno/models/portkey/__init__.py +3 -0
- agno/models/portkey/portkey.py +81 -0
- agno/models/requesty/__init__.py +5 -0
- agno/models/requesty/requesty.py +52 -0
- agno/models/response.py +199 -0
- agno/models/sambanova/__init__.py +5 -0
- agno/models/sambanova/sambanova.py +28 -0
- agno/models/siliconflow/__init__.py +5 -0
- agno/models/siliconflow/siliconflow.py +25 -0
- agno/models/together/__init__.py +5 -0
- agno/models/together/together.py +25 -0
- agno/models/utils.py +266 -0
- agno/models/vercel/__init__.py +3 -0
- agno/models/vercel/v0.py +26 -0
- agno/models/vertexai/__init__.py +0 -0
- agno/models/vertexai/claude.py +70 -0
- agno/models/vllm/__init__.py +3 -0
- agno/models/vllm/vllm.py +78 -0
- agno/models/xai/__init__.py +3 -0
- agno/models/xai/xai.py +113 -0
- agno/os/__init__.py +3 -0
- agno/os/app.py +876 -0
- agno/os/auth.py +57 -0
- agno/os/config.py +104 -0
- agno/os/interfaces/__init__.py +1 -0
- agno/os/interfaces/a2a/__init__.py +3 -0
- agno/os/interfaces/a2a/a2a.py +42 -0
- agno/os/interfaces/a2a/router.py +250 -0
- agno/os/interfaces/a2a/utils.py +924 -0
- agno/os/interfaces/agui/__init__.py +3 -0
- agno/os/interfaces/agui/agui.py +47 -0
- agno/os/interfaces/agui/router.py +144 -0
- agno/os/interfaces/agui/utils.py +534 -0
- agno/os/interfaces/base.py +25 -0
- agno/os/interfaces/slack/__init__.py +3 -0
- agno/os/interfaces/slack/router.py +148 -0
- agno/os/interfaces/slack/security.py +30 -0
- agno/os/interfaces/slack/slack.py +47 -0
- agno/os/interfaces/whatsapp/__init__.py +3 -0
- agno/os/interfaces/whatsapp/router.py +211 -0
- agno/os/interfaces/whatsapp/security.py +53 -0
- agno/os/interfaces/whatsapp/whatsapp.py +36 -0
- agno/os/mcp.py +292 -0
- agno/os/middleware/__init__.py +7 -0
- agno/os/middleware/jwt.py +233 -0
- agno/os/router.py +1763 -0
- agno/os/routers/__init__.py +3 -0
- agno/os/routers/evals/__init__.py +3 -0
- agno/os/routers/evals/evals.py +430 -0
- agno/os/routers/evals/schemas.py +142 -0
- agno/os/routers/evals/utils.py +162 -0
- agno/os/routers/health.py +31 -0
- agno/os/routers/home.py +52 -0
- agno/os/routers/knowledge/__init__.py +3 -0
- agno/os/routers/knowledge/knowledge.py +997 -0
- agno/os/routers/knowledge/schemas.py +178 -0
- agno/os/routers/memory/__init__.py +3 -0
- agno/os/routers/memory/memory.py +515 -0
- agno/os/routers/memory/schemas.py +62 -0
- agno/os/routers/metrics/__init__.py +3 -0
- agno/os/routers/metrics/metrics.py +190 -0
- agno/os/routers/metrics/schemas.py +47 -0
- agno/os/routers/session/__init__.py +3 -0
- agno/os/routers/session/session.py +997 -0
- agno/os/schema.py +1055 -0
- agno/os/settings.py +43 -0
- agno/os/utils.py +630 -0
- agno/py.typed +0 -0
- agno/reasoning/__init__.py +0 -0
- agno/reasoning/anthropic.py +80 -0
- agno/reasoning/azure_ai_foundry.py +67 -0
- agno/reasoning/deepseek.py +63 -0
- agno/reasoning/default.py +97 -0
- agno/reasoning/gemini.py +73 -0
- agno/reasoning/groq.py +71 -0
- agno/reasoning/helpers.py +63 -0
- agno/reasoning/ollama.py +67 -0
- agno/reasoning/openai.py +86 -0
- agno/reasoning/step.py +31 -0
- agno/reasoning/vertexai.py +76 -0
- agno/run/__init__.py +6 -0
- agno/run/agent.py +787 -0
- agno/run/base.py +229 -0
- agno/run/cancel.py +81 -0
- agno/run/messages.py +32 -0
- agno/run/team.py +753 -0
- agno/run/workflow.py +708 -0
- agno/session/__init__.py +10 -0
- agno/session/agent.py +295 -0
- agno/session/summary.py +265 -0
- agno/session/team.py +392 -0
- agno/session/workflow.py +205 -0
- agno/team/__init__.py +37 -0
- agno/team/team.py +8793 -0
- agno/tools/__init__.py +10 -0
- agno/tools/agentql.py +120 -0
- agno/tools/airflow.py +69 -0
- agno/tools/api.py +122 -0
- agno/tools/apify.py +314 -0
- agno/tools/arxiv.py +127 -0
- agno/tools/aws_lambda.py +53 -0
- agno/tools/aws_ses.py +66 -0
- agno/tools/baidusearch.py +89 -0
- agno/tools/bitbucket.py +292 -0
- agno/tools/brandfetch.py +213 -0
- agno/tools/bravesearch.py +106 -0
- agno/tools/brightdata.py +367 -0
- agno/tools/browserbase.py +209 -0
- agno/tools/calcom.py +255 -0
- agno/tools/calculator.py +151 -0
- agno/tools/cartesia.py +187 -0
- agno/tools/clickup.py +244 -0
- agno/tools/confluence.py +240 -0
- agno/tools/crawl4ai.py +158 -0
- agno/tools/csv_toolkit.py +185 -0
- agno/tools/dalle.py +110 -0
- agno/tools/daytona.py +475 -0
- agno/tools/decorator.py +262 -0
- agno/tools/desi_vocal.py +108 -0
- agno/tools/discord.py +161 -0
- agno/tools/docker.py +716 -0
- agno/tools/duckdb.py +379 -0
- agno/tools/duckduckgo.py +91 -0
- agno/tools/e2b.py +703 -0
- agno/tools/eleven_labs.py +196 -0
- agno/tools/email.py +67 -0
- agno/tools/evm.py +129 -0
- agno/tools/exa.py +396 -0
- agno/tools/fal.py +127 -0
- agno/tools/file.py +240 -0
- agno/tools/file_generation.py +350 -0
- agno/tools/financial_datasets.py +288 -0
- agno/tools/firecrawl.py +143 -0
- agno/tools/function.py +1187 -0
- agno/tools/giphy.py +93 -0
- agno/tools/github.py +1760 -0
- agno/tools/gmail.py +922 -0
- agno/tools/google_bigquery.py +117 -0
- agno/tools/google_drive.py +270 -0
- agno/tools/google_maps.py +253 -0
- agno/tools/googlecalendar.py +674 -0
- agno/tools/googlesearch.py +98 -0
- agno/tools/googlesheets.py +377 -0
- agno/tools/hackernews.py +77 -0
- agno/tools/jina.py +101 -0
- agno/tools/jira.py +170 -0
- agno/tools/knowledge.py +218 -0
- agno/tools/linear.py +426 -0
- agno/tools/linkup.py +58 -0
- agno/tools/local_file_system.py +90 -0
- agno/tools/lumalab.py +183 -0
- agno/tools/mcp/__init__.py +10 -0
- agno/tools/mcp/mcp.py +331 -0
- agno/tools/mcp/multi_mcp.py +347 -0
- agno/tools/mcp/params.py +24 -0
- agno/tools/mcp_toolbox.py +284 -0
- agno/tools/mem0.py +193 -0
- agno/tools/memori.py +339 -0
- agno/tools/memory.py +419 -0
- agno/tools/mlx_transcribe.py +139 -0
- agno/tools/models/__init__.py +0 -0
- agno/tools/models/azure_openai.py +190 -0
- agno/tools/models/gemini.py +203 -0
- agno/tools/models/groq.py +158 -0
- agno/tools/models/morph.py +186 -0
- agno/tools/models/nebius.py +124 -0
- agno/tools/models_labs.py +195 -0
- agno/tools/moviepy_video.py +349 -0
- agno/tools/neo4j.py +134 -0
- agno/tools/newspaper.py +46 -0
- agno/tools/newspaper4k.py +93 -0
- agno/tools/notion.py +204 -0
- agno/tools/openai.py +202 -0
- agno/tools/openbb.py +160 -0
- agno/tools/opencv.py +321 -0
- agno/tools/openweather.py +233 -0
- agno/tools/oxylabs.py +385 -0
- agno/tools/pandas.py +102 -0
- agno/tools/parallel.py +314 -0
- agno/tools/postgres.py +257 -0
- agno/tools/pubmed.py +188 -0
- agno/tools/python.py +205 -0
- agno/tools/reasoning.py +283 -0
- agno/tools/reddit.py +467 -0
- agno/tools/replicate.py +117 -0
- agno/tools/resend.py +62 -0
- agno/tools/scrapegraph.py +222 -0
- agno/tools/searxng.py +152 -0
- agno/tools/serpapi.py +116 -0
- agno/tools/serper.py +255 -0
- agno/tools/shell.py +53 -0
- agno/tools/slack.py +136 -0
- agno/tools/sleep.py +20 -0
- agno/tools/spider.py +116 -0
- agno/tools/sql.py +154 -0
- agno/tools/streamlit/__init__.py +0 -0
- agno/tools/streamlit/components.py +113 -0
- agno/tools/tavily.py +254 -0
- agno/tools/telegram.py +48 -0
- agno/tools/todoist.py +218 -0
- agno/tools/tool_registry.py +1 -0
- agno/tools/toolkit.py +146 -0
- agno/tools/trafilatura.py +388 -0
- agno/tools/trello.py +274 -0
- agno/tools/twilio.py +186 -0
- agno/tools/user_control_flow.py +78 -0
- agno/tools/valyu.py +228 -0
- agno/tools/visualization.py +467 -0
- agno/tools/webbrowser.py +28 -0
- agno/tools/webex.py +76 -0
- agno/tools/website.py +54 -0
- agno/tools/webtools.py +45 -0
- agno/tools/whatsapp.py +286 -0
- agno/tools/wikipedia.py +63 -0
- agno/tools/workflow.py +278 -0
- agno/tools/x.py +335 -0
- agno/tools/yfinance.py +257 -0
- agno/tools/youtube.py +184 -0
- agno/tools/zendesk.py +82 -0
- agno/tools/zep.py +454 -0
- agno/tools/zoom.py +382 -0
- agno/utils/__init__.py +0 -0
- agno/utils/agent.py +820 -0
- agno/utils/audio.py +49 -0
- agno/utils/certs.py +27 -0
- agno/utils/code_execution.py +11 -0
- agno/utils/common.py +132 -0
- agno/utils/dttm.py +13 -0
- agno/utils/enum.py +22 -0
- agno/utils/env.py +11 -0
- agno/utils/events.py +696 -0
- agno/utils/format_str.py +16 -0
- agno/utils/functions.py +166 -0
- agno/utils/gemini.py +426 -0
- agno/utils/hooks.py +57 -0
- agno/utils/http.py +74 -0
- agno/utils/json_schema.py +234 -0
- agno/utils/knowledge.py +36 -0
- agno/utils/location.py +19 -0
- agno/utils/log.py +255 -0
- agno/utils/mcp.py +214 -0
- agno/utils/media.py +352 -0
- agno/utils/merge_dict.py +41 -0
- agno/utils/message.py +118 -0
- agno/utils/models/__init__.py +0 -0
- agno/utils/models/ai_foundry.py +43 -0
- agno/utils/models/claude.py +358 -0
- agno/utils/models/cohere.py +87 -0
- agno/utils/models/llama.py +78 -0
- agno/utils/models/mistral.py +98 -0
- agno/utils/models/openai_responses.py +140 -0
- agno/utils/models/schema_utils.py +153 -0
- agno/utils/models/watsonx.py +41 -0
- agno/utils/openai.py +257 -0
- agno/utils/pickle.py +32 -0
- agno/utils/pprint.py +178 -0
- agno/utils/print_response/__init__.py +0 -0
- agno/utils/print_response/agent.py +842 -0
- agno/utils/print_response/team.py +1724 -0
- agno/utils/print_response/workflow.py +1668 -0
- agno/utils/prompts.py +111 -0
- agno/utils/reasoning.py +108 -0
- agno/utils/response.py +163 -0
- agno/utils/response_iterator.py +17 -0
- agno/utils/safe_formatter.py +24 -0
- agno/utils/serialize.py +32 -0
- agno/utils/shell.py +22 -0
- agno/utils/streamlit.py +487 -0
- agno/utils/string.py +231 -0
- agno/utils/team.py +139 -0
- agno/utils/timer.py +41 -0
- agno/utils/tools.py +102 -0
- agno/utils/web.py +23 -0
- agno/utils/whatsapp.py +305 -0
- agno/utils/yaml_io.py +25 -0
- agno/vectordb/__init__.py +3 -0
- agno/vectordb/base.py +127 -0
- agno/vectordb/cassandra/__init__.py +5 -0
- agno/vectordb/cassandra/cassandra.py +501 -0
- agno/vectordb/cassandra/extra_param_mixin.py +11 -0
- agno/vectordb/cassandra/index.py +13 -0
- agno/vectordb/chroma/__init__.py +5 -0
- agno/vectordb/chroma/chromadb.py +929 -0
- agno/vectordb/clickhouse/__init__.py +9 -0
- agno/vectordb/clickhouse/clickhousedb.py +835 -0
- agno/vectordb/clickhouse/index.py +9 -0
- agno/vectordb/couchbase/__init__.py +3 -0
- agno/vectordb/couchbase/couchbase.py +1442 -0
- agno/vectordb/distance.py +7 -0
- agno/vectordb/lancedb/__init__.py +6 -0
- agno/vectordb/lancedb/lance_db.py +995 -0
- agno/vectordb/langchaindb/__init__.py +5 -0
- agno/vectordb/langchaindb/langchaindb.py +163 -0
- agno/vectordb/lightrag/__init__.py +5 -0
- agno/vectordb/lightrag/lightrag.py +388 -0
- agno/vectordb/llamaindex/__init__.py +3 -0
- agno/vectordb/llamaindex/llamaindexdb.py +166 -0
- agno/vectordb/milvus/__init__.py +4 -0
- agno/vectordb/milvus/milvus.py +1182 -0
- agno/vectordb/mongodb/__init__.py +9 -0
- agno/vectordb/mongodb/mongodb.py +1417 -0
- agno/vectordb/pgvector/__init__.py +12 -0
- agno/vectordb/pgvector/index.py +23 -0
- agno/vectordb/pgvector/pgvector.py +1462 -0
- agno/vectordb/pineconedb/__init__.py +5 -0
- agno/vectordb/pineconedb/pineconedb.py +747 -0
- agno/vectordb/qdrant/__init__.py +5 -0
- agno/vectordb/qdrant/qdrant.py +1134 -0
- agno/vectordb/redis/__init__.py +9 -0
- agno/vectordb/redis/redisdb.py +694 -0
- agno/vectordb/search.py +7 -0
- agno/vectordb/singlestore/__init__.py +10 -0
- agno/vectordb/singlestore/index.py +41 -0
- agno/vectordb/singlestore/singlestore.py +763 -0
- agno/vectordb/surrealdb/__init__.py +3 -0
- agno/vectordb/surrealdb/surrealdb.py +699 -0
- agno/vectordb/upstashdb/__init__.py +5 -0
- agno/vectordb/upstashdb/upstashdb.py +718 -0
- agno/vectordb/weaviate/__init__.py +8 -0
- agno/vectordb/weaviate/index.py +15 -0
- agno/vectordb/weaviate/weaviate.py +1005 -0
- agno/workflow/__init__.py +23 -0
- agno/workflow/agent.py +299 -0
- agno/workflow/condition.py +738 -0
- agno/workflow/loop.py +735 -0
- agno/workflow/parallel.py +824 -0
- agno/workflow/router.py +702 -0
- agno/workflow/step.py +1432 -0
- agno/workflow/steps.py +592 -0
- agno/workflow/types.py +520 -0
- agno/workflow/workflow.py +4321 -0
- agno-2.2.13.dist-info/METADATA +614 -0
- agno-2.2.13.dist-info/RECORD +575 -0
- agno-2.2.13.dist-info/WHEEL +5 -0
- agno-2.2.13.dist-info/licenses/LICENSE +201 -0
- agno-2.2.13.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,883 @@
|
|
|
1
|
+
from collections.abc import AsyncIterator
|
|
2
|
+
from dataclasses import dataclass
|
|
3
|
+
from os import getenv
|
|
4
|
+
from typing import Any, Dict, Iterator, List, Literal, Optional, Type, Union
|
|
5
|
+
from uuid import uuid4
|
|
6
|
+
|
|
7
|
+
import httpx
|
|
8
|
+
from pydantic import BaseModel
|
|
9
|
+
|
|
10
|
+
from agno.exceptions import ModelProviderError
|
|
11
|
+
from agno.media import Audio
|
|
12
|
+
from agno.models.base import Model
|
|
13
|
+
from agno.models.message import Message
|
|
14
|
+
from agno.models.metrics import Metrics
|
|
15
|
+
from agno.models.response import ModelResponse
|
|
16
|
+
from agno.run.agent import RunOutput
|
|
17
|
+
from agno.run.team import TeamRunOutput
|
|
18
|
+
from agno.utils.log import log_debug, log_error, log_warning
|
|
19
|
+
from agno.utils.openai import _format_file_for_message, audio_to_message, images_to_message
|
|
20
|
+
from agno.utils.reasoning import extract_thinking_content
|
|
21
|
+
|
|
22
|
+
try:
|
|
23
|
+
from openai import APIConnectionError, APIStatusError, RateLimitError
|
|
24
|
+
from openai import AsyncOpenAI as AsyncOpenAIClient
|
|
25
|
+
from openai import OpenAI as OpenAIClient
|
|
26
|
+
from openai.types import CompletionUsage
|
|
27
|
+
from openai.types.chat import ChatCompletion, ChatCompletionAudio, ChatCompletionChunk
|
|
28
|
+
from openai.types.chat.chat_completion_chunk import ChoiceDelta, ChoiceDeltaToolCall
|
|
29
|
+
except (ImportError, ModuleNotFoundError):
|
|
30
|
+
raise ImportError("`openai` not installed. Please install using `pip install openai`")
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
@dataclass
class OpenAIChat(Model):
    """
    A class for interacting with OpenAI models using the Chat completions API.

    For more information, see: https://platform.openai.com/docs/api-reference/chat/create
    """

    # Model identity: default model id and bookkeeping names for this provider.
    id: str = "gpt-4o"
    name: str = "OpenAIChat"
    provider: str = "OpenAI"
    # OpenAI supports schema-enforced structured outputs natively.
    supports_native_structured_outputs: bool = True

    # Request parameters
    # Each of these maps 1:1 onto a Chat Completions request field; values
    # left as None are omitted from the request (see get_request_params).
    store: Optional[bool] = None
    reasoning_effort: Optional[str] = None
    verbosity: Optional[Literal["low", "medium", "high"]] = None
    metadata: Optional[Dict[str, Any]] = None
    frequency_penalty: Optional[float] = None
    logit_bias: Optional[Any] = None
    logprobs: Optional[bool] = None
    top_logprobs: Optional[int] = None
    max_tokens: Optional[int] = None
    max_completion_tokens: Optional[int] = None
    modalities: Optional[List[str]] = None  # "text" and/or "audio"
    audio: Optional[Dict[str, Any]] = (
        None  # E.g. {"voice": "alloy", "format": "wav"}. `format` must be one of `wav`, `mp3`, `flac`, `opus`, or `pcm16`. `voice` must be one of `ash`, `ballad`, `coral`, `sage`, `verse`, `alloy`, `echo`, and `shimmer`.
    )
    presence_penalty: Optional[float] = None
    seed: Optional[int] = None
    stop: Optional[Union[str, List[str]]] = None
    temperature: Optional[float] = None
    user: Optional[str] = None
    top_p: Optional[float] = None
    service_tier: Optional[str] = None  # "auto" | "default" | "flex" | "priority", defaults to "auto" when not set
    strict_output: bool = True  # When True, guarantees schema adherence for structured outputs. When False, attempts to follow schema as a guide but may occasionally deviate
    extra_headers: Optional[Any] = None
    extra_query: Optional[Any] = None
    extra_body: Optional[Any] = None
    # Escape hatch: merged last over the computed request parameters.
    request_params: Optional[Dict[str, Any]] = None
    # Optional override for default_role_map below.
    role_map: Optional[Dict[str, str]] = None

    # Client parameters
    # Passed to the OpenAI client constructors; None values are dropped
    # (see _get_client_params).
    api_key: Optional[str] = None
    organization: Optional[str] = None
    base_url: Optional[Union[str, httpx.URL]] = None
    timeout: Optional[float] = None
    max_retries: Optional[int] = None
    default_headers: Optional[Any] = None
    default_query: Optional[Any] = None
    http_client: Optional[Union[httpx.Client, httpx.AsyncClient]] = None
    # Escape hatch: merged last over the computed client parameters.
    client_params: Optional[Dict[str, Any]] = None

    # OpenAI clients
    # Cached client instances, created lazily by get_client()/get_async_client().
    client: Optional[OpenAIClient] = None
    async_client: Optional[AsyncOpenAIClient] = None

    # The role to map the message role to.
    # NOTE: intentionally left without a type annotation so that dataclasses
    # treats it as a plain class attribute rather than a field (a mutable
    # default value would otherwise be rejected by @dataclass).
    default_role_map = {
        "system": "developer",
        "user": "user",
        "assistant": "assistant",
        "tool": "tool",
        "model": "assistant",
    }
|
|
98
|
+
|
|
99
|
+
def _get_client_params(self) -> Dict[str, Any]:
|
|
100
|
+
# Fetch API key from env if not already set
|
|
101
|
+
if not self.api_key:
|
|
102
|
+
self.api_key = getenv("OPENAI_API_KEY")
|
|
103
|
+
if not self.api_key:
|
|
104
|
+
log_error("OPENAI_API_KEY not set. Please set the OPENAI_API_KEY environment variable.")
|
|
105
|
+
|
|
106
|
+
# Define base client params
|
|
107
|
+
base_params = {
|
|
108
|
+
"api_key": self.api_key,
|
|
109
|
+
"organization": self.organization,
|
|
110
|
+
"base_url": self.base_url,
|
|
111
|
+
"timeout": self.timeout,
|
|
112
|
+
"max_retries": self.max_retries,
|
|
113
|
+
"default_headers": self.default_headers,
|
|
114
|
+
"default_query": self.default_query,
|
|
115
|
+
}
|
|
116
|
+
|
|
117
|
+
# Create client_params dict with non-None values
|
|
118
|
+
client_params = {k: v for k, v in base_params.items() if v is not None}
|
|
119
|
+
|
|
120
|
+
# Add additional client params if provided
|
|
121
|
+
if self.client_params:
|
|
122
|
+
client_params.update(self.client_params)
|
|
123
|
+
return client_params
|
|
124
|
+
|
|
125
|
+
def get_client(self) -> OpenAIClient:
    """
    Returns an OpenAI client.

    Reuses the cached client while it is still open; otherwise constructs
    a new one from the configured client parameters. A user-supplied
    ``http_client`` is attached only when it is a synchronous httpx.Client.

    Returns:
        OpenAIClient: An instance of the OpenAI client.
    """
    # Reuse the cached client unless it has been closed.
    if self.client and not self.client.is_closed():
        return self.client

    params: Dict[str, Any] = self._get_client_params()
    if self.http_client:
        if isinstance(self.http_client, httpx.Client):
            params["http_client"] = self.http_client
        else:
            # An async httpx client cannot back the synchronous OpenAI client.
            log_debug("http_client is not an instance of httpx.Client.")

    self.client = OpenAIClient(**params)
    return self.client
|
|
144
|
+
|
|
145
|
+
def get_async_client(self) -> AsyncOpenAIClient:
    """
    Returns an asynchronous OpenAI client.

    Reuses the cached async client while it is still open. A user-supplied
    ``http_client`` is used only when it is an httpx.AsyncClient; a sync
    client is ignored (with a debug log) and a fresh AsyncClient with
    generous connection limits is created instead.

    Returns:
        AsyncOpenAIClient: An instance of the asynchronous OpenAI client.
    """
    # Reuse the cached async client unless it has been closed.
    if self.async_client and not self.async_client.is_closed():
        return self.async_client

    params: Dict[str, Any] = self._get_client_params()
    if self.http_client and isinstance(self.http_client, httpx.AsyncClient):
        params["http_client"] = self.http_client
    else:
        if self.http_client:
            log_debug("The current http_client is not async. A default httpx.AsyncClient will be used instead.")
        # Fall back to a new async HTTP client with custom connection limits.
        params["http_client"] = httpx.AsyncClient(
            limits=httpx.Limits(max_connections=1000, max_keepalive_connections=100)
        )
    self.async_client = AsyncOpenAIClient(**params)
    return self.async_client
|
|
167
|
+
|
|
168
|
+
def get_request_params(
    self,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    tools: Optional[List[Dict[str, Any]]] = None,
    tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
    run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
) -> Dict[str, Any]:
    """
    Returns keyword arguments for API requests.

    Collects all configured request options (dropping unset ones), wires in
    the response format, tools, and tool choice, then applies any explicit
    ``request_params`` overrides last.

    Returns:
        Dict[str, Any]: A dictionary of keyword arguments for API requests.
    """
    # All candidate request options; None entries are filtered out below.
    candidate_params: Dict[str, Any] = {
        "store": self.store,
        "reasoning_effort": self.reasoning_effort,
        "verbosity": self.verbosity,
        "frequency_penalty": self.frequency_penalty,
        "logit_bias": self.logit_bias,
        "logprobs": self.logprobs,
        "top_logprobs": self.top_logprobs,
        "max_tokens": self.max_tokens,
        "max_completion_tokens": self.max_completion_tokens,
        "modalities": self.modalities,
        "audio": self.audio,
        "presence_penalty": self.presence_penalty,
        "seed": self.seed,
        "stop": self.stop,
        "temperature": self.temperature,
        "user": self.user,
        "top_p": self.top_p,
        "extra_headers": self.extra_headers,
        "extra_query": self.extra_query,
        "extra_body": self.extra_body,
        "metadata": self.metadata,
        "service_tier": self.service_tier,
    }

    # Handle response format - always use JSON schema approach
    if response_format is not None:
        if isinstance(response_format, type) and issubclass(response_format, BaseModel):
            # Convert Pydantic to JSON schema for regular endpoint
            from agno.utils.models.schema_utils import get_response_schema_for_provider

            json_schema = get_response_schema_for_provider(response_format, "openai")
            candidate_params["response_format"] = {
                "type": "json_schema",
                "json_schema": {
                    "name": response_format.__name__,
                    "schema": json_schema,
                    "strict": self.strict_output,
                },
            }
        else:
            # Handle other response format types (like {"type": "json_object"})
            candidate_params["response_format"] = response_format

    # Keep only the options that were actually set.
    request_params: Dict[str, Any] = {k: v for k, v in candidate_params.items() if v is not None}

    # Add tools
    if tools:
        # Remove unsupported fields for OpenAILike models
        if self.provider in ("AIMLAPI", "Fireworks", "Nvidia"):
            for tool in tools:
                if tool.get("type") != "function":
                    continue
                function_spec = tool["function"]
                if function_spec.get("requires_confirmation") is not None:
                    del function_spec["requires_confirmation"]
                if function_spec.get("external_execution") is not None:
                    del function_spec["external_execution"]

        request_params["tools"] = tools

    if tool_choice is not None:
        request_params["tool_choice"] = tool_choice

    # Add additional request params if provided
    if self.request_params:
        request_params.update(self.request_params)

    if request_params:
        log_debug(f"Calling {self.provider} with request parameters: {request_params}", log_level=2)
    return request_params
|
|
252
|
+
|
|
253
|
+
def to_dict(self) -> Dict[str, Any]:
    """
    Convert the model configuration to a dictionary.

    Extends the base-class dictionary with every OpenAI-specific request
    attribute, then drops unset (None) entries so the serialized form stays
    compact.

    Returns:
        Dict[str, Any]: The dictionary representation of the model.
    """
    model_dict = super().to_dict()
    model_dict.update(
        {
            "store": self.store,
            "reasoning_effort": self.reasoning_effort,
            "verbosity": self.verbosity,
            "frequency_penalty": self.frequency_penalty,
            "logit_bias": self.logit_bias,
            "logprobs": self.logprobs,
            "top_logprobs": self.top_logprobs,
            "max_tokens": self.max_tokens,
            "max_completion_tokens": self.max_completion_tokens,
            "modalities": self.modalities,
            "audio": self.audio,
            "presence_penalty": self.presence_penalty,
            "seed": self.seed,
            "stop": self.stop,
            "temperature": self.temperature,
            "top_p": self.top_p,
            "user": self.user,
            "extra_headers": self.extra_headers,
            "extra_query": self.extra_query,
            "extra_body": self.extra_body,
            # Fix: include metadata for consistency with get_request_params(),
            # which sends it to the API; previously it was silently dropped
            # from the serialized representation.
            "metadata": self.metadata,
            "service_tier": self.service_tier,
        }
    )
    # Drop unset values so only explicitly-configured fields are serialized.
    cleaned_dict = {k: v for k, v in model_dict.items() if v is not None}
    return cleaned_dict
|
|
288
|
+
|
|
289
|
+
def _format_message(self, message: Message) -> Dict[str, Any]:
    """
    Format a message into the format expected by OpenAI.

    Args:
        message (Message): The message to format.

    Returns:
        Dict[str, Any]: The formatted message.
    """
    # Map the Agno role onto the provider role; an instance-level role_map
    # overrides the class default mapping.
    message_dict: Dict[str, Any] = {
        "role": self.role_map[message.role] if self.role_map else self.default_role_map[message.role],
        "content": message.content,
        "name": message.name,
        "tool_call_id": message.tool_call_id,
        "tool_calls": message.tool_calls,
    }
    # Drop unset fields so explicit nulls are not sent to the API.
    message_dict = {k: v for k, v in message_dict.items() if v is not None}

    # Ignore non-string message content
    # because we assume that the images/audio are already added to the message
    if (message.images is not None and len(message.images) > 0) or (
        message.audio is not None and len(message.audio) > 0
    ):
        # Ignore non-string message content
        # because we assume that the images/audio are already added to the message
        if isinstance(message.content, str):
            # Convert plain text into a multi-part content list so that
            # image/audio parts can be appended alongside it.
            message_dict["content"] = [{"type": "text", "text": message.content}]
        # NOTE(review): if message.content is None here, "content" was filtered
        # out above and these extend() calls would raise KeyError — presumably
        # images/audio always accompany string content; confirm with callers.
        if message.images is not None:
            message_dict["content"].extend(images_to_message(images=message.images))

        if message.audio is not None:
            message_dict["content"].extend(audio_to_message(audio=message.audio))

    # A prior assistant audio response is referenced by id only; its content
    # is replaced with an empty string.
    if message.audio_output is not None:
        message_dict["content"] = ""
        message_dict["audio"] = {"id": message.audio_output.id}

    if message.videos is not None and len(message.videos) > 0:
        log_warning("Video input is currently unsupported.")

    # OpenAI expects the tool_calls to be None if empty, not an empty list
    if message.tool_calls is not None and len(message.tool_calls) == 0:
        message_dict["tool_calls"] = None

    if message.files is not None:
        # Ensure content is a list of parts
        content = message_dict.get("content")
        if isinstance(content, str):  # wrap existing text
            text = content
            message_dict["content"] = [{"type": "text", "text": text}]
        elif content is None:
            message_dict["content"] = []
        # Insert each file part before text parts
        for file in message.files:
            file_part = _format_file_for_message(file)
            if file_part:
                message_dict["content"].insert(0, file_part)

    # Manually add the content field even if it is None
    # NOTE(review): when message.content is None but file/image parts were
    # assembled above, this overwrites the part list with "" and drops those
    # parts — confirm whether that is intended.
    if message.content is None:
        message_dict["content"] = ""
    return message_dict
|
|
352
|
+
|
|
353
|
+
def invoke(
    self,
    messages: List[Message],
    assistant_message: Message,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    tools: Optional[List[Dict[str, Any]]] = None,
    tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
    run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
) -> ModelResponse:
    """
    Send a chat completion request to the OpenAI API and parse the response.

    Args:
        messages (List[Message]): A list of messages to send to the model.
        assistant_message (Message): The assistant message to populate.
        response_format (Optional[Union[Dict, Type[BaseModel]]]): The response format to use.
        tools (Optional[List[Dict[str, Any]]]): The tools to use.
        tool_choice (Optional[Union[str, Dict[str, Any]]]): The tool choice to use.

    Returns:
        ModelResponse: The chat completion response from the API.

    Raises:
        ModelProviderError: On any API failure (rate limit, connection,
            status, or unexpected error), chained from the SDK exception.
    """
    try:
        # NOTE(review): time-to-first-token is recorded before the request is
        # issued on this non-streaming path — confirm this is intentional.
        if run_response and run_response.metrics:
            run_response.metrics.set_time_to_first_token()

        # Timer brackets the full round trip to the provider.
        assistant_message.metrics.start_timer()

        provider_response = self.get_client().chat.completions.create(
            model=self.id,
            messages=[self._format_message(m) for m in messages],  # type: ignore
            **self.get_request_params(
                response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
            ),
        )
        assistant_message.metrics.stop_timer()

        # Parse the response into an Agno ModelResponse object
        model_response = self._parse_provider_response(provider_response, response_format=response_format)

        return model_response

    except RateLimitError as e:
        log_error(f"Rate limit error from OpenAI API: {e}")
        # Rate-limit bodies are assumed to be JSON with an "error" object;
        # fall back to the raw value when the shape differs.
        error_message = e.response.json().get("error", {})
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except APIConnectionError as e:
        log_error(f"API connection error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
    except APIStatusError as e:
        log_error(f"API status error from OpenAI API: {e}")
        # The error body may not be JSON; fall back to the raw response text.
        try:
            error_message = e.response.json().get("error", {})
        except Exception:
            error_message = e.response.text
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except Exception as e:
        # Catch-all boundary: wrap anything unexpected in the provider error type.
        log_error(f"Error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
|
|
432
|
+
|
|
433
|
+
async def ainvoke(
    self,
    messages: List[Message],
    assistant_message: Message,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    tools: Optional[List[Dict[str, Any]]] = None,
    tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
    run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
) -> ModelResponse:
    """
    Sends an asynchronous chat completion request to the OpenAI API.

    Async counterpart of `invoke`; identical request construction,
    response parsing, and error mapping.

    Args:
        messages (List[Message]): A list of messages to send to the model.
        assistant_message (Message): The assistant message to populate.
        response_format (Optional[Union[Dict, Type[BaseModel]]]): The response format to use.
        tools (Optional[List[Dict[str, Any]]]): The tools to use.
        tool_choice (Optional[Union[str, Dict[str, Any]]]): The tool choice to use.

    Returns:
        ModelResponse: The chat completion response from the API.

    Raises:
        ModelProviderError: On any API failure, chained from the SDK exception.
    """
    try:
        # NOTE(review): recorded before the request is issued on this
        # non-streaming path — confirm this is intentional.
        if run_response and run_response.metrics:
            run_response.metrics.set_time_to_first_token()

        # Timer brackets the full awaited round trip to the provider.
        assistant_message.metrics.start_timer()
        response = await self.get_async_client().chat.completions.create(
            model=self.id,
            messages=[self._format_message(m) for m in messages],  # type: ignore
            **self.get_request_params(
                response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
            ),
        )
        assistant_message.metrics.stop_timer()

        # Parse the response into an Agno ModelResponse object
        provider_response: ModelResponse = self._parse_provider_response(response, response_format=response_format)

        return provider_response

    except RateLimitError as e:
        log_error(f"Rate limit error from OpenAI API: {e}")
        # Rate-limit bodies are assumed to be JSON with an "error" object.
        error_message = e.response.json().get("error", {})
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except APIConnectionError as e:
        log_error(f"API connection error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
    except APIStatusError as e:
        log_error(f"API status error from OpenAI API: {e}")
        # The error body may not be JSON; fall back to the raw response text.
        try:
            error_message = e.response.json().get("error", {})
        except Exception:
            error_message = e.response.text
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except Exception as e:
        # Catch-all boundary: wrap anything unexpected in the provider error type.
        log_error(f"Error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
|
|
511
|
+
|
|
512
|
+
def invoke_stream(
    self,
    messages: List[Message],
    assistant_message: Message,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    tools: Optional[List[Dict[str, Any]]] = None,
    tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
    run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
) -> Iterator[ModelResponse]:
    """
    Send a streaming chat completion request to the OpenAI API.

    This is a generator: the request is only issued once iteration begins,
    and the assistant message timer only stops if the stream is fully
    consumed.

    Args:
        messages (List[Message]): A list of messages to send to the model.
        assistant_message (Message): The assistant message whose metrics
            timer brackets the stream.
        response_format (Optional[Union[Dict, Type[BaseModel]]]): The response format to use.
        tools (Optional[List[Dict[str, Any]]]): The tools to use.
        tool_choice (Optional[Union[str, Dict[str, Any]]]): The tool choice to use.

    Returns:
        Iterator[ModelResponse]: An iterator of model responses.

    Raises:
        ModelProviderError: On any API failure, chained from the SDK exception.
    """

    try:
        if run_response and run_response.metrics:
            run_response.metrics.set_time_to_first_token()

        assistant_message.metrics.start_timer()

        # include_usage makes the provider emit a final usage-only chunk,
        # which _parse_provider_response_delta converts into metrics.
        for chunk in self.get_client().chat.completions.create(
            model=self.id,
            messages=[self._format_message(m) for m in messages],  # type: ignore
            stream=True,
            stream_options={"include_usage": True},
            **self.get_request_params(
                response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
            ),
        ):
            yield self._parse_provider_response_delta(chunk)

        assistant_message.metrics.stop_timer()

    except RateLimitError as e:
        log_error(f"Rate limit error from OpenAI API: {e}")
        # Rate-limit bodies are assumed to be JSON with an "error" object.
        error_message = e.response.json().get("error", {})
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except APIConnectionError as e:
        log_error(f"API connection error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
    except APIStatusError as e:
        log_error(f"API status error from OpenAI API: {e}")
        # The error body may not be JSON; fall back to the raw response text.
        try:
            error_message = e.response.json().get("error", {})
        except Exception:
            error_message = e.response.text
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except Exception as e:
        # Catch-all boundary: wrap anything unexpected in the provider error type.
        log_error(f"Error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
|
|
587
|
+
|
|
588
|
+
async def ainvoke_stream(
    self,
    messages: List[Message],
    assistant_message: Message,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    tools: Optional[List[Dict[str, Any]]] = None,
    tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
    run_response: Optional[Union[RunOutput, TeamRunOutput]] = None,
) -> AsyncIterator[ModelResponse]:
    """
    Sends an asynchronous streaming chat completion request to the OpenAI API.

    Async generator counterpart of `invoke_stream`; the assistant message
    timer only stops if the stream is fully consumed.

    Args:
        messages (List[Message]): A list of messages to send to the model.
        assistant_message (Message): The assistant message whose metrics
            timer brackets the stream.
        response_format (Optional[Union[Dict, Type[BaseModel]]]): The response format to use.
        tools (Optional[List[Dict[str, Any]]]): The tools to use.
        tool_choice (Optional[Union[str, Dict[str, Any]]]): The tool choice to use.

    Returns:
        Any: An asynchronous iterator of model responses.

    Raises:
        ModelProviderError: On any API failure, chained from the SDK exception.
    """

    try:
        if run_response and run_response.metrics:
            run_response.metrics.set_time_to_first_token()

        assistant_message.metrics.start_timer()

        # include_usage makes the provider emit a final usage-only chunk,
        # which _parse_provider_response_delta converts into metrics.
        async_stream = await self.get_async_client().chat.completions.create(
            model=self.id,
            messages=[self._format_message(m) for m in messages],  # type: ignore
            stream=True,
            stream_options={"include_usage": True},
            **self.get_request_params(
                response_format=response_format, tools=tools, tool_choice=tool_choice, run_response=run_response
            ),
        )

        async for chunk in async_stream:
            yield self._parse_provider_response_delta(chunk)

        assistant_message.metrics.stop_timer()

    except RateLimitError as e:
        log_error(f"Rate limit error from OpenAI API: {e}")
        # Rate-limit bodies are assumed to be JSON with an "error" object.
        error_message = e.response.json().get("error", {})
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except APIConnectionError as e:
        log_error(f"API connection error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
    except APIStatusError as e:
        log_error(f"API status error from OpenAI API: {e}")
        # The error body may not be JSON; fall back to the raw response text.
        try:
            error_message = e.response.json().get("error", {})
        except Exception:
            error_message = e.response.text
        error_message = (
            error_message.get("message", "Unknown model error")
            if isinstance(error_message, dict)
            else error_message
        )
        raise ModelProviderError(
            message=error_message,
            status_code=e.response.status_code,
            model_name=self.name,
            model_id=self.id,
        ) from e
    except Exception as e:
        # Catch-all boundary: wrap anything unexpected in the provider error type.
        log_error(f"Error from OpenAI API: {e}")
        raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
|
|
665
|
+
|
|
666
|
+
@staticmethod
|
|
667
|
+
def parse_tool_calls(tool_calls_data: List[ChoiceDeltaToolCall]) -> List[Dict[str, Any]]:
|
|
668
|
+
"""
|
|
669
|
+
Build tool calls from streamed tool call data.
|
|
670
|
+
|
|
671
|
+
Args:
|
|
672
|
+
tool_calls_data (List[ChoiceDeltaToolCall]): The tool call data to build from.
|
|
673
|
+
|
|
674
|
+
Returns:
|
|
675
|
+
List[Dict[str, Any]]: The built tool calls.
|
|
676
|
+
"""
|
|
677
|
+
tool_calls: List[Dict[str, Any]] = []
|
|
678
|
+
for _tool_call in tool_calls_data:
|
|
679
|
+
_index = _tool_call.index or 0
|
|
680
|
+
_tool_call_id = _tool_call.id
|
|
681
|
+
_tool_call_type = _tool_call.type
|
|
682
|
+
_function_name = _tool_call.function.name if _tool_call.function else None
|
|
683
|
+
_function_arguments = _tool_call.function.arguments if _tool_call.function else None
|
|
684
|
+
|
|
685
|
+
if len(tool_calls) <= _index:
|
|
686
|
+
tool_calls.extend([{}] * (_index - len(tool_calls) + 1))
|
|
687
|
+
tool_call_entry = tool_calls[_index]
|
|
688
|
+
if not tool_call_entry:
|
|
689
|
+
tool_call_entry["id"] = _tool_call_id
|
|
690
|
+
tool_call_entry["type"] = _tool_call_type
|
|
691
|
+
tool_call_entry["function"] = {
|
|
692
|
+
"name": _function_name or "",
|
|
693
|
+
"arguments": _function_arguments or "",
|
|
694
|
+
}
|
|
695
|
+
else:
|
|
696
|
+
if _function_name:
|
|
697
|
+
tool_call_entry["function"]["name"] += _function_name
|
|
698
|
+
if _function_arguments:
|
|
699
|
+
tool_call_entry["function"]["arguments"] += _function_arguments
|
|
700
|
+
if _tool_call_id:
|
|
701
|
+
tool_call_entry["id"] = _tool_call_id
|
|
702
|
+
if _tool_call_type:
|
|
703
|
+
tool_call_entry["type"] = _tool_call_type
|
|
704
|
+
return tool_calls
|
|
705
|
+
|
|
706
|
+
def _parse_provider_response(
    self,
    response: ChatCompletion,
    response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
) -> ModelResponse:
    """
    Parse the OpenAI response into a ModelResponse.

    Args:
        response (ChatCompletion): The raw completion returned by the API.
        response_format: The requested response format (not read by this
            method; kept for signature symmetry with callers).

    Returns:
        ModelResponse: The parsed response.

    Raises:
        ModelProviderError: If the provider embedded an error payload in the
            response body.
    """
    model_response = ModelResponse()

    # Some OpenAI-compatible providers report failures inside the response
    # body instead of via an HTTP error status.
    if hasattr(response, "error") and response.error:  # type: ignore
        raise ModelProviderError(
            message=response.error.get("message", "Unknown model error"),  # type: ignore
            model_name=self.name,
            model_id=self.id,
        )

    # Get response message
    response_message = response.choices[0].message

    # Add role
    if response_message.role is not None:
        model_response.role = response_message.role

    # Add content
    if response_message.content is not None:
        model_response.content = response_message.content

    # Extract thinking content before any structured parsing
    # (e.g. inline reasoning blocks emitted by reasoning models).
    if model_response.content:
        reasoning_content, output_content = extract_thinking_content(model_response.content)
        if reasoning_content:
            model_response.reasoning_content = reasoning_content
            model_response.content = output_content
    # Add tool calls
    if response_message.tool_calls is not None and len(response_message.tool_calls) > 0:
        try:
            model_response.tool_calls = [t.model_dump() for t in response_message.tool_calls]
        except Exception as e:
            # Best-effort: a malformed tool call should not fail the whole response.
            log_warning(f"Error processing tool calls: {e}")

    # Add audio transcript to content if available
    response_audio: Optional[ChatCompletionAudio] = response_message.audio
    if response_audio and response_audio.transcript and not model_response.content:
        model_response.content = response_audio.transcript

    # Add audio if present
    if hasattr(response_message, "audio") and response_message.audio is not None:
        # If the audio output modality is requested, we can extract an audio response
        try:
            # The audio payload may arrive as a dict (some compatible providers)
            # or as a typed SDK object.
            if isinstance(response_message.audio, dict):
                model_response.audio = Audio(
                    id=response_message.audio.get("id"),
                    content=response_message.audio.get("data"),
                    expires_at=response_message.audio.get("expires_at"),
                    transcript=response_message.audio.get("transcript"),
                )
            else:
                model_response.audio = Audio(
                    id=response_message.audio.id,
                    content=response_message.audio.data,
                    expires_at=response_message.audio.expires_at,
                    transcript=response_message.audio.transcript,
                )
        except Exception as e:
            # Best-effort: audio parsing failures are logged, not raised.
            log_warning(f"Error processing audio: {e}")

    # Providers that return an explicit reasoning_content field take precedence
    # over nothing, but note content-embedded reasoning was already extracted above.
    if hasattr(response_message, "reasoning_content") and response_message.reasoning_content is not None:  # type: ignore
        model_response.reasoning_content = response_message.reasoning_content  # type: ignore

    if response.usage is not None:
        model_response.response_usage = self._get_metrics(response.usage)

    return model_response
|
|
780
|
+
|
|
781
|
+
def _parse_provider_response_delta(self, response_delta: ChatCompletionChunk) -> ModelResponse:
    """
    Parse the OpenAI streaming response into a ModelResponse.

    Args:
        response_delta: Raw response chunk from OpenAI

    Returns:
        ModelResponse: Parsed response data
    """
    model_response = ModelResponse()

    # Usage-only chunks (from stream_options include_usage) have no choices;
    # they are handled at the bottom of this method.
    if response_delta.choices and len(response_delta.choices) > 0:
        choice_delta: ChoiceDelta = response_delta.choices[0].delta

        if choice_delta:
            # Add content
            if choice_delta.content is not None:
                model_response.content = choice_delta.content

            # Add tool calls
            if choice_delta.tool_calls is not None:
                model_response.tool_calls = choice_delta.tool_calls  # type: ignore

            # Some providers stream reasoning in a dedicated field.
            if hasattr(choice_delta, "reasoning_content") and choice_delta.reasoning_content is not None:
                model_response.reasoning_content = choice_delta.reasoning_content

            # Add audio if present
            if hasattr(choice_delta, "audio") and choice_delta.audio is not None:
                try:
                    audio_data = None
                    audio_id = None
                    audio_expires_at = None
                    audio_transcript = None

                    # The audio payload may arrive as a dict or a typed object.
                    if isinstance(choice_delta.audio, dict):
                        audio_data = choice_delta.audio.get("data")
                        audio_id = choice_delta.audio.get("id")
                        audio_expires_at = choice_delta.audio.get("expires_at")
                        audio_transcript = choice_delta.audio.get("transcript")
                    else:
                        audio_data = choice_delta.audio.data
                        audio_id = choice_delta.audio.id
                        audio_expires_at = choice_delta.audio.expires_at
                        audio_transcript = choice_delta.audio.transcript

                    # Only create Audio object if there's actual content
                    # NOTE(review): sample_rate/mime_type are hardcoded —
                    # assumes OpenAI streams pcm16 at 24 kHz; confirm.
                    if audio_data is not None:
                        model_response.audio = Audio(
                            id=audio_id,
                            content=audio_data,
                            expires_at=audio_expires_at,
                            transcript=audio_transcript,
                            sample_rate=24000,
                            mime_type="pcm16",
                        )
                    # If no content but there's transcript/metadata, create minimal Audio object
                    elif audio_transcript is not None or audio_id is not None:
                        model_response.audio = Audio(
                            id=audio_id or str(uuid4()),
                            content=b"",
                            expires_at=audio_expires_at,
                            transcript=audio_transcript,
                            sample_rate=24000,
                            mime_type="pcm16",
                        )
                except Exception as e:
                    # Best-effort: audio parsing failures are logged, not raised.
                    log_warning(f"Error processing audio: {e}")

    # Add usage metrics if present
    if response_delta.usage is not None:
        model_response.response_usage = self._get_metrics(response_delta.usage)

    return model_response
|
|
855
|
+
|
|
856
|
+
def _get_metrics(self, response_usage: CompletionUsage) -> Metrics:
    """
    Parse the given OpenAI-specific usage into an Agno Metrics object.

    Top-level token counts are copied directly; audio/cache/reasoning
    breakdowns are filled in only when the provider supplies the optional
    detail sub-objects. Missing counts default to 0.

    Args:
        response_usage: Usage data from OpenAI

    Returns:
        Metrics: Parsed metrics data
    """
    parsed = Metrics()

    parsed.input_tokens = response_usage.prompt_tokens or 0
    parsed.output_tokens = response_usage.completion_tokens or 0
    parsed.total_tokens = response_usage.total_tokens or 0

    # Optional per-prompt breakdown (audio + cached tokens).
    input_details = response_usage.prompt_tokens_details
    if input_details:
        parsed.audio_input_tokens = input_details.audio_tokens or 0
        parsed.cache_read_tokens = input_details.cached_tokens or 0

    # Optional per-completion breakdown (audio + reasoning tokens).
    output_details = response_usage.completion_tokens_details
    if output_details:
        parsed.audio_output_tokens = output_details.audio_tokens or 0
        parsed.reasoning_tokens = output_details.reasoning_tokens or 0

    return parsed
|