agno 0.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (723)
  1. agno/__init__.py +8 -0
  2. agno/agent/__init__.py +44 -5
  3. agno/agent/agent.py +10531 -2975
  4. agno/api/agent.py +14 -53
  5. agno/api/api.py +7 -46
  6. agno/api/evals.py +22 -0
  7. agno/api/os.py +17 -0
  8. agno/api/routes.py +6 -25
  9. agno/api/schemas/__init__.py +9 -0
  10. agno/api/schemas/agent.py +6 -9
  11. agno/api/schemas/evals.py +16 -0
  12. agno/api/schemas/os.py +14 -0
  13. agno/api/schemas/team.py +10 -10
  14. agno/api/schemas/utils.py +21 -0
  15. agno/api/schemas/workflows.py +16 -0
  16. agno/api/settings.py +53 -0
  17. agno/api/team.py +22 -26
  18. agno/api/workflow.py +28 -0
  19. agno/cloud/aws/base.py +214 -0
  20. agno/cloud/aws/s3/__init__.py +2 -0
  21. agno/cloud/aws/s3/api_client.py +43 -0
  22. agno/cloud/aws/s3/bucket.py +195 -0
  23. agno/cloud/aws/s3/object.py +57 -0
  24. agno/compression/__init__.py +3 -0
  25. agno/compression/manager.py +247 -0
  26. agno/culture/__init__.py +3 -0
  27. agno/culture/manager.py +956 -0
  28. agno/db/__init__.py +24 -0
  29. agno/db/async_postgres/__init__.py +3 -0
  30. agno/db/base.py +946 -0
  31. agno/db/dynamo/__init__.py +3 -0
  32. agno/db/dynamo/dynamo.py +2781 -0
  33. agno/db/dynamo/schemas.py +442 -0
  34. agno/db/dynamo/utils.py +743 -0
  35. agno/db/firestore/__init__.py +3 -0
  36. agno/db/firestore/firestore.py +2379 -0
  37. agno/db/firestore/schemas.py +181 -0
  38. agno/db/firestore/utils.py +376 -0
  39. agno/db/gcs_json/__init__.py +3 -0
  40. agno/db/gcs_json/gcs_json_db.py +1791 -0
  41. agno/db/gcs_json/utils.py +228 -0
  42. agno/db/in_memory/__init__.py +3 -0
  43. agno/db/in_memory/in_memory_db.py +1312 -0
  44. agno/db/in_memory/utils.py +230 -0
  45. agno/db/json/__init__.py +3 -0
  46. agno/db/json/json_db.py +1777 -0
  47. agno/db/json/utils.py +230 -0
  48. agno/db/migrations/manager.py +199 -0
  49. agno/db/migrations/v1_to_v2.py +635 -0
  50. agno/db/migrations/versions/v2_3_0.py +938 -0
  51. agno/db/mongo/__init__.py +17 -0
  52. agno/db/mongo/async_mongo.py +2760 -0
  53. agno/db/mongo/mongo.py +2597 -0
  54. agno/db/mongo/schemas.py +119 -0
  55. agno/db/mongo/utils.py +276 -0
  56. agno/db/mysql/__init__.py +4 -0
  57. agno/db/mysql/async_mysql.py +2912 -0
  58. agno/db/mysql/mysql.py +2923 -0
  59. agno/db/mysql/schemas.py +186 -0
  60. agno/db/mysql/utils.py +488 -0
  61. agno/db/postgres/__init__.py +4 -0
  62. agno/db/postgres/async_postgres.py +2579 -0
  63. agno/db/postgres/postgres.py +2870 -0
  64. agno/db/postgres/schemas.py +187 -0
  65. agno/db/postgres/utils.py +442 -0
  66. agno/db/redis/__init__.py +3 -0
  67. agno/db/redis/redis.py +2141 -0
  68. agno/db/redis/schemas.py +159 -0
  69. agno/db/redis/utils.py +346 -0
  70. agno/db/schemas/__init__.py +4 -0
  71. agno/db/schemas/culture.py +120 -0
  72. agno/db/schemas/evals.py +34 -0
  73. agno/db/schemas/knowledge.py +40 -0
  74. agno/db/schemas/memory.py +61 -0
  75. agno/db/singlestore/__init__.py +3 -0
  76. agno/db/singlestore/schemas.py +179 -0
  77. agno/db/singlestore/singlestore.py +2877 -0
  78. agno/db/singlestore/utils.py +384 -0
  79. agno/db/sqlite/__init__.py +4 -0
  80. agno/db/sqlite/async_sqlite.py +2911 -0
  81. agno/db/sqlite/schemas.py +181 -0
  82. agno/db/sqlite/sqlite.py +2908 -0
  83. agno/db/sqlite/utils.py +429 -0
  84. agno/db/surrealdb/__init__.py +3 -0
  85. agno/db/surrealdb/metrics.py +292 -0
  86. agno/db/surrealdb/models.py +334 -0
  87. agno/db/surrealdb/queries.py +71 -0
  88. agno/db/surrealdb/surrealdb.py +1908 -0
  89. agno/db/surrealdb/utils.py +147 -0
  90. agno/db/utils.py +118 -0
  91. agno/eval/__init__.py +24 -0
  92. agno/eval/accuracy.py +666 -276
  93. agno/eval/agent_as_judge.py +861 -0
  94. agno/eval/base.py +29 -0
  95. agno/eval/performance.py +779 -0
  96. agno/eval/reliability.py +241 -62
  97. agno/eval/utils.py +120 -0
  98. agno/exceptions.py +143 -1
  99. agno/filters.py +354 -0
  100. agno/guardrails/__init__.py +6 -0
  101. agno/guardrails/base.py +19 -0
  102. agno/guardrails/openai.py +144 -0
  103. agno/guardrails/pii.py +94 -0
  104. agno/guardrails/prompt_injection.py +52 -0
  105. agno/hooks/__init__.py +3 -0
  106. agno/hooks/decorator.py +164 -0
  107. agno/integrations/discord/__init__.py +3 -0
  108. agno/integrations/discord/client.py +203 -0
  109. agno/knowledge/__init__.py +5 -1
  110. agno/{document → knowledge}/chunking/agentic.py +22 -14
  111. agno/{document → knowledge}/chunking/document.py +2 -2
  112. agno/{document → knowledge}/chunking/fixed.py +7 -6
  113. agno/knowledge/chunking/markdown.py +151 -0
  114. agno/{document → knowledge}/chunking/recursive.py +15 -3
  115. agno/knowledge/chunking/row.py +39 -0
  116. agno/knowledge/chunking/semantic.py +91 -0
  117. agno/knowledge/chunking/strategy.py +165 -0
  118. agno/knowledge/content.py +74 -0
  119. agno/knowledge/document/__init__.py +5 -0
  120. agno/{document → knowledge/document}/base.py +12 -2
  121. agno/knowledge/embedder/__init__.py +5 -0
  122. agno/knowledge/embedder/aws_bedrock.py +343 -0
  123. agno/knowledge/embedder/azure_openai.py +210 -0
  124. agno/{embedder → knowledge/embedder}/base.py +8 -0
  125. agno/knowledge/embedder/cohere.py +323 -0
  126. agno/knowledge/embedder/fastembed.py +62 -0
  127. agno/{embedder → knowledge/embedder}/fireworks.py +1 -1
  128. agno/knowledge/embedder/google.py +258 -0
  129. agno/knowledge/embedder/huggingface.py +94 -0
  130. agno/knowledge/embedder/jina.py +182 -0
  131. agno/knowledge/embedder/langdb.py +22 -0
  132. agno/knowledge/embedder/mistral.py +206 -0
  133. agno/knowledge/embedder/nebius.py +13 -0
  134. agno/knowledge/embedder/ollama.py +154 -0
  135. agno/knowledge/embedder/openai.py +195 -0
  136. agno/knowledge/embedder/sentence_transformer.py +63 -0
  137. agno/{embedder → knowledge/embedder}/together.py +1 -1
  138. agno/knowledge/embedder/vllm.py +262 -0
  139. agno/knowledge/embedder/voyageai.py +165 -0
  140. agno/knowledge/knowledge.py +3006 -0
  141. agno/knowledge/reader/__init__.py +7 -0
  142. agno/knowledge/reader/arxiv_reader.py +81 -0
  143. agno/knowledge/reader/base.py +95 -0
  144. agno/knowledge/reader/csv_reader.py +164 -0
  145. agno/knowledge/reader/docx_reader.py +82 -0
  146. agno/knowledge/reader/field_labeled_csv_reader.py +290 -0
  147. agno/knowledge/reader/firecrawl_reader.py +201 -0
  148. agno/knowledge/reader/json_reader.py +88 -0
  149. agno/knowledge/reader/markdown_reader.py +137 -0
  150. agno/knowledge/reader/pdf_reader.py +431 -0
  151. agno/knowledge/reader/pptx_reader.py +101 -0
  152. agno/knowledge/reader/reader_factory.py +313 -0
  153. agno/knowledge/reader/s3_reader.py +89 -0
  154. agno/knowledge/reader/tavily_reader.py +193 -0
  155. agno/knowledge/reader/text_reader.py +127 -0
  156. agno/knowledge/reader/web_search_reader.py +325 -0
  157. agno/knowledge/reader/website_reader.py +455 -0
  158. agno/knowledge/reader/wikipedia_reader.py +91 -0
  159. agno/knowledge/reader/youtube_reader.py +78 -0
  160. agno/knowledge/remote_content/remote_content.py +88 -0
  161. agno/knowledge/reranker/__init__.py +3 -0
  162. agno/{reranker → knowledge/reranker}/base.py +1 -1
  163. agno/{reranker → knowledge/reranker}/cohere.py +2 -2
  164. agno/knowledge/reranker/infinity.py +195 -0
  165. agno/knowledge/reranker/sentence_transformer.py +54 -0
  166. agno/knowledge/types.py +39 -0
  167. agno/knowledge/utils.py +234 -0
  168. agno/media.py +439 -95
  169. agno/memory/__init__.py +16 -3
  170. agno/memory/manager.py +1474 -123
  171. agno/memory/strategies/__init__.py +15 -0
  172. agno/memory/strategies/base.py +66 -0
  173. agno/memory/strategies/summarize.py +196 -0
  174. agno/memory/strategies/types.py +37 -0
  175. agno/models/aimlapi/__init__.py +5 -0
  176. agno/models/aimlapi/aimlapi.py +62 -0
  177. agno/models/anthropic/__init__.py +4 -0
  178. agno/models/anthropic/claude.py +960 -496
  179. agno/models/aws/__init__.py +15 -0
  180. agno/models/aws/bedrock.py +686 -451
  181. agno/models/aws/claude.py +190 -183
  182. agno/models/azure/__init__.py +18 -1
  183. agno/models/azure/ai_foundry.py +489 -0
  184. agno/models/azure/openai_chat.py +89 -40
  185. agno/models/base.py +2477 -550
  186. agno/models/cerebras/__init__.py +12 -0
  187. agno/models/cerebras/cerebras.py +565 -0
  188. agno/models/cerebras/cerebras_openai.py +131 -0
  189. agno/models/cohere/__init__.py +4 -0
  190. agno/models/cohere/chat.py +306 -492
  191. agno/models/cometapi/__init__.py +5 -0
  192. agno/models/cometapi/cometapi.py +74 -0
  193. agno/models/dashscope/__init__.py +5 -0
  194. agno/models/dashscope/dashscope.py +90 -0
  195. agno/models/deepinfra/__init__.py +5 -0
  196. agno/models/deepinfra/deepinfra.py +45 -0
  197. agno/models/deepseek/__init__.py +4 -0
  198. agno/models/deepseek/deepseek.py +110 -9
  199. agno/models/fireworks/__init__.py +4 -0
  200. agno/models/fireworks/fireworks.py +19 -22
  201. agno/models/google/__init__.py +3 -7
  202. agno/models/google/gemini.py +1717 -662
  203. agno/models/google/utils.py +22 -0
  204. agno/models/groq/__init__.py +4 -0
  205. agno/models/groq/groq.py +391 -666
  206. agno/models/huggingface/__init__.py +4 -0
  207. agno/models/huggingface/huggingface.py +266 -538
  208. agno/models/ibm/__init__.py +5 -0
  209. agno/models/ibm/watsonx.py +432 -0
  210. agno/models/internlm/__init__.py +3 -0
  211. agno/models/internlm/internlm.py +20 -3
  212. agno/models/langdb/__init__.py +1 -0
  213. agno/models/langdb/langdb.py +60 -0
  214. agno/models/litellm/__init__.py +14 -0
  215. agno/models/litellm/chat.py +503 -0
  216. agno/models/litellm/litellm_openai.py +42 -0
  217. agno/models/llama_cpp/__init__.py +5 -0
  218. agno/models/llama_cpp/llama_cpp.py +22 -0
  219. agno/models/lmstudio/__init__.py +5 -0
  220. agno/models/lmstudio/lmstudio.py +25 -0
  221. agno/models/message.py +361 -39
  222. agno/models/meta/__init__.py +12 -0
  223. agno/models/meta/llama.py +502 -0
  224. agno/models/meta/llama_openai.py +79 -0
  225. agno/models/metrics.py +120 -0
  226. agno/models/mistral/__init__.py +4 -0
  227. agno/models/mistral/mistral.py +293 -393
  228. agno/models/nebius/__init__.py +3 -0
  229. agno/models/nebius/nebius.py +53 -0
  230. agno/models/nexus/__init__.py +3 -0
  231. agno/models/nexus/nexus.py +22 -0
  232. agno/models/nvidia/__init__.py +4 -0
  233. agno/models/nvidia/nvidia.py +22 -3
  234. agno/models/ollama/__init__.py +4 -2
  235. agno/models/ollama/chat.py +257 -492
  236. agno/models/openai/__init__.py +7 -0
  237. agno/models/openai/chat.py +725 -770
  238. agno/models/openai/like.py +16 -2
  239. agno/models/openai/responses.py +1121 -0
  240. agno/models/openrouter/__init__.py +4 -0
  241. agno/models/openrouter/openrouter.py +62 -5
  242. agno/models/perplexity/__init__.py +5 -0
  243. agno/models/perplexity/perplexity.py +203 -0
  244. agno/models/portkey/__init__.py +3 -0
  245. agno/models/portkey/portkey.py +82 -0
  246. agno/models/requesty/__init__.py +5 -0
  247. agno/models/requesty/requesty.py +69 -0
  248. agno/models/response.py +177 -7
  249. agno/models/sambanova/__init__.py +4 -0
  250. agno/models/sambanova/sambanova.py +23 -4
  251. agno/models/siliconflow/__init__.py +5 -0
  252. agno/models/siliconflow/siliconflow.py +42 -0
  253. agno/models/together/__init__.py +4 -0
  254. agno/models/together/together.py +21 -164
  255. agno/models/utils.py +266 -0
  256. agno/models/vercel/__init__.py +3 -0
  257. agno/models/vercel/v0.py +43 -0
  258. agno/models/vertexai/__init__.py +0 -1
  259. agno/models/vertexai/claude.py +190 -0
  260. agno/models/vllm/__init__.py +3 -0
  261. agno/models/vllm/vllm.py +83 -0
  262. agno/models/xai/__init__.py +2 -0
  263. agno/models/xai/xai.py +111 -7
  264. agno/os/__init__.py +3 -0
  265. agno/os/app.py +1027 -0
  266. agno/os/auth.py +244 -0
  267. agno/os/config.py +126 -0
  268. agno/os/interfaces/__init__.py +1 -0
  269. agno/os/interfaces/a2a/__init__.py +3 -0
  270. agno/os/interfaces/a2a/a2a.py +42 -0
  271. agno/os/interfaces/a2a/router.py +249 -0
  272. agno/os/interfaces/a2a/utils.py +924 -0
  273. agno/os/interfaces/agui/__init__.py +3 -0
  274. agno/os/interfaces/agui/agui.py +47 -0
  275. agno/os/interfaces/agui/router.py +147 -0
  276. agno/os/interfaces/agui/utils.py +574 -0
  277. agno/os/interfaces/base.py +25 -0
  278. agno/os/interfaces/slack/__init__.py +3 -0
  279. agno/os/interfaces/slack/router.py +148 -0
  280. agno/os/interfaces/slack/security.py +30 -0
  281. agno/os/interfaces/slack/slack.py +47 -0
  282. agno/os/interfaces/whatsapp/__init__.py +3 -0
  283. agno/os/interfaces/whatsapp/router.py +210 -0
  284. agno/os/interfaces/whatsapp/security.py +55 -0
  285. agno/os/interfaces/whatsapp/whatsapp.py +36 -0
  286. agno/os/mcp.py +293 -0
  287. agno/os/middleware/__init__.py +9 -0
  288. agno/os/middleware/jwt.py +797 -0
  289. agno/os/router.py +258 -0
  290. agno/os/routers/__init__.py +3 -0
  291. agno/os/routers/agents/__init__.py +3 -0
  292. agno/os/routers/agents/router.py +599 -0
  293. agno/os/routers/agents/schema.py +261 -0
  294. agno/os/routers/evals/__init__.py +3 -0
  295. agno/os/routers/evals/evals.py +450 -0
  296. agno/os/routers/evals/schemas.py +174 -0
  297. agno/os/routers/evals/utils.py +231 -0
  298. agno/os/routers/health.py +31 -0
  299. agno/os/routers/home.py +52 -0
  300. agno/os/routers/knowledge/__init__.py +3 -0
  301. agno/os/routers/knowledge/knowledge.py +1008 -0
  302. agno/os/routers/knowledge/schemas.py +178 -0
  303. agno/os/routers/memory/__init__.py +3 -0
  304. agno/os/routers/memory/memory.py +661 -0
  305. agno/os/routers/memory/schemas.py +88 -0
  306. agno/os/routers/metrics/__init__.py +3 -0
  307. agno/os/routers/metrics/metrics.py +190 -0
  308. agno/os/routers/metrics/schemas.py +47 -0
  309. agno/os/routers/session/__init__.py +3 -0
  310. agno/os/routers/session/session.py +997 -0
  311. agno/os/routers/teams/__init__.py +3 -0
  312. agno/os/routers/teams/router.py +512 -0
  313. agno/os/routers/teams/schema.py +257 -0
  314. agno/os/routers/traces/__init__.py +3 -0
  315. agno/os/routers/traces/schemas.py +414 -0
  316. agno/os/routers/traces/traces.py +499 -0
  317. agno/os/routers/workflows/__init__.py +3 -0
  318. agno/os/routers/workflows/router.py +624 -0
  319. agno/os/routers/workflows/schema.py +75 -0
  320. agno/os/schema.py +534 -0
  321. agno/os/scopes.py +469 -0
  322. agno/{playground → os}/settings.py +7 -15
  323. agno/os/utils.py +973 -0
  324. agno/reasoning/anthropic.py +80 -0
  325. agno/reasoning/azure_ai_foundry.py +67 -0
  326. agno/reasoning/deepseek.py +63 -0
  327. agno/reasoning/default.py +97 -0
  328. agno/reasoning/gemini.py +73 -0
  329. agno/reasoning/groq.py +71 -0
  330. agno/reasoning/helpers.py +24 -1
  331. agno/reasoning/ollama.py +67 -0
  332. agno/reasoning/openai.py +86 -0
  333. agno/reasoning/step.py +2 -1
  334. agno/reasoning/vertexai.py +76 -0
  335. agno/run/__init__.py +6 -0
  336. agno/run/agent.py +822 -0
  337. agno/run/base.py +247 -0
  338. agno/run/cancel.py +81 -0
  339. agno/run/requirement.py +181 -0
  340. agno/run/team.py +767 -0
  341. agno/run/workflow.py +708 -0
  342. agno/session/__init__.py +10 -0
  343. agno/session/agent.py +260 -0
  344. agno/session/summary.py +265 -0
  345. agno/session/team.py +342 -0
  346. agno/session/workflow.py +501 -0
  347. agno/table.py +10 -0
  348. agno/team/__init__.py +37 -0
  349. agno/team/team.py +9536 -0
  350. agno/tools/__init__.py +7 -0
  351. agno/tools/agentql.py +120 -0
  352. agno/tools/airflow.py +22 -12
  353. agno/tools/api.py +122 -0
  354. agno/tools/apify.py +276 -83
  355. agno/tools/{arxiv_toolkit.py → arxiv.py} +20 -12
  356. agno/tools/aws_lambda.py +28 -7
  357. agno/tools/aws_ses.py +66 -0
  358. agno/tools/baidusearch.py +11 -4
  359. agno/tools/bitbucket.py +292 -0
  360. agno/tools/brandfetch.py +213 -0
  361. agno/tools/bravesearch.py +106 -0
  362. agno/tools/brightdata.py +367 -0
  363. agno/tools/browserbase.py +209 -0
  364. agno/tools/calcom.py +32 -23
  365. agno/tools/calculator.py +24 -37
  366. agno/tools/cartesia.py +187 -0
  367. agno/tools/{clickup_tool.py → clickup.py} +17 -28
  368. agno/tools/confluence.py +91 -26
  369. agno/tools/crawl4ai.py +139 -43
  370. agno/tools/csv_toolkit.py +28 -22
  371. agno/tools/dalle.py +36 -22
  372. agno/tools/daytona.py +475 -0
  373. agno/tools/decorator.py +169 -14
  374. agno/tools/desi_vocal.py +23 -11
  375. agno/tools/discord.py +32 -29
  376. agno/tools/docker.py +716 -0
  377. agno/tools/duckdb.py +76 -81
  378. agno/tools/duckduckgo.py +43 -40
  379. agno/tools/e2b.py +703 -0
  380. agno/tools/eleven_labs.py +65 -54
  381. agno/tools/email.py +13 -5
  382. agno/tools/evm.py +129 -0
  383. agno/tools/exa.py +324 -42
  384. agno/tools/fal.py +39 -35
  385. agno/tools/file.py +196 -30
  386. agno/tools/file_generation.py +356 -0
  387. agno/tools/financial_datasets.py +288 -0
  388. agno/tools/firecrawl.py +108 -33
  389. agno/tools/function.py +960 -122
  390. agno/tools/giphy.py +34 -12
  391. agno/tools/github.py +1294 -97
  392. agno/tools/gmail.py +922 -0
  393. agno/tools/google_bigquery.py +117 -0
  394. agno/tools/google_drive.py +271 -0
  395. agno/tools/google_maps.py +253 -0
  396. agno/tools/googlecalendar.py +607 -107
  397. agno/tools/googlesheets.py +377 -0
  398. agno/tools/hackernews.py +20 -12
  399. agno/tools/jina.py +24 -14
  400. agno/tools/jira.py +48 -19
  401. agno/tools/knowledge.py +218 -0
  402. agno/tools/linear.py +82 -43
  403. agno/tools/linkup.py +58 -0
  404. agno/tools/local_file_system.py +15 -7
  405. agno/tools/lumalab.py +41 -26
  406. agno/tools/mcp/__init__.py +10 -0
  407. agno/tools/mcp/mcp.py +331 -0
  408. agno/tools/mcp/multi_mcp.py +347 -0
  409. agno/tools/mcp/params.py +24 -0
  410. agno/tools/mcp_toolbox.py +284 -0
  411. agno/tools/mem0.py +193 -0
  412. agno/tools/memory.py +419 -0
  413. agno/tools/mlx_transcribe.py +11 -9
  414. agno/tools/models/azure_openai.py +190 -0
  415. agno/tools/models/gemini.py +203 -0
  416. agno/tools/models/groq.py +158 -0
  417. agno/tools/models/morph.py +186 -0
  418. agno/tools/models/nebius.py +124 -0
  419. agno/tools/models_labs.py +163 -82
  420. agno/tools/moviepy_video.py +18 -13
  421. agno/tools/nano_banana.py +151 -0
  422. agno/tools/neo4j.py +134 -0
  423. agno/tools/newspaper.py +15 -4
  424. agno/tools/newspaper4k.py +19 -6
  425. agno/tools/notion.py +204 -0
  426. agno/tools/openai.py +181 -17
  427. agno/tools/openbb.py +27 -20
  428. agno/tools/opencv.py +321 -0
  429. agno/tools/openweather.py +233 -0
  430. agno/tools/oxylabs.py +385 -0
  431. agno/tools/pandas.py +25 -15
  432. agno/tools/parallel.py +314 -0
  433. agno/tools/postgres.py +238 -185
  434. agno/tools/pubmed.py +125 -13
  435. agno/tools/python.py +48 -35
  436. agno/tools/reasoning.py +283 -0
  437. agno/tools/reddit.py +207 -29
  438. agno/tools/redshift.py +406 -0
  439. agno/tools/replicate.py +69 -26
  440. agno/tools/resend.py +11 -6
  441. agno/tools/scrapegraph.py +179 -19
  442. agno/tools/searxng.py +23 -31
  443. agno/tools/serpapi.py +15 -10
  444. agno/tools/serper.py +255 -0
  445. agno/tools/shell.py +23 -12
  446. agno/tools/shopify.py +1519 -0
  447. agno/tools/slack.py +56 -14
  448. agno/tools/sleep.py +8 -6
  449. agno/tools/spider.py +35 -11
  450. agno/tools/spotify.py +919 -0
  451. agno/tools/sql.py +34 -19
  452. agno/tools/tavily.py +158 -8
  453. agno/tools/telegram.py +18 -8
  454. agno/tools/todoist.py +218 -0
  455. agno/tools/toolkit.py +134 -9
  456. agno/tools/trafilatura.py +388 -0
  457. agno/tools/trello.py +25 -28
  458. agno/tools/twilio.py +18 -9
  459. agno/tools/user_control_flow.py +78 -0
  460. agno/tools/valyu.py +228 -0
  461. agno/tools/visualization.py +467 -0
  462. agno/tools/webbrowser.py +28 -0
  463. agno/tools/webex.py +76 -0
  464. agno/tools/website.py +23 -19
  465. agno/tools/webtools.py +45 -0
  466. agno/tools/whatsapp.py +286 -0
  467. agno/tools/wikipedia.py +28 -19
  468. agno/tools/workflow.py +285 -0
  469. agno/tools/{twitter.py → x.py} +142 -46
  470. agno/tools/yfinance.py +41 -39
  471. agno/tools/youtube.py +34 -17
  472. agno/tools/zendesk.py +15 -5
  473. agno/tools/zep.py +454 -0
  474. agno/tools/zoom.py +86 -37
  475. agno/tracing/__init__.py +12 -0
  476. agno/tracing/exporter.py +157 -0
  477. agno/tracing/schemas.py +276 -0
  478. agno/tracing/setup.py +111 -0
  479. agno/utils/agent.py +938 -0
  480. agno/utils/audio.py +37 -1
  481. agno/utils/certs.py +27 -0
  482. agno/utils/code_execution.py +11 -0
  483. agno/utils/common.py +103 -20
  484. agno/utils/cryptography.py +22 -0
  485. agno/utils/dttm.py +33 -0
  486. agno/utils/events.py +700 -0
  487. agno/utils/functions.py +107 -37
  488. agno/utils/gemini.py +426 -0
  489. agno/utils/hooks.py +171 -0
  490. agno/utils/http.py +185 -0
  491. agno/utils/json_schema.py +159 -37
  492. agno/utils/knowledge.py +36 -0
  493. agno/utils/location.py +19 -0
  494. agno/utils/log.py +221 -8
  495. agno/utils/mcp.py +214 -0
  496. agno/utils/media.py +335 -14
  497. agno/utils/merge_dict.py +22 -1
  498. agno/utils/message.py +77 -2
  499. agno/utils/models/ai_foundry.py +50 -0
  500. agno/utils/models/claude.py +373 -0
  501. agno/utils/models/cohere.py +94 -0
  502. agno/utils/models/llama.py +85 -0
  503. agno/utils/models/mistral.py +100 -0
  504. agno/utils/models/openai_responses.py +140 -0
  505. agno/utils/models/schema_utils.py +153 -0
  506. agno/utils/models/watsonx.py +41 -0
  507. agno/utils/openai.py +257 -0
  508. agno/utils/pickle.py +1 -1
  509. agno/utils/pprint.py +124 -8
  510. agno/utils/print_response/agent.py +930 -0
  511. agno/utils/print_response/team.py +1914 -0
  512. agno/utils/print_response/workflow.py +1668 -0
  513. agno/utils/prompts.py +111 -0
  514. agno/utils/reasoning.py +108 -0
  515. agno/utils/response.py +163 -0
  516. agno/utils/serialize.py +32 -0
  517. agno/utils/shell.py +4 -4
  518. agno/utils/streamlit.py +487 -0
  519. agno/utils/string.py +204 -51
  520. agno/utils/team.py +139 -0
  521. agno/utils/timer.py +9 -2
  522. agno/utils/tokens.py +657 -0
  523. agno/utils/tools.py +19 -1
  524. agno/utils/whatsapp.py +305 -0
  525. agno/utils/yaml_io.py +3 -3
  526. agno/vectordb/__init__.py +2 -0
  527. agno/vectordb/base.py +87 -9
  528. agno/vectordb/cassandra/__init__.py +5 -1
  529. agno/vectordb/cassandra/cassandra.py +383 -27
  530. agno/vectordb/chroma/__init__.py +4 -0
  531. agno/vectordb/chroma/chromadb.py +748 -83
  532. agno/vectordb/clickhouse/__init__.py +7 -1
  533. agno/vectordb/clickhouse/clickhousedb.py +554 -53
  534. agno/vectordb/couchbase/__init__.py +3 -0
  535. agno/vectordb/couchbase/couchbase.py +1446 -0
  536. agno/vectordb/lancedb/__init__.py +5 -0
  537. agno/vectordb/lancedb/lance_db.py +730 -98
  538. agno/vectordb/langchaindb/__init__.py +5 -0
  539. agno/vectordb/langchaindb/langchaindb.py +163 -0
  540. agno/vectordb/lightrag/__init__.py +5 -0
  541. agno/vectordb/lightrag/lightrag.py +388 -0
  542. agno/vectordb/llamaindex/__init__.py +3 -0
  543. agno/vectordb/llamaindex/llamaindexdb.py +166 -0
  544. agno/vectordb/milvus/__init__.py +3 -0
  545. agno/vectordb/milvus/milvus.py +966 -78
  546. agno/vectordb/mongodb/__init__.py +9 -1
  547. agno/vectordb/mongodb/mongodb.py +1175 -172
  548. agno/vectordb/pgvector/__init__.py +8 -0
  549. agno/vectordb/pgvector/pgvector.py +599 -115
  550. agno/vectordb/pineconedb/__init__.py +5 -1
  551. agno/vectordb/pineconedb/pineconedb.py +406 -43
  552. agno/vectordb/qdrant/__init__.py +4 -0
  553. agno/vectordb/qdrant/qdrant.py +914 -61
  554. agno/vectordb/redis/__init__.py +9 -0
  555. agno/vectordb/redis/redisdb.py +682 -0
  556. agno/vectordb/singlestore/__init__.py +8 -1
  557. agno/vectordb/singlestore/singlestore.py +771 -0
  558. agno/vectordb/surrealdb/__init__.py +3 -0
  559. agno/vectordb/surrealdb/surrealdb.py +663 -0
  560. agno/vectordb/upstashdb/__init__.py +5 -0
  561. agno/vectordb/upstashdb/upstashdb.py +718 -0
  562. agno/vectordb/weaviate/__init__.py +8 -0
  563. agno/vectordb/weaviate/index.py +15 -0
  564. agno/vectordb/weaviate/weaviate.py +1009 -0
  565. agno/workflow/__init__.py +23 -1
  566. agno/workflow/agent.py +299 -0
  567. agno/workflow/condition.py +759 -0
  568. agno/workflow/loop.py +756 -0
  569. agno/workflow/parallel.py +853 -0
  570. agno/workflow/router.py +723 -0
  571. agno/workflow/step.py +1564 -0
  572. agno/workflow/steps.py +613 -0
  573. agno/workflow/types.py +556 -0
  574. agno/workflow/workflow.py +4327 -514
  575. agno-2.3.13.dist-info/METADATA +639 -0
  576. agno-2.3.13.dist-info/RECORD +613 -0
  577. {agno-0.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +1 -1
  578. agno-2.3.13.dist-info/licenses/LICENSE +201 -0
  579. agno/api/playground.py +0 -91
  580. agno/api/schemas/playground.py +0 -22
  581. agno/api/schemas/user.py +0 -22
  582. agno/api/schemas/workspace.py +0 -46
  583. agno/api/user.py +0 -160
  584. agno/api/workspace.py +0 -151
  585. agno/cli/auth_server.py +0 -118
  586. agno/cli/config.py +0 -275
  587. agno/cli/console.py +0 -88
  588. agno/cli/credentials.py +0 -23
  589. agno/cli/entrypoint.py +0 -571
  590. agno/cli/operator.py +0 -355
  591. agno/cli/settings.py +0 -85
  592. agno/cli/ws/ws_cli.py +0 -817
  593. agno/constants.py +0 -13
  594. agno/document/__init__.py +0 -1
  595. agno/document/chunking/semantic.py +0 -47
  596. agno/document/chunking/strategy.py +0 -31
  597. agno/document/reader/__init__.py +0 -1
  598. agno/document/reader/arxiv_reader.py +0 -41
  599. agno/document/reader/base.py +0 -22
  600. agno/document/reader/csv_reader.py +0 -84
  601. agno/document/reader/docx_reader.py +0 -46
  602. agno/document/reader/firecrawl_reader.py +0 -99
  603. agno/document/reader/json_reader.py +0 -43
  604. agno/document/reader/pdf_reader.py +0 -219
  605. agno/document/reader/s3/pdf_reader.py +0 -46
  606. agno/document/reader/s3/text_reader.py +0 -51
  607. agno/document/reader/text_reader.py +0 -41
  608. agno/document/reader/website_reader.py +0 -175
  609. agno/document/reader/youtube_reader.py +0 -50
  610. agno/embedder/__init__.py +0 -1
  611. agno/embedder/azure_openai.py +0 -86
  612. agno/embedder/cohere.py +0 -72
  613. agno/embedder/fastembed.py +0 -37
  614. agno/embedder/google.py +0 -73
  615. agno/embedder/huggingface.py +0 -54
  616. agno/embedder/mistral.py +0 -80
  617. agno/embedder/ollama.py +0 -57
  618. agno/embedder/openai.py +0 -74
  619. agno/embedder/sentence_transformer.py +0 -38
  620. agno/embedder/voyageai.py +0 -64
  621. agno/eval/perf.py +0 -201
  622. agno/file/__init__.py +0 -1
  623. agno/file/file.py +0 -16
  624. agno/file/local/csv.py +0 -32
  625. agno/file/local/txt.py +0 -19
  626. agno/infra/app.py +0 -240
  627. agno/infra/base.py +0 -144
  628. agno/infra/context.py +0 -20
  629. agno/infra/db_app.py +0 -52
  630. agno/infra/resource.py +0 -205
  631. agno/infra/resources.py +0 -55
  632. agno/knowledge/agent.py +0 -230
  633. agno/knowledge/arxiv.py +0 -22
  634. agno/knowledge/combined.py +0 -22
  635. agno/knowledge/csv.py +0 -28
  636. agno/knowledge/csv_url.py +0 -19
  637. agno/knowledge/document.py +0 -20
  638. agno/knowledge/docx.py +0 -30
  639. agno/knowledge/json.py +0 -28
  640. agno/knowledge/langchain.py +0 -71
  641. agno/knowledge/llamaindex.py +0 -66
  642. agno/knowledge/pdf.py +0 -28
  643. agno/knowledge/pdf_url.py +0 -26
  644. agno/knowledge/s3/base.py +0 -60
  645. agno/knowledge/s3/pdf.py +0 -21
  646. agno/knowledge/s3/text.py +0 -23
  647. agno/knowledge/text.py +0 -30
  648. agno/knowledge/website.py +0 -88
  649. agno/knowledge/wikipedia.py +0 -31
  650. agno/knowledge/youtube.py +0 -22
  651. agno/memory/agent.py +0 -392
  652. agno/memory/classifier.py +0 -104
  653. agno/memory/db/__init__.py +0 -1
  654. agno/memory/db/base.py +0 -42
  655. agno/memory/db/mongodb.py +0 -189
  656. agno/memory/db/postgres.py +0 -203
  657. agno/memory/db/sqlite.py +0 -193
  658. agno/memory/memory.py +0 -15
  659. agno/memory/row.py +0 -36
  660. agno/memory/summarizer.py +0 -192
  661. agno/memory/summary.py +0 -19
  662. agno/memory/workflow.py +0 -38
  663. agno/models/google/gemini_openai.py +0 -26
  664. agno/models/ollama/hermes.py +0 -221
  665. agno/models/ollama/tools.py +0 -362
  666. agno/models/vertexai/gemini.py +0 -595
  667. agno/playground/__init__.py +0 -3
  668. agno/playground/async_router.py +0 -421
  669. agno/playground/deploy.py +0 -249
  670. agno/playground/operator.py +0 -92
  671. agno/playground/playground.py +0 -91
  672. agno/playground/schemas.py +0 -76
  673. agno/playground/serve.py +0 -55
  674. agno/playground/sync_router.py +0 -405
  675. agno/reasoning/agent.py +0 -68
  676. agno/run/response.py +0 -112
  677. agno/storage/agent/__init__.py +0 -0
  678. agno/storage/agent/base.py +0 -38
  679. agno/storage/agent/dynamodb.py +0 -350
  680. agno/storage/agent/json.py +0 -92
  681. agno/storage/agent/mongodb.py +0 -228
  682. agno/storage/agent/postgres.py +0 -367
  683. agno/storage/agent/session.py +0 -79
  684. agno/storage/agent/singlestore.py +0 -303
  685. agno/storage/agent/sqlite.py +0 -357
  686. agno/storage/agent/yaml.py +0 -93
  687. agno/storage/workflow/__init__.py +0 -0
  688. agno/storage/workflow/base.py +0 -40
  689. agno/storage/workflow/mongodb.py +0 -233
  690. agno/storage/workflow/postgres.py +0 -366
  691. agno/storage/workflow/session.py +0 -60
  692. agno/storage/workflow/sqlite.py +0 -359
  693. agno/tools/googlesearch.py +0 -88
  694. agno/utils/defaults.py +0 -57
  695. agno/utils/filesystem.py +0 -39
  696. agno/utils/git.py +0 -52
  697. agno/utils/json_io.py +0 -30
  698. agno/utils/load_env.py +0 -19
  699. agno/utils/py_io.py +0 -19
  700. agno/utils/pyproject.py +0 -18
  701. agno/utils/resource_filter.py +0 -31
  702. agno/vectordb/singlestore/s2vectordb.py +0 -390
  703. agno/vectordb/singlestore/s2vectordb2.py +0 -355
  704. agno/workspace/__init__.py +0 -0
  705. agno/workspace/config.py +0 -325
  706. agno/workspace/enums.py +0 -6
  707. agno/workspace/helpers.py +0 -48
  708. agno/workspace/operator.py +0 -758
  709. agno/workspace/settings.py +0 -63
  710. agno-0.1.2.dist-info/LICENSE +0 -375
  711. agno-0.1.2.dist-info/METADATA +0 -502
  712. agno-0.1.2.dist-info/RECORD +0 -352
  713. agno-0.1.2.dist-info/entry_points.txt +0 -3
  714. /agno/{cli → db/migrations}/__init__.py +0 -0
  715. /agno/{cli/ws → db/migrations/versions}/__init__.py +0 -0
  716. /agno/{document/chunking/__init__.py → db/schemas/metrics.py} +0 -0
  717. /agno/{document/reader/s3 → integrations}/__init__.py +0 -0
  718. /agno/{file/local → knowledge/chunking}/__init__.py +0 -0
  719. /agno/{infra → knowledge/remote_content}/__init__.py +0 -0
  720. /agno/{knowledge/s3 → tools/models}/__init__.py +0 -0
  721. /agno/{reranker → utils/models}/__init__.py +0 -0
  722. /agno/{storage → utils/print_response}/__init__.py +0 -0
  723. {agno-0.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
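Note on the renamed modules above: entries written as `agno/{old → new}/...` moved between packages, so code upgrading from 0.1.2 must update its import paths. A minimal sketch of the corresponding import change, using module paths taken from the file list (the imported class names are illustrative assumptions, not verified against either version):

# agno 0.1.2 (old layout, per the left side of the renames)
# from agno.document.chunking.fixed import FixedSizeChunking
# from agno.embedder.base import Embedder

# agno 2.3.13 (new layout, per the right side of the renames)
from agno.knowledge.chunking.fixed import FixedSizeChunking
from agno.knowledge.embedder.base import Embedder

The diff below shows the largest single-file rewrite, agno/models/google/gemini.py (truncated).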
agno/models/google/gemini.py
@@ -1,827 +1,1882 @@
+ import asyncio
+ import base64
  import json
  import time
- import traceback
- from dataclasses import dataclass, field
+ from collections.abc import AsyncIterator
+ from dataclasses import dataclass
  from os import getenv
  from pathlib import Path
- from typing import Any, Callable, Dict, Iterator, List, Optional, Union
-
- from agno.media import Audio, Image, Video
- from agno.models.base import Metrics, Model
- from agno.models.message import Message
- from agno.models.response import ModelResponse, ModelResponseEvent
- from agno.tools import Function, Toolkit
- from agno.utils.log import logger
+ from typing import Any, Dict, Iterator, List, Optional, Type, Union
+ from uuid import uuid4
+
+ from pydantic import BaseModel
+
+ from agno.exceptions import ModelProviderError
+ from agno.media import Audio, File, Image, Video
+ from agno.models.base import Model, RetryableModelProviderError
+ from agno.models.google.utils import MALFORMED_FUNCTION_CALL_GUIDANCE, GeminiFinishReason
+ from agno.models.message import Citations, Message, UrlCitation
+ from agno.models.metrics import Metrics
+ from agno.models.response import ModelResponse
+ from agno.run.agent import RunOutput
+ from agno.tools.function import Function
+ from agno.utils.gemini import format_function_definitions, format_image_for_message, prepare_response_schema
+ from agno.utils.log import log_debug, log_error, log_info, log_warning
+ from agno.utils.tokens import count_schema_tokens, count_text_tokens, count_tool_tokens

  try:
-     import google.generativeai as genai
-     from google.ai.generativelanguage_v1beta.types import (
-         FunctionCall as GeminiFunctionCall,
-     )
-     from google.ai.generativelanguage_v1beta.types import (
-         FunctionResponse as GeminiFunctionResponse,
-     )
-     from google.ai.generativelanguage_v1beta.types import (
+     from google import genai
+     from google.genai import Client as GeminiClient
+     from google.genai.errors import ClientError, ServerError
+     from google.genai.types import (
+         Content,
+         DynamicRetrievalConfig,
+         FileSearch,
+         FunctionCallingConfigMode,
+         GenerateContentConfig,
+         GenerateContentResponse,
+         GenerateContentResponseUsageMetadata,
+         GoogleSearch,
+         GoogleSearchRetrieval,
+         GroundingMetadata,
+         Operation,
          Part,
+         Retrieval,
+         ThinkingConfig,
+         Tool,
+         UrlContext,
+         VertexAISearch,
+     )
+     from google.genai.types import (
+         File as GeminiFile,
      )
-     from google.ai.generativelanguage_v1beta.types.generative_service import (
-         GenerateContentResponse as ResultGenerateContentResponse,
+ except ImportError:
+     raise ImportError(
+         "`google-genai` not installed or not at the latest version. Please install it using `pip install -U google-genai`"
      )
-     from google.api_core.exceptions import PermissionDenied
-     from google.generativeai import GenerativeModel
-     from google.generativeai.types import file_types
-     from google.generativeai.types.content_types import FunctionDeclaration
-     from google.generativeai.types.content_types import Tool as GeminiTool
-     from google.generativeai.types.generation_types import GenerateContentResponse
-     from google.protobuf.struct_pb2 import Struct
- except (ModuleNotFoundError, ImportError):
-     raise ImportError("`google-generativeai` not installed. Please install it using `pip install google-generativeai`")


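For reference, the block above swaps the deprecated `google-generativeai` SDK for the unified `google-genai` SDK. A minimal sketch of the new client bootstrap this module builds on (assuming a valid `GOOGLE_API_KEY`; `genai.Client` and `client.models.generate_content` are the same entry points used later in this diff):

from google import genai

# One Client now serves both the Gemini API and Vertex AI.
client = genai.Client(api_key="...")
# Vertex AI variant: genai.Client(vertexai=True, project="my-gcp-project", location="us-central1")
response = client.models.generate_content(model="gemini-2.0-flash-001", contents="Hello")
print(response.text)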
  @dataclass
- class MessageData:
-     response_content: str = ""
-     response_block: Optional[GenerateContentResponse] = None
-     response_role: Optional[str] = None
-     response_parts: Optional[List] = None
-     valid_response_parts: Optional[List] = None
-     response_tool_calls: List[Dict[str, Any]] = field(default_factory=list)
-     response_usage: Optional[ResultGenerateContentResponse] = None
-
-
- def _format_image_for_message(image: Image) -> Optional[Dict[str, Any]]:
-     # Case 1: Image is a URL
-     # Download the image from the URL and add it as base64 encoded data
-     if image.url is not None and image.image_url_content is not None:
-         try:
-             import base64
-
-             content_bytes = image.image_url_content
-             image_data = {
-                 "mime_type": "image/jpeg",
-                 "data": base64.b64encode(content_bytes).decode("utf-8"),
-             }
-             return image_data
-         except Exception as e:
-             logger.warning(f"Failed to download image from {image}: {e}")
-             return None
-     # Case 2: Image is a local path
-     # Open the image file and add it as base64 encoded data
-     elif image.filepath is not None:
-         try:
-             import PIL.Image
-         except ImportError:
-             logger.error("`PIL.Image not installed. Please install it using 'pip install pillow'`")
-             raise
+ class Gemini(Model):
+     """
+     Gemini model class for Google's Generative AI models.

-         try:
-             image_path = Path(image.filepath)
-             if image_path.exists() and image_path.is_file():
-                 image_data = PIL.Image.open(image_path) # type: ignore
-             else:
-                 logger.error(f"Image file {image_path} does not exist.")
-                 raise
-             return image_data # type: ignore
-         except Exception as e:
-             logger.warning(f"Failed to load image from {image.filepath}: {e}")
-             return None
+     Vertex AI:
+     - You will need Google Cloud credentials to use the Vertex AI API. Run `gcloud auth application-default login` to set credentials.
+     - Set `vertexai` to `True` to use the Vertex AI API.
+     - Set your `project_id` (or set `GOOGLE_CLOUD_PROJECT` environment variable) and `location` (optional).
+     - Set `http_options` (optional) to configure the HTTP options.

-     # Case 3: Image is a bytes object
-     # Add it as base64 encoded data
-     elif image.content is not None and isinstance(image.content, bytes):
-         import base64
+     Based on https://googleapis.github.io/python-genai/
+     """

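Following the docstring above, a minimal sketch of constructing the model for both backends (the `agno.models.google` import path follows the package layout in the file list; the field names are the class attributes declared just below):

from agno.models.google import Gemini

# Gemini API: picks up GOOGLE_API_KEY if api_key is not passed explicitly.
model = Gemini(id="gemini-2.0-flash-001")

# Vertex AI: uses Google Cloud application-default credentials.
vertex_model = Gemini(
    id="gemini-2.0-flash-001",
    vertexai=True,
    project_id="my-gcp-project",  # placeholder project
    location="us-central1",
)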
-         image_data = {"mime_type": "image/jpeg", "data": base64.b64encode(image.content).decode("utf-8")}
-         return image_data
-     else:
-         logger.warning(f"Unknown image type: {type(image)}")
-         return None
+     id: str = "gemini-2.0-flash-001"
+     name: str = "Gemini"
+     provider: str = "Google"

+     supports_native_structured_outputs: bool = True

- def _format_audio_for_message(audio: Audio) -> Optional[Union[Dict[str, Any], file_types.File]]:
-     if audio.content and isinstance(audio.content, bytes):
-         audio_content = {"mime_type": "audio/mp3", "data": audio.content}
-         return audio_content
+     # Request parameters
+     function_declarations: Optional[List[Any]] = None
+     generation_config: Optional[Any] = None
+     safety_settings: Optional[List[Any]] = None
+     generative_model_kwargs: Optional[Dict[str, Any]] = None
+     search: bool = False
+     grounding: bool = False
+     grounding_dynamic_threshold: Optional[float] = None
+     url_context: bool = False
+     vertexai_search: bool = False
+     vertexai_search_datastore: Optional[str] = None
+
+     # Gemini File Search capabilities
+     file_search_store_names: Optional[List[str]] = None
+     file_search_metadata_filter: Optional[str] = None
+
+     temperature: Optional[float] = None
+     top_p: Optional[float] = None
+     top_k: Optional[int] = None
+     max_output_tokens: Optional[int] = None
+     stop_sequences: Optional[list[str]] = None
+     logprobs: Optional[bool] = None
+     presence_penalty: Optional[float] = None
+     frequency_penalty: Optional[float] = None
+     seed: Optional[int] = None
+     response_modalities: Optional[list[str]] = None # "TEXT", "IMAGE", and/or "AUDIO"
+     speech_config: Optional[dict[str, Any]] = None
+     cached_content: Optional[Any] = None
+     thinking_budget: Optional[int] = None # Thinking budget for Gemini 2.5 models
+     include_thoughts: Optional[bool] = None # Include thought summaries in response
+     thinking_level: Optional[str] = None # "low", "high"
+     request_params: Optional[Dict[str, Any]] = None

-     elif audio.filepath is not None:
-         audio_path = audio.filepath if isinstance(audio.filepath, Path) else Path(audio.filepath)
+     # Client parameters
+     api_key: Optional[str] = None
+     vertexai: bool = False
+     project_id: Optional[str] = None
+     location: Optional[str] = None
+     client_params: Optional[Dict[str, Any]] = None

-         remote_file_name = f"files/{audio_path.stem.lower()}"
-         # Check if video is already uploaded
-         existing_audio_upload = None
-         try:
-             existing_audio_upload = genai.get_file(remote_file_name)
-         except PermissionDenied:
-             pass
+     # Gemini client
+     client: Optional[GeminiClient] = None

-         if existing_audio_upload:
-             audio_file = existing_audio_upload
-         else:
-             # Upload the video file to the Gemini API
-             if audio_path.exists() and audio_path.is_file():
-                 audio_file = genai.upload_file(path=audio_path, name=remote_file_name, display_name=audio_path.stem)
-             else:
-                 logger.error(f"Audio file {audio_path} does not exist.")
-                 raise Exception(f"Audio file {audio_path} does not exist.")
-
-         # Check whether the file is ready to be used.
-         while audio_file.state.name == "PROCESSING":
-             time.sleep(2)
-             audio_file = genai.get_file(audio_file.name)
-
-         if audio_file.state.name == "FAILED":
-             raise ValueError(audio_file.state.name)
-         return audio_file
-     else:
-         logger.warning(f"Unknown audio type: {type(audio.content)}")
-         return None
+     # The role to map the Gemini response
+     role_map = {
+         "model": "assistant",
+     }

+     # The role to map the Message
+     reverse_role_map = {
+         "assistant": "model",
+         "tool": "user",
+     }

- def _format_video_for_message(video: Video) -> Optional[file_types.File]:
-     # If video is stored locally
-     if video.filepath is not None:
-         video_path = video.filepath if isinstance(video.filepath, Path) else Path(video.filepath)
+     def get_client(self) -> GeminiClient:
+         """
+         Returns an instance of the GeminiClient client.

-         remote_file_name = f"files/{video_path.stem.lower()}"
-         # Check if video is already uploaded
-         existing_video_upload = None
-         try:
-             existing_video_upload = genai.get_file(remote_file_name)
-         except PermissionDenied:
-             pass
+         Returns:
+             GeminiClient: The GeminiClient client.
+         """
+         if self.client:
+             return self.client
+         client_params: Dict[str, Any] = {}
+         vertexai = self.vertexai or getenv("GOOGLE_GENAI_USE_VERTEXAI", "false").lower() == "true"

-         if existing_video_upload:
-             video_file = existing_video_upload
+         if not vertexai:
+             self.api_key = self.api_key or getenv("GOOGLE_API_KEY")
+             if not self.api_key:
+                 log_error("GOOGLE_API_KEY not set. Please set the GOOGLE_API_KEY environment variable.")
+             client_params["api_key"] = self.api_key
          else:
-             # Upload the video file to the Gemini API
-             if video_path.exists() and video_path.is_file():
-                 video_file = genai.upload_file(path=video_path, name=remote_file_name, display_name=video_path.stem)
-             else:
-                 logger.error(f"Video file {video_path} does not exist.")
-                 raise Exception(f"Video file {video_path} does not exist.")
-
-             # Check whether the file is ready to be used.
-             while video_file.state.name == "PROCESSING":
-                 time.sleep(2)
-                 video_file = genai.get_file(video_file.name)
+             log_info("Using Vertex AI API")
+             client_params["vertexai"] = True
+             project_id = self.project_id or getenv("GOOGLE_CLOUD_PROJECT")
+             if not project_id:
+                 log_error("GOOGLE_CLOUD_PROJECT not set. Please set the GOOGLE_CLOUD_PROJECT environment variable.")
+             location = self.location or getenv("GOOGLE_CLOUD_LOCATION")
+             if not location:
+                 log_error("GOOGLE_CLOUD_LOCATION not set. Please set the GOOGLE_CLOUD_LOCATION environment variable.")
+             client_params["project"] = project_id
+             client_params["location"] = location
+
+         client_params = {k: v for k, v in client_params.items() if v is not None}

-         if video_file.state.name == "FAILED":
-             raise ValueError(video_file.state.name)
+         if self.client_params:
+             client_params.update(self.client_params)

-         return video_file
-     else:
-         logger.warning(f"Unknown video type: {type(video.content)}")
-         return None
+         self.client = genai.Client(**client_params)
+         return self.client

170
+ def _append_file_search_tool(self, builtin_tools: List[Tool]) -> None:
171
+ """Append Gemini File Search tool to builtin_tools if file search is enabled.
176
172
 
177
- def _format_messages(messages: List[Message]) -> List[Dict[str, Any]]:
178
- """
179
- Converts a list of Message objects to the Gemini-compatible format.
173
+ Args:
174
+ builtin_tools: List of built-in tools to append to.
175
+ """
176
+ if not self.file_search_store_names:
177
+ return
180
178
 
181
- Args:
182
- messages (List[Message]): The list of messages to convert.
179
+ log_debug("Gemini File Search enabled.")
180
+ file_search_config: Dict[str, Any] = {"file_search_store_names": self.file_search_store_names}
181
+ if self.file_search_metadata_filter:
182
+ file_search_config["metadata_filter"] = self.file_search_metadata_filter
183
+ builtin_tools.append(Tool(file_search=FileSearch(**file_search_config))) # type: ignore[arg-type]
183
184
 
184
- Returns:
185
- List[Dict[str, Any]]: The formatted_messages list of messages.
186
- """
187
- formatted_messages: List = []
188
- for message in messages:
189
- message_for_model: Dict[str, Any] = {}
185
+ def get_request_params(
186
+ self,
187
+ system_message: Optional[str] = None,
188
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
189
+ tools: Optional[List[Dict[str, Any]]] = None,
190
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
191
+ ) -> Dict[str, Any]:
192
+ """
193
+ Returns the request keyword arguments for the GenerativeModel client.
194
+ """
195
+ request_params = {}
196
+ # User provides their own generation config
197
+ if self.generation_config is not None:
198
+ if isinstance(self.generation_config, GenerateContentConfig):
199
+ config = self.generation_config.model_dump()
200
+ else:
201
+ config = self.generation_config
202
+ else:
203
+ config = {}
190
204
 
191
- # Add role to the message for the model
192
- role = (
193
- "model" if message.role in ["system", "developer"] else "user" if message.role == "tool" else message.role
205
+ if self.generative_model_kwargs:
206
+ config.update(self.generative_model_kwargs)
207
+
208
+ config.update(
209
+ {
210
+ "safety_settings": self.safety_settings,
211
+ "temperature": self.temperature,
212
+ "top_p": self.top_p,
213
+ "top_k": self.top_k,
214
+ "max_output_tokens": self.max_output_tokens,
215
+ "stop_sequences": self.stop_sequences,
216
+ "logprobs": self.logprobs,
217
+ "presence_penalty": self.presence_penalty,
218
+ "frequency_penalty": self.frequency_penalty,
219
+ "seed": self.seed,
220
+ "response_modalities": self.response_modalities,
221
+ "speech_config": self.speech_config,
222
+ "cached_content": self.cached_content,
223
+ }
194
224
  )
195
- message_for_model["role"] = role
196
-
197
- # Add content to the message for the model
198
- content = message.content
199
- # Initialize message_parts to be used for Gemini
200
- message_parts: List[Any] = []
201
-
202
- # Function calls
203
- if (not content or message.role == "model") and message.tool_calls:
204
- for tool_call in message.tool_calls:
205
- message_parts.append(
206
- Part(
207
- function_call=GeminiFunctionCall(
208
- name=tool_call["function"]["name"],
209
- args=json.loads(tool_call["function"]["arguments"]),
225
+
226
+ if system_message is not None:
227
+ config["system_instruction"] = system_message # type: ignore
228
+
229
+ if response_format is not None and isinstance(response_format, type) and issubclass(response_format, BaseModel):
230
+ config["response_mime_type"] = "application/json" # type: ignore
231
+ # Convert Pydantic model using our hybrid approach
232
+ # This will handle complex schemas with nested models, dicts, and circular refs
233
+ config["response_schema"] = prepare_response_schema(response_format)
234
+
235
+ # Add thinking configuration
236
+ thinking_config_params: Dict[str, Any] = {}
237
+ if self.thinking_budget is not None:
238
+ thinking_config_params["thinking_budget"] = self.thinking_budget
239
+ if self.include_thoughts is not None:
240
+ thinking_config_params["include_thoughts"] = self.include_thoughts
241
+ if self.thinking_level is not None:
242
+ thinking_config_params["thinking_level"] = self.thinking_level
243
+ if thinking_config_params:
244
+ config["thinking_config"] = ThinkingConfig(**thinking_config_params)
245
+
246
+ # Build tools array based on enabled built-in tools
247
+ builtin_tools = []
248
+
249
+ if self.grounding:
250
+ log_debug(
251
+ "Gemini Grounding enabled. This is a legacy tool. For Gemini 2.0+ Please use enable `search` flag instead."
252
+ )
253
+ builtin_tools.append(
254
+ Tool(
255
+ google_search=GoogleSearchRetrieval(
256
+ dynamic_retrieval_config=DynamicRetrievalConfig(
257
+ dynamic_threshold=self.grounding_dynamic_threshold
210
258
  )
211
259
  )
212
260
  )
213
- # Function results
214
- elif message.role == "tool" and hasattr(message, "combined_function_result"):
215
- s = Struct()
216
- for combined_result in message.combined_function_result:
217
- function_name = combined_result[0]
218
- function_response = combined_result[1]
219
- s.update({"result": [function_response]})
220
- message_parts.append(Part(function_response=GeminiFunctionResponse(name=function_name, response=s)))
221
- # Normal content
222
- else:
223
- if isinstance(content, str):
224
- message_parts = [content]
225
- elif isinstance(content, list):
226
- message_parts = content
261
+ )
262
+
263
+ if self.search:
264
+ log_debug("Gemini Google Search enabled.")
265
+ builtin_tools.append(Tool(google_search=GoogleSearch()))
266
+
267
+ if self.url_context:
268
+ log_debug("Gemini URL context enabled.")
269
+ builtin_tools.append(Tool(url_context=UrlContext()))
270
+
271
+ if self.vertexai_search:
272
+ log_debug("Gemini Vertex AI Search enabled.")
273
+ if not self.vertexai_search_datastore:
274
+ log_error("vertexai_search_datastore must be provided when vertexai_search is enabled.")
275
+ raise ValueError("vertexai_search_datastore must be provided when vertexai_search is enabled.")
276
+ builtin_tools.append(
277
+ Tool(retrieval=Retrieval(vertex_ai_search=VertexAISearch(datastore=self.vertexai_search_datastore)))
278
+ )
279
+
280
+ self._append_file_search_tool(builtin_tools)
281
+
282
+ # Set tools in config
283
+ if builtin_tools:
284
+ if tools:
285
+ log_info("Built-in tools enabled. External tools will be disabled.")
286
+ config["tools"] = builtin_tools
287
+ elif tools:
288
+ config["tools"] = [format_function_definitions(tools)]
289
+
290
+ if tool_choice is not None:
291
+ if isinstance(tool_choice, str) and tool_choice.lower() == "auto":
292
+ config["tool_config"] = {"function_calling_config": {"mode": FunctionCallingConfigMode.AUTO}}
293
+ elif isinstance(tool_choice, str) and tool_choice.lower() == "none":
294
+ config["tool_config"] = {"function_calling_config": {"mode": FunctionCallingConfigMode.NONE}}
295
+ elif isinstance(tool_choice, str) and tool_choice.lower() == "validated":
296
+ config["tool_config"] = {"function_calling_config": {"mode": FunctionCallingConfigMode.VALIDATED}}
297
+ elif isinstance(tool_choice, str) and tool_choice.lower() == "any":
298
+ config["tool_config"] = {"function_calling_config": {"mode": FunctionCallingConfigMode.ANY}}
227
299
  else:
228
- message_parts = [" "]
229
-
230
- if message.role == "user":
231
- # Add images to the message for the model
232
- if message.images is not None:
233
- for image in message.images:
234
- if image.content is not None and isinstance(image.content, file_types.File):
235
- # Google recommends that if using a single image, place the text prompt after the image.
236
- message_parts.insert(0, image.content)
237
- else:
238
- image_content = _format_image_for_message(image)
239
- if image_content:
240
- message_parts.append(image_content)
300
+ config["tool_config"] = {"function_calling_config": {"mode": tool_choice}}
241
301
 
242
- # Add videos to the message for the model
243
- if message.videos is not None:
244
- try:
245
- for video in message.videos:
246
- # Case 1: Video is a file_types.File object (Recommended)
247
- # Add it as a File object
248
- if video.content is not None and isinstance(video.content, file_types.File):
249
- # Google recommends that if using a single image, place the text prompt after the image.
250
- message_parts.insert(0, video.content)
251
- else:
252
- video_file = _format_video_for_message(video)
253
-
254
- # Google recommends that if using a single video, place the text prompt after the video.
255
- if video_file is not None:
256
- message_parts.insert(0, video_file) # type: ignore
257
- except Exception as e:
258
- traceback.print_exc()
259
- logger.warning(f"Failed to load video from {message.videos}: {e}")
260
- continue
261
-
262
- # Add audio to the message for the model
263
- if message.audio is not None:
264
- try:
265
- for audio_snippet in message.audio:
266
- if audio_snippet.content is not None and isinstance(audio_snippet.content, file_types.File):
267
- # Google recommends that if using a single image, place the text prompt after the image.
268
- message_parts.insert(0, audio_snippet.content)
269
- else:
270
- audio_content = _format_audio_for_message(audio_snippet)
271
- if audio_content:
272
- message_parts.append(audio_content)
273
- except Exception as e:
274
- logger.warning(f"Failed to load audio from {message.audio}: {e}")
275
- continue
302
+ config = {k: v for k, v in config.items() if v is not None}
276
303
 
277
- message_for_model["parts"] = message_parts
278
- formatted_messages.append(message_for_model)
279
- return formatted_messages
304
+ if config:
305
+ request_params["config"] = GenerateContentConfig(**config)
280
306
 
307
+ # Filter out None values
308
+ if self.request_params:
309
+ request_params.update(self.request_params)
281
310
 
282
- def _format_functions(params: Dict[str, Any]) -> Dict[str, Any]:
283
- """
284
- Converts function parameters to a Gemini-compatible format.
311
+ if request_params:
312
+ log_debug(f"Calling {self.provider} with request parameters: {request_params}", log_level=2)
313
+ return request_params
314
+
315
+ def count_tokens(
316
+ self,
317
+ messages: List[Message],
318
+ tools: Optional[List[Union[Function, Dict[str, Any]]]] = None,
319
+ output_schema: Optional[Union[Dict, Type[BaseModel]]] = None,
320
+ ) -> int:
321
+ contents, system_instruction = self._format_messages(messages, compress_tool_results=True)
322
+ schema_tokens = count_schema_tokens(output_schema, self.id)
323
+
324
+ if self.vertexai:
325
+ # VertexAI supports full token counting with system_instruction and tools
326
+ config: Dict[str, Any] = {}
327
+ if system_instruction:
328
+ config["system_instruction"] = system_instruction
329
+ if tools:
330
+ formatted_tools = self._format_tools(tools)
331
+ gemini_tools = format_function_definitions(formatted_tools)
332
+ if gemini_tools:
333
+ config["tools"] = [gemini_tools]
334
+
335
+ response = self.get_client().models.count_tokens(
336
+ model=self.id,
337
+ contents=contents,
338
+ config=config if config else None, # type: ignore
339
+ )
340
+ return (response.total_tokens or 0) + schema_tokens
341
+ else:
342
+ # Google AI Studio: Use API for content tokens + local estimation for system/tools
343
+ # The API doesn't support system_instruction or tools in config, so we use a hybrid approach:
344
+ # 1. Get accurate token count for contents (text + multimodal) from API
345
+ # 2. Add estimated tokens for system_instruction and tools locally
346
+ try:
347
+ response = self.get_client().models.count_tokens(
348
+ model=self.id,
349
+ contents=contents,
350
+ )
351
+ total = response.total_tokens or 0
352
+ except Exception as e:
353
+ log_warning(f"Gemini count_tokens API failed: {e}. Falling back to tiktoken-based estimation.")
354
+ return super().count_tokens(messages, tools, output_schema)
285
355
 
286
- Args:
287
- params (Dict[str, Any]): The original parameters dictionary.
356
+ # Add estimated tokens for system instruction (not supported by Google AI Studio API)
357
+ if system_instruction:
358
+ system_text = system_instruction if isinstance(system_instruction, str) else str(system_instruction)
359
+ total += count_text_tokens(system_text, self.id)
288
360
 
289
- Returns:
290
- Dict[str, Any]: The converted parameters dictionary compatible with Gemini.
291
- """
292
- formatted_params = {}
293
-
294
- for key, value in params.items():
295
- if key == "properties" and isinstance(value, dict):
296
- converted_properties = {}
297
- for prop_key, prop_value in value.items():
298
- property_type = prop_value.get("type")
299
- if property_type == "array":
300
- converted_properties[prop_key] = prop_value
301
- continue
302
- if isinstance(property_type, list):
303
- # Create a copy to avoid modifying the original list
304
- non_null_types = [t for t in property_type if t != "null"]
305
- if non_null_types:
306
- # Use the first non-null type
307
- converted_type = non_null_types[0]
308
- if converted_type == "array":
309
- prop_value["type"] = converted_type
310
- converted_properties[prop_key] = prop_value
311
- continue
312
- else:
313
- # Default type if all types are 'null'
314
- converted_type = "string"
315
- else:
316
- converted_type = property_type
361
+ # Add estimated tokens for tools (not supported by Google AI Studio API)
362
+ if tools:
363
+ total += count_tool_tokens(tools, self.id)
364
+
365
+ # Add estimated tokens for response_format/output_schema
366
+ total += schema_tokens
317
367
 
318
- converted_properties[prop_key] = {"type": converted_type}
319
- formatted_params[key] = converted_properties
368
+ return total
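A hypothetical call into the hybrid counter; the agno import paths and the `Message` constructor shown here are assumptions based on this package's layout, not confirmed by the diff:

```python
# Hypothetical usage of count_tokens(); import paths are assumptions.
from agno.models.google import Gemini
from agno.models.message import Message

model = Gemini(id="gemini-2.0-flash")
messages = [
    Message(role="system", content="You are a helpful assistant."),
    Message(role="user", content="Summarize the plot of Hamlet."),
]
# On Vertex AI this is one count_tokens API call; on Google AI Studio the
# system message (and any tools) are estimated locally and added on top.
print(model.count_tokens(messages))
```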
369
+
370
+ async def acount_tokens(
371
+ self,
372
+ messages: List[Message],
373
+ tools: Optional[List[Union[Function, Dict[str, Any]]]] = None,
374
+ output_schema: Optional[Union[Dict, Type[BaseModel]]] = None,
375
+ ) -> int:
376
+ contents, system_instruction = self._format_messages(messages, compress_tool_results=True)
377
+ schema_tokens = count_schema_tokens(output_schema, self.id)
378
+
379
+ # VertexAI supports full token counting with system_instruction and tools
380
+ if self.vertexai:
381
+ config: Dict[str, Any] = {}
382
+ if system_instruction:
383
+ config["system_instruction"] = system_instruction
384
+ if tools:
385
+ formatted_tools = self._format_tools(tools)
386
+ gemini_tools = format_function_definitions(formatted_tools)
387
+ if gemini_tools:
388
+ config["tools"] = [gemini_tools]
389
+
390
+ response = await self.get_client().aio.models.count_tokens(
391
+ model=self.id,
392
+ contents=contents,
393
+ config=config if config else None, # type: ignore
394
+ )
395
+ return (response.total_tokens or 0) + schema_tokens
320
396
  else:
321
- formatted_params[key] = value
397
+ # Hybrid approach - Google AI Studio does not support system_instruction or tools in config
398
+ try:
399
+ response = await self.get_client().aio.models.count_tokens(
400
+ model=self.id,
401
+ contents=contents,
402
+ )
403
+ total = response.total_tokens or 0
404
+ except Exception as e:
405
+ log_warning(f"Gemini count_tokens API failed: {e}. Falling back to tiktoken-based estimation.")
406
+ return await super().acount_tokens(messages, tools, output_schema)
322
407
 
323
- return formatted_params
408
+ # Add estimated tokens for system instruction
409
+ if system_instruction:
410
+ system_text = system_instruction if isinstance(system_instruction, str) else str(system_instruction)
411
+ total += count_text_tokens(system_text, self.id)
324
412
 
413
+ # Add estimated tokens for tools
414
+ if tools:
415
+ total += count_tool_tokens(tools, self.id)
325
416
 
326
- def _build_function_declaration(func: Function) -> FunctionDeclaration:
327
- """
328
- Builds the function declaration for Gemini tool calling.
417
+ # Add estimated tokens for response_format/output_schema
418
+ total += schema_tokens
329
419
 
330
- Args:
331
- func: An instance of the function.
420
+ return total
332
421
 
333
- Returns:
334
- FunctionDeclaration: The formatted function declaration.
335
- """
336
- formatted_params = _format_functions(func.parameters)
337
- if "properties" in formatted_params and formatted_params["properties"]:
338
- # We have parameters to add
339
- return FunctionDeclaration(
340
- name=func.name,
341
- description=func.description,
342
- parameters=formatted_params,
422
+ def invoke(
423
+ self,
424
+ messages: List[Message],
425
+ assistant_message: Message,
426
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
427
+ tools: Optional[List[Dict[str, Any]]] = None,
428
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
429
+ run_response: Optional[RunOutput] = None,
430
+ compress_tool_results: bool = False,
431
+ retry_with_guidance: bool = False,
432
+ ) -> ModelResponse:
433
+ """
434
+ Invokes the model with a list of messages and returns the response.
435
+ """
436
+ formatted_messages, system_message = self._format_messages(messages, compress_tool_results)
437
+ request_kwargs = self.get_request_params(
438
+ system_message, response_format=response_format, tools=tools, tool_choice=tool_choice
343
439
  )
344
- else:
345
- return FunctionDeclaration(
346
- name=func.name,
347
- description=func.description,
440
+ try:
441
+ if run_response and run_response.metrics:
442
+ run_response.metrics.set_time_to_first_token()
443
+
444
+ assistant_message.metrics.start_timer()
445
+ provider_response = self.get_client().models.generate_content(
446
+ model=self.id,
447
+ contents=formatted_messages,
448
+ **request_kwargs,
449
+ )
450
+ assistant_message.metrics.stop_timer()
451
+
452
+ model_response = self._parse_provider_response(
453
+ provider_response, response_format=response_format, retry_with_guidance=retry_with_guidance
454
+ )
455
+
456
+ # If we were retrying the invoke with guidance, remove the guidance message
457
+ if retry_with_guidance is True:
458
+ self._remove_temporary_messages(messages)
459
+
460
+ return model_response
461
+
462
+ except (ClientError, ServerError) as e:
463
+ log_error(f"Error from Gemini API: {e}")
464
+ error_message = str(e.response) if hasattr(e, "response") else str(e)
465
+ raise ModelProviderError(
466
+ message=error_message,
467
+ status_code=e.code if hasattr(e, "code") and e.code is not None else 502,
468
+ model_name=self.name,
469
+ model_id=self.id,
470
+ ) from e
471
+ except RetryableModelProviderError:
472
+ raise
473
+ except Exception as e:
474
+ log_error(f"Unknown error from Gemini API: {e}")
475
+ raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
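For context, a hypothetical direct call to `invoke()`; in practice the Agent layer builds these arguments, and the import paths and `Message` fields are assumptions:

```python
# Hypothetical direct invocation; normally the Agent layer supplies these
# arguments. Import paths and Message fields are assumptions.
from agno.models.google import Gemini
from agno.models.message import Message

model = Gemini(id="gemini-2.0-flash")
assistant_message = Message(role="assistant", content="")  # timing metrics land here

response = model.invoke(
    messages=[Message(role="user", content="Write a haiku about the sea.")],
    assistant_message=assistant_message,
)
print(response.content)
```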
476
+
477
+ def invoke_stream(
478
+ self,
479
+ messages: List[Message],
480
+ assistant_message: Message,
481
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
482
+ tools: Optional[List[Dict[str, Any]]] = None,
483
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
484
+ run_response: Optional[RunOutput] = None,
485
+ compress_tool_results: bool = False,
486
+ retry_with_guidance: bool = False,
487
+ ) -> Iterator[ModelResponse]:
488
+ """
489
+ Invokes the model with a list of messages and returns the response as a stream.
490
+ """
491
+ formatted_messages, system_message = self._format_messages(messages, compress_tool_results)
492
+
493
+ request_kwargs = self.get_request_params(
494
+ system_message, response_format=response_format, tools=tools, tool_choice=tool_choice
348
495
  )
496
+ try:
497
+ if run_response and run_response.metrics:
498
+ run_response.metrics.set_time_to_first_token()
499
+
500
+ assistant_message.metrics.start_timer()
501
+ for response in self.get_client().models.generate_content_stream(
502
+ model=self.id,
503
+ contents=formatted_messages,
504
+ **request_kwargs,
505
+ ):
506
+ yield self._parse_provider_response_delta(response, retry_with_guidance=retry_with_guidance)
507
+
508
+ # If we were retrying the invoke with guidance, remove the guidance message
509
+ if retry_with_guidance is True:
510
+ self._remove_temporary_messages(messages)
511
+
512
+ assistant_message.metrics.stop_timer()
513
+
514
+ except (ClientError, ServerError) as e:
515
+ log_error(f"Error from Gemini API: {e}")
516
+ raise ModelProviderError(
517
+ message=str(e.response) if hasattr(e, "response") else str(e),
518
+ status_code=e.code if hasattr(e, "code") and e.code is not None else 502,
519
+ model_name=self.name,
520
+ model_id=self.id,
521
+ ) from e
522
+ except RetryableModelProviderError:
523
+ raise
524
+ except Exception as e:
525
+ log_error(f"Unknown error from Gemini API: {e}")
526
+ raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
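The streaming variant yields `ModelResponse` deltas rather than one final object, so callers can render partial text as it arrives. A hedged usage sketch, with the same import-path assumptions as above:

```python
# Hypothetical streaming usage: invoke_stream() yields ModelResponse deltas.
from agno.models.google import Gemini
from agno.models.message import Message

model = Gemini(id="gemini-2.0-flash")
for delta in model.invoke_stream(
    messages=[Message(role="user", content="Count from 1 to 5.")],
    assistant_message=Message(role="assistant", content=""),
):
    if delta.content:
        print(delta.content, end="", flush=True)
```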
349
527
 
528
+ async def ainvoke(
529
+ self,
530
+ messages: List[Message],
531
+ assistant_message: Message,
532
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
533
+ tools: Optional[List[Dict[str, Any]]] = None,
534
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
535
+ run_response: Optional[RunOutput] = None,
536
+ compress_tool_results: bool = False,
537
+ retry_with_guidance: bool = False,
538
+ ) -> ModelResponse:
539
+ """
540
+ Invokes the model with a list of messages and returns the response.
541
+ """
542
+ formatted_messages, system_message = self._format_messages(messages, compress_tool_results)
350
543
 
351
- @dataclass
352
- class Gemini(Model):
353
- """
354
- Gemini model class for Google's Generative AI models.
544
+ request_kwargs = self.get_request_params(
545
+ system_message, response_format=response_format, tools=tools, tool_choice=tool_choice
546
+ )
355
547
 
356
- Based on https://ai.google.dev/gemini-api/docs/function-calling
357
-
358
- Attributes:
359
- id (str): Model ID. Default is `gemini-2.0-flash-exp`.
360
- name (str): The name of this chat model instance. Default is `Gemini`.
361
- provider (str): Model provider. Default is `Google`.
362
- function_declarations (List[FunctionDeclaration]): List of function declarations.
363
- generation_config (Any): Generation configuration.
364
- safety_settings (Any): Safety settings.
365
- generative_model_kwargs (Dict[str, Any]): Generative model keyword arguments.
366
- api_key (str): API key.
367
- client (GenerativeModel): Generative model client.
368
- """
548
+ try:
549
+ if run_response and run_response.metrics:
550
+ run_response.metrics.set_time_to_first_token()
551
+
552
+ assistant_message.metrics.start_timer()
553
+ provider_response = await self.get_client().aio.models.generate_content(
554
+ model=self.id,
555
+ contents=formatted_messages,
556
+ **request_kwargs,
557
+ )
558
+ assistant_message.metrics.stop_timer()
369
559
 
370
- id: str = "gemini-2.0-flash-exp"
371
- name: str = "Gemini"
372
- provider: str = "Google"
560
+ model_response = self._parse_provider_response(
561
+ provider_response, response_format=response_format, retry_with_guidance=retry_with_guidance
562
+ )
373
563
 
374
- # Request parameters
375
- function_declarations: Optional[List[FunctionDeclaration]] = None
376
- generation_config: Optional[Any] = None
377
- safety_settings: Optional[Any] = None
378
- generative_model_kwargs: Optional[Dict[str, Any]] = None
564
+ # If we were retrying the invoke with guidance, remove the guidance message
565
+ if retry_with_guidance is True:
566
+ self._remove_temporary_messages(messages)
379
567
 
380
- # Client parameters
381
- api_key: Optional[str] = None
382
- client_params: Optional[Dict[str, Any]] = None
568
+ return model_response
383
569
 
384
- # Gemini client
385
- client: Optional[GenerativeModel] = None
570
+ except (ClientError, ServerError) as e:
571
+ log_error(f"Error from Gemini API: {e}")
572
+ raise ModelProviderError(
573
+ message=str(e.response) if hasattr(e, "response") else str(e),
574
+ status_code=e.code if hasattr(e, "code") and e.code is not None else 502,
575
+ model_name=self.name,
576
+ model_id=self.id,
577
+ ) from e
578
+ except RetryableModelProviderError:
579
+ raise
580
+ except Exception as e:
581
+ log_error(f"Unknown error from Gemini API: {e}")
582
+ raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
386
583
 
387
- def get_client(self) -> GenerativeModel:
584
+ async def ainvoke_stream(
585
+ self,
586
+ messages: List[Message],
587
+ assistant_message: Message,
588
+ response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
589
+ tools: Optional[List[Dict[str, Any]]] = None,
590
+ tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
591
+ run_response: Optional[RunOutput] = None,
592
+ compress_tool_results: bool = False,
593
+ retry_with_guidance: bool = False,
594
+ ) -> AsyncIterator[ModelResponse]:
388
595
  """
389
- Returns an instance of the GenerativeModel client.
390
-
391
- Returns:
392
- GenerativeModel: The GenerativeModel client.
596
+ Invokes the model with a list of messages and returns the response as a stream.
393
597
  """
394
- if self.client:
395
- return self.client
598
+ formatted_messages, system_message = self._format_messages(messages, compress_tool_results)
396
599
 
397
- client_params: Dict[str, Any] = {}
600
+ request_kwargs = self.get_request_params(
601
+ system_message, response_format=response_format, tools=tools, tool_choice=tool_choice
602
+ )
398
603
 
399
- self.api_key = self.api_key or getenv("GOOGLE_API_KEY")
400
- if not self.api_key:
401
- logger.error("GOOGLE_API_KEY not set. Please set the GOOGLE_API_KEY environment variable.")
402
- client_params["api_key"] = self.api_key
604
+ try:
605
+ if run_response and run_response.metrics:
606
+ run_response.metrics.set_time_to_first_token()
403
607
 
404
- if self.client_params:
405
- client_params.update(self.client_params)
406
- genai.configure(**client_params)
407
- return genai.GenerativeModel(model_name=self.id, **self.request_kwargs)
608
+ assistant_message.metrics.start_timer()
408
609
 
409
- @property
410
- def request_kwargs(self) -> Dict[str, Any]:
610
+ async_stream = await self.get_client().aio.models.generate_content_stream(
611
+ model=self.id,
612
+ contents=formatted_messages,
613
+ **request_kwargs,
614
+ )
615
+ async for chunk in async_stream:
616
+ yield self._parse_provider_response_delta(chunk, retry_with_guidance=retry_with_guidance)
617
+
618
+ # If we were retrying the invoke with guidance, remove the guidance message
619
+ if retry_with_guidance is True:
620
+ self._remove_temporary_messages(messages)
621
+
622
+ assistant_message.metrics.stop_timer()
623
+
624
+ except (ClientError, ServerError) as e:
625
+ log_error(f"Error from Gemini API: {e}")
626
+ raise ModelProviderError(
627
+ message=str(e.response) if hasattr(e, "response") else str(e),
628
+ status_code=e.code if hasattr(e, "code") and e.code is not None else 502,
629
+ model_name=self.name,
630
+ model_id=self.id,
631
+ ) from e
632
+ except RetryableModelProviderError:
633
+ raise
634
+ except Exception as e:
635
+ log_error(f"Unknown error from Gemini API: {e}")
636
+ raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
637
+
638
+ def _format_messages(self, messages: List[Message], compress_tool_results: bool = False):
411
639
  """
412
- Returns the request keyword arguments for the GenerativeModel client.
640
+ Converts a list of Message objects to the Gemini-compatible format.
413
641
 
414
- Returns:
415
- Dict[str, Any]: The request keyword arguments.
642
+ Args:
643
+ messages (List[Message]): The list of messages to convert.
644
+ compress_tool_results: Whether to compress tool results.
416
645
  """
417
- request_params: Dict[str, Any] = {}
418
- if self.generation_config:
419
- request_params["generation_config"] = self.generation_config
420
- if self.safety_settings:
421
- request_params["safety_settings"] = self.safety_settings
422
- if self.generative_model_kwargs:
423
- request_params.update(self.generative_model_kwargs)
424
- if self.function_declarations:
425
- request_params["tools"] = [GeminiTool(function_declarations=self.function_declarations)]
426
- return request_params
646
+ formatted_messages: List = []
647
+ file_content: Optional[Union[GeminiFile, Part]] = None
648
+ system_message = None
649
+
650
+ for message in messages:
651
+ role = message.role
652
+ if role in ["system", "developer"]:
653
+ system_message = message.content
654
+ continue
655
+
656
+ # Set the role for the message according to Gemini's requirements
657
+ role = self.reverse_role_map.get(role, role)
658
+
659
+ # Add content to the message for the model
660
+ content = message.get_content(use_compressed_content=compress_tool_results)
661
+
662
+ # Initialize message_parts to be used for Gemini
663
+ message_parts: List[Any] = []
664
+
665
+ # Function calls
666
+ if role == "model" and message.tool_calls is not None and len(message.tool_calls) > 0:
667
+ if content is not None:
668
+ content_str = content if isinstance(content, str) else str(content)
669
+ part = Part.from_text(text=content_str)
670
+ if message.provider_data and "thought_signature" in message.provider_data:
671
+ part.thought_signature = base64.b64decode(message.provider_data["thought_signature"])
672
+ message_parts.append(part)
673
+ for tool_call in message.tool_calls:
674
+ part = Part.from_function_call(
675
+ name=tool_call["function"]["name"],
676
+ args=json.loads(tool_call["function"]["arguments"]),
677
+ )
678
+ if "thought_signature" in tool_call:
679
+ part.thought_signature = base64.b64decode(tool_call["thought_signature"])
680
+ message_parts.append(part)
681
+ # Function call results
682
+ elif message.tool_calls is not None and len(message.tool_calls) > 0:
683
+ for idx, tool_call in enumerate(message.tool_calls):
684
+ if isinstance(content, list) and idx < len(content):
685
+ original_from_list = content[idx]
686
+
687
+ if compress_tool_results:
688
+ compressed_from_tool_call = tool_call.get("content")
689
+ tc_content = compressed_from_tool_call if compressed_from_tool_call else original_from_list
690
+ else:
691
+ tc_content = original_from_list
692
+ else:
693
+ tc_content = message.get_content(use_compressed_content=compress_tool_results)
694
+
695
+ if tc_content is None:
696
+ tc_content = tool_call.get("content")
697
+ if tc_content is None:
698
+ tc_content = content
699
+
700
+ message_parts.append(
701
+ Part.from_function_response(name=tool_call["tool_name"], response={"result": tc_content})
702
+ )
703
+ # Regular text content
704
+ else:
705
+ if isinstance(content, str):
706
+ part = Part.from_text(text=content)
707
+ if message.provider_data and "thought_signature" in message.provider_data:
708
+ part.thought_signature = base64.b64decode(message.provider_data["thought_signature"])
709
+ message_parts = [part]
710
+
711
+ if role == "user" and message.tool_calls is None:
712
+ # Add images to the message for the model
713
+ if message.images is not None:
714
+ for image in message.images:
715
+ if image.content is not None and isinstance(image.content, GeminiFile):
716
+ # Google recommends that if using a single image, place the text prompt after the image.
717
+ message_parts.insert(0, image.content)
718
+ else:
719
+ image_content = format_image_for_message(image)
720
+ if image_content:
721
+ message_parts.append(Part.from_bytes(**image_content))
722
+
723
+ # Add videos to the message for the model
724
+ if message.videos is not None:
725
+ try:
726
+ for video in message.videos:
727
+ # Case 1: Video is a file_types.File object (Recommended)
728
+ # Add it as a File object
729
+ if video.content is not None and isinstance(video.content, GeminiFile):
730
+ # Google recommends that if using a single video, place the text prompt after the video.
731
+ if video.content.uri and video.content.mime_type:
732
+ message_parts.insert(
733
+ 0, Part.from_uri(file_uri=video.content.uri, mime_type=video.content.mime_type)
734
+ )
735
+ else:
736
+ video_file = self._format_video_for_message(video)
737
+ if video_file is not None:
738
+ message_parts.insert(0, video_file)
739
+ except Exception as e:
740
+ log_warning(f"Failed to load video from {message.videos}: {e}")
741
+ continue
742
+
743
+ # Add audio to the message for the model
744
+ if message.audio is not None:
745
+ try:
746
+ for audio_snippet in message.audio:
747
+ if audio_snippet.content is not None and isinstance(audio_snippet.content, GeminiFile):
748
+ # Google recommends that if using a single audio file, place the text prompt after the audio file.
749
+ if audio_snippet.content.uri and audio_snippet.content.mime_type:
750
+ message_parts.insert(
751
+ 0,
752
+ Part.from_uri(
753
+ file_uri=audio_snippet.content.uri,
754
+ mime_type=audio_snippet.content.mime_type,
755
+ ),
756
+ )
757
+ else:
758
+ audio_content = self._format_audio_for_message(audio_snippet)
759
+ if audio_content:
760
+ message_parts.append(audio_content)
761
+ except Exception as e:
762
+ log_warning(f"Failed to load audio from {message.audio}: {e}")
763
+ continue
764
+
765
+ # Add files to the message for the model
766
+ if message.files is not None:
767
+ for file in message.files:
768
+ file_content = self._format_file_for_message(file)
769
+ if isinstance(file_content, Part):
770
+ formatted_messages.append(file_content)
771
+
772
+ final_message = Content(role=role, parts=message_parts)
773
+ formatted_messages.append(final_message)
774
+
775
+ if isinstance(file_content, GeminiFile):
776
+ formatted_messages.insert(0, file_content)
777
+
778
+ return formatted_messages, system_message
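Roughly, the conversion pulls the system message out for separate delivery and turns everything else into google-genai `Content` objects. A sketch of the mapping, assuming `reverse_role_map` sends `assistant` to `model`:

```python
# Sketch of the conversion above, using google-genai types directly.
from google.genai.types import Content, Part

# Input (agno Messages, shown as dicts for brevity):
#   {"role": "system", "content": "Be brief."}    -> returned separately
#   {"role": "user", "content": "Hi"}             -> Content(role="user", ...)
#   {"role": "assistant", "content": "Hello!"}    -> Content(role="model", ...)
formatted = [
    Content(role="user", parts=[Part.from_text(text="Hi")]),
    Content(role="model", parts=[Part.from_text(text="Hello!")]),
]
system_instruction = "Be brief."
```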
779
+
780
+ def _format_audio_for_message(self, audio: Audio) -> Optional[Union[Part, GeminiFile]]:
781
+ # Case 1: Audio is a bytes object
782
+ if audio.content and isinstance(audio.content, bytes):
783
+ mime_type = f"audio/{audio.format}" if audio.format else "audio/mp3"
784
+ return Part.from_bytes(mime_type=mime_type, data=audio.content)
785
+
786
+ # Case 2: Audio is a URL
787
+ elif audio.url is not None:
788
+ audio_bytes = audio.get_content_bytes() # type: ignore
789
+ if audio_bytes is not None:
790
+ mime_type = f"audio/{audio.format}" if audio.format else "audio/mp3"
791
+ return Part.from_bytes(mime_type=mime_type, data=audio_bytes)
792
+ else:
793
+ log_warning(f"Failed to download audio from {audio}")
794
+ return None
795
+
796
+ # Case 3: Audio is a local file path
797
+ elif audio.filepath is not None:
798
+ audio_path = audio.filepath if isinstance(audio.filepath, Path) else Path(audio.filepath)
799
+
800
+ remote_file_name = f"files/{audio_path.stem.lower().replace('_', '')}"
801
+ # Check if the audio file is already uploaded
802
+ existing_audio_upload = None
803
+ try:
804
+ if remote_file_name:
805
+ existing_audio_upload = self.get_client().files.get(name=remote_file_name)
806
+ except Exception as e:
807
+ log_warning(f"Error getting file {remote_file_name}: {e}")
808
+
809
+ if existing_audio_upload and existing_audio_upload.state and existing_audio_upload.state.name == "SUCCESS":
810
+ audio_file = existing_audio_upload
811
+ else:
812
+ # Upload the audio file to the Gemini API
813
+ if audio_path.exists() and audio_path.is_file():
814
+ audio_file = self.get_client().files.upload(
815
+ file=audio_path,
816
+ config=dict(
817
+ name=remote_file_name,
818
+ display_name=audio_path.stem,
819
+ mime_type=f"audio/{audio.format}" if audio.format else "audio/mp3",
820
+ ),
821
+ )
822
+ else:
823
+ log_error(f"Audio file {audio_path} does not exist.")
824
+ return None
825
+
826
+ # Check whether the file is ready to be used.
827
+ while audio_file.state and audio_file.state.name == "PROCESSING":
828
+ if audio_file.name:
829
+ audio_file = self.get_client().files.get(name=audio_file.name)
830
+ time.sleep(2)
831
+
832
+ if audio_file.state and audio_file.state.name == "FAILED":
833
+ log_error(f"Audio file processing failed: {audio_file.state.name}")
834
+ return None
835
+
836
+ if audio_file.uri:
837
+ mime_type = f"audio/{audio.format}" if audio.format else "audio/mp3"
838
+ return Part.from_uri(file_uri=audio_file.uri, mime_type=mime_type)
839
+ return None
840
+ else:
841
+ log_warning(f"Unknown audio type: {type(audio.content)}")
842
+ return None
843
+
844
+ def _format_video_for_message(self, video: Video) -> Optional[Part]:
845
+ # Case 1: Video is a bytes object
846
+ if video.content and isinstance(video.content, bytes):
847
+ mime_type = f"video/{video.format}" if video.format else "video/mp4"
848
+ return Part.from_bytes(mime_type=mime_type, data=video.content)
849
+ # Case 2: Video is stored locally
850
+ elif video.filepath is not None:
851
+ video_path = video.filepath if isinstance(video.filepath, Path) else Path(video.filepath)
852
+
853
+ remote_file_name = f"files/{video_path.stem.lower().replace('_', '')}"
854
+ # Check if video is already uploaded
855
+ existing_video_upload = None
856
+ try:
857
+ if remote_file_name:
858
+ existing_video_upload = self.get_client().files.get(name=remote_file_name)
859
+ except Exception as e:
860
+ log_warning(f"Error getting file {remote_file_name}: {e}")
861
+
862
+ if existing_video_upload and existing_video_upload.state and existing_video_upload.state.name == "SUCCESS":
863
+ video_file = existing_video_upload
864
+ else:
865
+ # Upload the video file to the Gemini API
866
+ if video_path.exists() and video_path.is_file():
867
+ video_file = self.get_client().files.upload(
868
+ file=video_path,
869
+ config=dict(
870
+ name=remote_file_name,
871
+ display_name=video_path.stem,
872
+ mime_type=f"video/{video.format}" if video.format else "video/mp4",
873
+ ),
874
+ )
875
+ else:
876
+ log_error(f"Video file {video_path} does not exist.")
877
+ return None
878
+
879
+ # Check whether the file is ready to be used.
880
+ while video_file.state and video_file.state.name == "PROCESSING":
881
+ if video_file.name:
882
+ video_file = self.get_client().files.get(name=video_file.name)
883
+ time.sleep(2)
884
+
885
+ if video_file.state and video_file.state.name == "FAILED":
886
+ log_error(f"Video file processing failed: {video_file.state.name}")
887
+ return None
888
+
889
+ if video_file.uri:
890
+ mime_type = f"video/{video.format}" if video.format else "video/mp4"
891
+ return Part.from_uri(file_uri=video_file.uri, mime_type=mime_type)
892
+ return None
893
+ # Case 3: Video is a URL
894
+ elif video.url is not None:
895
+ mime_type = f"video/{video.format}" if video.format else "video/webm"
896
+ return Part.from_uri(
897
+ file_uri=video.url,
898
+ mime_type=mime_type,
899
+ )
900
+ else:
901
+ log_warning(f"Unknown video type: {type(video.content)}")
902
+ return None
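Both the audio and video paths above share the same upload-then-poll pattern against the Files API. A standalone sketch of that pattern, assuming the google-genai SDK; the file name is hypothetical and `GOOGLE_API_KEY` is read from the environment:

```python
# The upload-then-poll pattern used for local audio/video above, as a
# standalone sketch against the google-genai Files API.
import time
from google import genai

client = genai.Client()
uploaded = client.files.upload(
    file="clip.mp4",  # hypothetical local file
    config={"display_name": "clip", "mime_type": "video/mp4"},
)
# Block until the service finishes processing the file
while uploaded.state and uploaded.state.name == "PROCESSING":
    time.sleep(2)
    uploaded = client.files.get(name=uploaded.name)
if uploaded.state and uploaded.state.name == "FAILED":
    raise RuntimeError("file processing failed")
print(uploaded.uri, uploaded.mime_type)
```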
903
+
904
+ def _format_file_for_message(self, file: File) -> Optional[Part]:
905
+ # Case 1: File is a bytes object
906
+ if file.content and isinstance(file.content, bytes) and file.mime_type:
907
+ return Part.from_bytes(mime_type=file.mime_type, data=file.content)
908
+
909
+ # Case 2: File is a URL
910
+ elif file.url is not None:
911
+ url_content = file.file_url_content
912
+ if url_content is not None:
913
+ content, mime_type = url_content
914
+ if mime_type and content:
915
+ return Part.from_bytes(mime_type=mime_type, data=content)
916
+ log_warning(f"Failed to download file from {file.url}")
917
+ return None
918
+
919
+ # Case 3: File is a local file path
920
+ elif file.filepath is not None:
921
+ file_path = file.filepath if isinstance(file.filepath, Path) else Path(file.filepath)
922
+ if file_path.exists() and file_path.is_file():
923
+ if file_path.stat().st_size < 20 * 1024 * 1024: # 20MB in bytes
924
+ if file.mime_type:
925
+ file_content = file_path.read_bytes()
926
+ if file_content:
927
+ return Part.from_bytes(mime_type=file.mime_type, data=file_content)
928
+ else:
929
+ import mimetypes
930
+
931
+ mime_type_guess = mimetypes.guess_type(file_path)[0]
932
+ if mime_type_guess is not None:
933
+ file_content = file_path.read_bytes()
934
+ if file_content:
935
+ mime_type_str: str = str(mime_type_guess)
936
+ return Part.from_bytes(mime_type=mime_type_str, data=file_content)
937
+ return None
938
+ else:
939
+ clean_file_name = f"files/{file_path.stem.lower().replace('_', '')}"
940
+ remote_file = None
941
+ try:
942
+ if clean_file_name:
943
+ remote_file = self.get_client().files.get(name=clean_file_name)
944
+ except Exception as e:
945
+ log_warning(f"Error getting file {clean_file_name}: {e}")
946
+
947
+ if (
948
+ remote_file
949
+ and remote_file.state
950
+ and remote_file.state.name == "SUCCESS"
951
+ and remote_file.uri
952
+ and remote_file.mime_type
953
+ ):
954
+ file_uri: str = remote_file.uri
955
+ file_mime_type: str = remote_file.mime_type
956
+ return Part.from_uri(file_uri=file_uri, mime_type=file_mime_type)
957
+ else:
958
+ log_error(f"File {file_path} does not exist.")
959
+ return None
427
960
 
428
- def add_tool(
961
+ # Case 4: File is a Gemini File object
962
+ elif isinstance(file.external, GeminiFile):
963
+ if file.external.uri and file.external.mime_type:
964
+ return Part.from_uri(file_uri=file.external.uri, mime_type=file.external.mime_type)
965
+ return None
966
+ return None
967
+
968
+ def format_function_call_results(
429
969
  self,
430
- tool: Union[Toolkit, Callable, Dict, Function],
431
- strict: bool = False,
432
- agent: Optional[Any] = None,
970
+ messages: List[Message],
971
+ function_call_results: List[Message],
972
+ compress_tool_results: bool = False,
973
+ **kwargs,
433
974
  ) -> None:
434
975
  """
435
- Adds tools to the model.
976
+ Format function call results for Gemini.
977
+
978
+ For combined messages:
979
+ - content: list of ORIGINAL content (for preservation)
980
+ - tool_calls[i]["content"]: compressed content if available (for API sending)
981
+
982
+ This allows the message to be saved with both original and compressed versions.
983
+ """
984
+ combined_original_content: List = []
985
+ combined_function_result: List = []
986
+ tool_names: List[str] = []
987
+
988
+ message_metrics = Metrics()
989
+
990
+ if len(function_call_results) > 0:
991
+ for idx, result in enumerate(function_call_results):
992
+ combined_original_content.append(result.content)
993
+ compressed_content = result.get_content(use_compressed_content=compress_tool_results)
994
+ combined_function_result.append(
995
+ {"tool_call_id": result.tool_call_id, "tool_name": result.tool_name, "content": compressed_content}
996
+ )
997
+ if result.tool_name:
998
+ tool_names.append(result.tool_name)
999
+ message_metrics += result.metrics
1000
+
1001
+ tool_name = ", ".join(tool_names) if tool_names else None
1002
+
1003
+ if combined_original_content:
1004
+ messages.append(
1005
+ Message(
1006
+ role="tool",
1007
+ content=combined_original_content,
1008
+ tool_name=tool_name,
1009
+ tool_calls=combined_function_result,
1010
+ metrics=message_metrics,
1011
+ )
1012
+ )
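The combined message built above carries both versions side by side. An illustrative shape, with placeholder values:

```python
# Illustrative shape of the combined "tool" message built above: content
# preserves the ORIGINAL results, while each tool_calls entry holds the
# possibly-compressed text that is actually sent to the API.
combined_tool_message = {
    "role": "tool",
    "tool_name": "search_web, read_file",
    "content": ["<full search results>", "<full file body>"],
    "tool_calls": [
        {"tool_call_id": "call_1", "tool_name": "search_web", "content": "<compressed results>"},
        {"tool_call_id": "call_2", "tool_name": "read_file", "content": "<full file body>"},
    ],
}
```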
1013
+
1014
+ def _parse_provider_response(self, response: GenerateContentResponse, **kwargs) -> ModelResponse:
1015
+ """
1016
+ Parse the Gemini response into a ModelResponse.
436
1017
 
437
1018
  Args:
438
- tool: The tool to add. Can be a Tool, Toolkit, Callable, dict, or Function.
439
- strict: If True, raise an error if the tool is not a Toolkit or Callable.
440
- agent: The agent to associate with the tool.
441
- """
442
- if self.function_declarations is None:
443
- self.function_declarations = []
444
-
445
- # If the tool is a Tool or Dict, log a warning.
446
- if isinstance(tool, Dict):
447
- logger.warning("Tool of type 'dict' is not yet supported by Gemini.")
448
-
449
- # If the tool is a Callable or Toolkit, add its functions to the Model
450
- elif callable(tool) or isinstance(tool, Toolkit) or isinstance(tool, Function):
451
- if self._functions is None:
452
- self._functions: Dict[str, Any] = {}
453
-
454
- if isinstance(tool, Toolkit):
455
- # For each function in the toolkit, process entrypoint and add to self.tools
456
- for name, func in tool.functions.items():
457
- # If the function does not exist in self._functions, add to self.tools
458
- if name not in self._functions:
459
- func._agent = agent
460
- func.process_entrypoint()
461
- self._functions[name] = func
462
- function_declaration = _build_function_declaration(func)
463
- self.function_declarations.append(function_declaration)
464
- logger.debug(f"Function {name} from {tool.name} added to model.")
465
-
466
- elif isinstance(tool, Function):
467
- if tool.name not in self._functions:
468
- tool._agent = agent
469
- tool.process_entrypoint()
470
- self._functions[tool.name] = tool
471
-
472
- function_declaration = _build_function_declaration(tool)
473
- self.function_declarations.append(function_declaration)
474
- logger.debug(f"Function {tool.name} added to model.")
475
-
476
- elif callable(tool):
1019
+ response: Raw response from Gemini
1020
+
1021
+ Returns:
1022
+ ModelResponse: Parsed response data
1023
+ """
1024
+ model_response = ModelResponse()
1025
+
1026
+ # Get response message
1027
+ response_message = Content(role="model", parts=[])
1028
+ if response.candidates and len(response.candidates) > 0:
1029
+ candidate = response.candidates[0]
1030
+
1031
+ # Raise if the request failed because of a malformed function call
1032
+ if hasattr(candidate, "finish_reason") and candidate.finish_reason:
1033
+ if candidate.finish_reason == GeminiFinishReason.MALFORMED_FUNCTION_CALL.value:
1034
+ if self.retry_with_guidance:
1035
+ raise RetryableModelProviderError(
1036
+ retry_guidance_message=MALFORMED_FUNCTION_CALL_GUIDANCE,
1037
+ original_error=f"Generation ended with finish reason: {candidate.finish_reason}",
1038
+ )
1039
+
1040
+ if candidate.content:
1041
+ response_message = candidate.content
1042
+
1043
+ # Add role
1044
+ if response_message.role is not None:
1045
+ model_response.role = self.role_map[response_message.role]
1046
+
1047
+ # Add content
1048
+ if response_message.parts is not None and len(response_message.parts) > 0:
1049
+ for part in response_message.parts:
1050
+ # Extract text if present
1051
+ if hasattr(part, "text") and part.text is not None:
1052
+ text_content: Optional[str] = getattr(part, "text")
1053
+ if isinstance(text_content, str):
1054
+ # Check if this is a thought summary
1055
+ if hasattr(part, "thought") and part.thought:
1056
+ # Add all parts as single message
1057
+ if model_response.reasoning_content is None:
1058
+ model_response.reasoning_content = text_content
1059
+ else:
1060
+ model_response.reasoning_content += text_content
1061
+ else:
1062
+ if model_response.content is None:
1063
+ model_response.content = text_content
1064
+ else:
1065
+ model_response.content += text_content
1066
+ else:
1067
+ content_str = str(text_content) if text_content is not None else ""
1068
+ if hasattr(part, "thought") and part.thought:
1069
+ # Add all parts as single message
1070
+ if model_response.reasoning_content is None:
1071
+ model_response.reasoning_content = content_str
1072
+ else:
1073
+ model_response.reasoning_content += content_str
1074
+ else:
1075
+ if model_response.content is None:
1076
+ model_response.content = content_str
1077
+ else:
1078
+ model_response.content += content_str
1079
+
1080
+ # Capture thought signature for text parts
1081
+ if hasattr(part, "thought_signature") and part.thought_signature:
1082
+ if model_response.provider_data is None:
1083
+ model_response.provider_data = {}
1084
+ model_response.provider_data["thought_signature"] = base64.b64encode(
1085
+ part.thought_signature
1086
+ ).decode("ascii")
1087
+
1088
+ if hasattr(part, "inline_data") and part.inline_data is not None:
1089
+ # Handle audio responses (for TTS models)
1090
+ if part.inline_data.mime_type and part.inline_data.mime_type.startswith("audio/"):
1091
+ # Store raw bytes data
1092
+ model_response.audio = Audio(
1093
+ id=str(uuid4()),
1094
+ content=part.inline_data.data,
1095
+ mime_type=part.inline_data.mime_type,
1096
+ )
1097
+ # Image responses
1098
+ else:
1099
+ if model_response.images is None:
1100
+ model_response.images = []
1101
+ model_response.images.append(
1102
+ Image(id=str(uuid4()), content=part.inline_data.data, mime_type=part.inline_data.mime_type)
1103
+ )
1104
+
1105
+ # Extract function call if present
1106
+ if hasattr(part, "function_call") and part.function_call is not None:
1107
+ call_id = part.function_call.id if part.function_call.id else str(uuid4())
1108
+ tool_call = {
1109
+ "id": call_id,
1110
+ "type": "function",
1111
+ "function": {
1112
+ "name": part.function_call.name,
1113
+ "arguments": json.dumps(part.function_call.args)
1114
+ if part.function_call.args is not None
1115
+ else "",
1116
+ },
1117
+ }
1118
+
1119
+ # Capture thought signature for function calls
1120
+ if hasattr(part, "thought_signature") and part.thought_signature:
1121
+ tool_call["thought_signature"] = base64.b64encode(part.thought_signature).decode("ascii")
1122
+
1123
+ model_response.tool_calls.append(tool_call)
1124
+
1125
+ citations = Citations()
1126
+ citations_raw = {}
1127
+ citations_urls = []
1128
+ web_search_queries: List[str] = []
1129
+
1130
+ if response.candidates and response.candidates[0].grounding_metadata is not None:
1131
+ grounding_metadata: GroundingMetadata = response.candidates[0].grounding_metadata
1132
+ citations_raw["grounding_metadata"] = grounding_metadata.model_dump()
1133
+
1134
+ chunks = grounding_metadata.grounding_chunks or []
1135
+ web_search_queries = grounding_metadata.web_search_queries or []
1136
+ for chunk in chunks:
1137
+ if not chunk:
1138
+ continue
1139
+ web = chunk.web
1140
+ if not web:
1141
+ continue
1142
+ uri = web.uri
1143
+ title = web.title
1144
+ if uri:
1145
+ citations_urls.append(UrlCitation(url=uri, title=title))
1146
+
1147
+ # Handle URLs from URL context tool
1148
+ if (
1149
+ response.candidates
1150
+ and hasattr(response.candidates[0], "url_context_metadata")
1151
+ and response.candidates[0].url_context_metadata is not None
1152
+ ):
1153
+ url_context_metadata = response.candidates[0].url_context_metadata
1154
+ citations_raw["url_context_metadata"] = url_context_metadata.model_dump()
1155
+
1156
+ url_metadata_list = url_context_metadata.url_metadata or []
1157
+ for url_meta in url_metadata_list:
1158
+ retrieved_url = url_meta.retrieved_url
1159
+ status = "UNKNOWN"
1160
+ if url_meta.url_retrieval_status:
1161
+ status = url_meta.url_retrieval_status.value
1162
+ if retrieved_url and status == "URL_RETRIEVAL_STATUS_SUCCESS":
1163
+ # Avoid duplicate URLs
1164
+ existing_urls = [citation.url for citation in citations_urls]
1165
+ if retrieved_url not in existing_urls:
1166
+ citations_urls.append(UrlCitation(url=retrieved_url, title=retrieved_url))
1167
+
1168
+ if citations_raw:
1169
+ citations.raw = citations_raw
1170
+ if citations_urls:
1171
+ citations.urls = citations_urls
1172
+ if web_search_queries:
1173
+ citations.search_queries = web_search_queries
1174
+
1175
+ if citations_raw or citations_urls:
1176
+ model_response.citations = citations
1177
+
1178
+ # Extract usage metadata if present
1179
+ if hasattr(response, "usage_metadata") and response.usage_metadata is not None:
1180
+ model_response.response_usage = self._get_metrics(response.usage_metadata)
1181
+
1182
+ # If we have no content but have a role, add a default empty content
1183
+ if model_response.role and model_response.content is None and not model_response.tool_calls:
1184
+ model_response.content = ""
1185
+
1186
+ return model_response
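The `thought_signature` handling above is a plain bytes-to-base64 round trip, so the opaque signature can live in JSON-serializable `provider_data` and be restored when the message is replayed:

```python
# bytes <-> base64 round trip used for thought signatures above.
import base64

raw_signature = b"\x01\x02\xfe"                            # as from part.thought_signature
stored = base64.b64encode(raw_signature).decode("ascii")   # JSON-safe form
assert base64.b64decode(stored) == raw_signature
```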
1187
+
1188
+ def _parse_provider_response_delta(self, response_delta: GenerateContentResponse, **kwargs) -> ModelResponse:
1189
+ model_response = ModelResponse()
1190
+
1191
+ if response_delta.candidates and len(response_delta.candidates) > 0:
1192
+ candidate = response_delta.candidates[0]
1193
+ candidate_content = candidate.content
1194
+
1195
+ # Raise if the request failed because of a malformed function call
1196
+ if hasattr(candidate, "finish_reason") and candidate.finish_reason:
1197
+ if candidate.finish_reason == GeminiFinishReason.MALFORMED_FUNCTION_CALL.value:
1198
+ if self.retry_with_guidance:
1199
+ raise RetryableModelProviderError(
1200
+ retry_guidance_message=MALFORMED_FUNCTION_CALL_GUIDANCE,
1201
+ original_error=f"Generation ended with finish reason: {candidate.finish_reason}",
1202
+ )
1203
+
1204
+ response_message: Content = Content(role="model", parts=[])
1205
+ if candidate_content is not None:
1206
+ response_message = candidate_content
1207
+
1208
+ # Add role
1209
+ if response_message.role is not None:
1210
+ model_response.role = self.role_map[response_message.role]
1211
+
1212
+ if response_message.parts is not None:
1213
+ for part in response_message.parts:
1214
+ # Extract text if present
1215
+ if hasattr(part, "text") and part.text is not None:
1216
+ text_content = str(part.text) if part.text is not None else ""
1217
+ # Check if this is a thought summary
1218
+ if hasattr(part, "thought") and part.thought:
1219
+ if model_response.reasoning_content is None:
1220
+ model_response.reasoning_content = text_content
1221
+ else:
1222
+ model_response.reasoning_content += text_content
1223
+ else:
1224
+ if model_response.content is None:
1225
+ model_response.content = text_content
1226
+ else:
1227
+ model_response.content += text_content
1228
+
1229
+ # Capture thought signature for text parts
1230
+ if hasattr(part, "thought_signature") and part.thought_signature:
1231
+ if model_response.provider_data is None:
1232
+ model_response.provider_data = {}
1233
+ model_response.provider_data["thought_signature"] = base64.b64encode(
1234
+ part.thought_signature
1235
+ ).decode("ascii")
1236
+
1237
+ if hasattr(part, "inline_data") and part.inline_data is not None:
1238
+ # Audio responses
1239
+ if part.inline_data.mime_type and part.inline_data.mime_type.startswith("audio/"):
1240
+ # Store raw bytes audio data
1241
+ model_response.audio = Audio(
1242
+ id=str(uuid4()),
1243
+ content=part.inline_data.data,
1244
+ mime_type=part.inline_data.mime_type,
1245
+ )
1246
+ # Image responses
1247
+ else:
1248
+ if model_response.images is None:
1249
+ model_response.images = []
1250
+ model_response.images.append(
1251
+ Image(
1252
+ id=str(uuid4()), content=part.inline_data.data, mime_type=part.inline_data.mime_type
1253
+ )
1254
+ )
1255
+
1256
+ # Extract function call if present
1257
+ if hasattr(part, "function_call") and part.function_call is not None:
1258
+ call_id = part.function_call.id if part.function_call.id else str(uuid4())
1259
+ tool_call = {
1260
+ "id": call_id,
1261
+ "type": "function",
1262
+ "function": {
1263
+ "name": part.function_call.name,
1264
+ "arguments": json.dumps(part.function_call.args)
1265
+ if part.function_call.args is not None
1266
+ else "",
1267
+ },
1268
+ }
1269
+
1270
+ # Capture thought signature for function calls
1271
+ if hasattr(part, "thought_signature") and part.thought_signature:
1272
+ tool_call["thought_signature"] = base64.b64encode(part.thought_signature).decode("ascii")
1273
+
1274
+ model_response.tool_calls.append(tool_call)
1275
+
1276
+ citations = Citations()
1277
+ citations.raw = {}
1278
+ citations.urls = []
1279
+
1280
+ if (
1281
+ hasattr(response_delta.candidates[0], "grounding_metadata")
1282
+ and response_delta.candidates[0].grounding_metadata is not None
1283
+ ):
1284
+ grounding_metadata = response_delta.candidates[0].grounding_metadata
1285
+ citations.raw["grounding_metadata"] = grounding_metadata.model_dump()
1286
+ citations.search_queries = grounding_metadata.web_search_queries or []
1287
+ # Extract url and title
1288
+ chunks = grounding_metadata.grounding_chunks or []
1289
+ for chunk in chunks:
1290
+ if not chunk:
1291
+ continue
1292
+ web = chunk.web
1293
+ if not web:
1294
+ continue
1295
+ uri = web.uri
1296
+ title = web.title
1297
+ if uri:
1298
+ citations.urls.append(UrlCitation(url=uri, title=title))
1299
+
1300
+ # Handle URLs from URL context tool
1301
+ if (
1302
+ hasattr(response_delta.candidates[0], "url_context_metadata")
1303
+ and response_delta.candidates[0].url_context_metadata is not None
1304
+ ):
1305
+ url_context_metadata = response_delta.candidates[0].url_context_metadata
1306
+
1307
+ citations.raw["url_context_metadata"] = url_context_metadata.model_dump()
1308
+
1309
+ url_metadata_list = url_context_metadata.url_metadata or []
1310
+ for url_meta in url_metadata_list:
1311
+ retrieved_url = url_meta.retrieved_url
1312
+ status = "UNKNOWN"
1313
+ if url_meta.url_retrieval_status:
1314
+ status = url_meta.url_retrieval_status.value
1315
+ if retrieved_url and status == "URL_RETRIEVAL_STATUS_SUCCESS":
1316
+ # Avoid duplicate URLs
1317
+ existing_urls = [citation.url for citation in citations.urls]
1318
+ if retrieved_url not in existing_urls:
1319
+ citations.urls.append(UrlCitation(url=retrieved_url, title=retrieved_url))
1320
+
1321
+ if citations.raw or citations.urls:
1322
+ model_response.citations = citations
1323
+
1324
+ # Extract usage metadata if present
1325
+ if hasattr(response_delta, "usage_metadata") and response_delta.usage_metadata is not None:
1326
+ model_response.response_usage = self._get_metrics(response_delta.usage_metadata)
1327
+
1328
+ return model_response
1329
+
1330
+ def __deepcopy__(self, memo):
1331
+ """
1332
+ Creates a deep copy of the Gemini model instance but sets the client to None.
1333
+
1334
+ This is useful when we need to copy the model configuration without duplicating
1335
+ the client connection.
1336
+
1337
+ This overrides the base class implementation.
1338
+ """
1339
+ from copy import copy, deepcopy
1340
+
1341
+ # Create a new instance without calling __init__
1342
+ cls = self.__class__
1343
+ new_instance = cls.__new__(cls)
1344
+
1345
+ # Update memo with the new instance to avoid circular references
1346
+ memo[id(self)] = new_instance
1347
+
1348
+ # Deep copy all attributes except client and unpickleable attributes
1349
+ for key, value in self.__dict__.items():
1350
+ # Skip client and other unpickleable attributes
1351
+ if key in {"client", "response_format", "_tools", "_functions", "_function_call_stack"}:
1352
+ continue
1353
+
1354
+ # Try deep copy first, fall back to shallow copy, then direct assignment
1355
+ try:
1356
+ setattr(new_instance, key, deepcopy(value, memo))
1357
+ except Exception:
477
1358
  try:
478
- function_name = tool.__name__
479
- if function_name not in self._functions:
480
- func = Function.from_callable(tool)
481
- self._functions[func.name] = func
482
- function_declaration = _build_function_declaration(func)
483
- self.function_declarations.append(function_declaration)
484
- logger.debug(f"Function '{func.name}' added to model.")
485
- except Exception as e:
486
- logger.warning(f"Could not add function {tool}: {e}")
487
-
488
- def invoke(self, messages: List[Message]):
1359
+ setattr(new_instance, key, copy(value))
1360
+ except Exception:
1361
+ setattr(new_instance, key, value)
1362
+
1363
+ # Explicitly set client to None
1364
+ setattr(new_instance, "client", None)
1365
+
1366
+ return new_instance
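A hypothetical use of the custom `__deepcopy__`: the copy keeps the model configuration but drops the live client, which `get_client()` rebuilds lazily. The import path is an assumption:

```python
# Hypothetical deepcopy usage; import path is an assumption.
from copy import deepcopy
from agno.models.google import Gemini

model = Gemini(id="gemini-2.0-flash")
model.get_client()             # instantiate a client on the original
clone = deepcopy(model)
assert clone.client is None    # the client is never copied
assert clone.id == model.id    # the configuration is
```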
1367
+
1368
+ def _get_metrics(self, response_usage: GenerateContentResponseUsageMetadata) -> Metrics:
489
1369
  """
490
- Invokes the model with a list of messages and returns the response.
1370
+ Parse the given Google Gemini usage into an Agno Metrics object.
491
1371
 
492
1372
  Args:
493
- messages (List[Message]): The list of messages to send to the model.
1373
+ response_usage: Usage data from Google Gemini
494
1374
 
495
1375
  Returns:
496
- GenerateContentResponse: The response from the model.
1376
+ Metrics: Parsed metrics data
497
1377
  """
498
- return self.get_client().generate_content(contents=_format_messages(messages))
1378
+ metrics = Metrics()
1379
+
1380
+ metrics.input_tokens = response_usage.prompt_token_count or 0
1381
+ metrics.output_tokens = response_usage.candidates_token_count or 0
1382
+ if response_usage.thoughts_token_count is not None:
1383
+ metrics.output_tokens += response_usage.thoughts_token_count or 0
1384
+ metrics.total_tokens = metrics.input_tokens + metrics.output_tokens
499
1385
 
500
- def invoke_stream(self, messages: List[Message]):
1386
+ metrics.cache_read_tokens = response_usage.cached_content_token_count or 0
1387
+
1388
+ if response_usage.traffic_type is not None:
1389
+ metrics.provider_metrics = {"traffic_type": response_usage.traffic_type}
1390
+
1391
+ return metrics
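A worked example of the arithmetic above: thought tokens are folded into `output_tokens` before the total is computed. Values are illustrative:

```python
# Worked example of the metric arithmetic above (illustrative values).
prompt_token_count = 120       # -> input_tokens
candidates_token_count = 80    # -> output_tokens (base)
thoughts_token_count = 40      # added to output_tokens when present

input_tokens = prompt_token_count                              # 120
output_tokens = candidates_token_count + thoughts_token_count  # 120
total_tokens = input_tokens + output_tokens                    # 240
```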
1392
+
1393
+ def create_file_search_store(self, display_name: Optional[str] = None) -> Any:
501
1394
  """
502
- Invokes the model with a list of messages and returns the response as a stream.
1395
+ Create a new File Search store.
503
1396
 
504
1397
  Args:
505
- messages (List[Message]): The list of messages to send to the model.
1398
+ display_name: Optional display name for the store
506
1399
 
507
1400
  Returns:
508
- Iterator[GenerateContentResponse]: The response from the model as a stream.
1401
+ FileSearchStore: The created File Search store object
509
1402
  """
510
- yield from self.get_client().generate_content(
511
- contents=_format_messages(messages),
512
- stream=True,
513
- )
1403
+ config: Dict[str, Any] = {}
1404
+ if display_name:
1405
+ config["display_name"] = display_name
514
1406
 
515
- def update_usage_metrics(
516
- self,
517
- assistant_message: Message,
518
- usage: Optional[ResultGenerateContentResponse] = None,
519
- metrics: Metrics = Metrics(),
520
- ) -> None:
521
- """
522
- Update the usage metrics.
1407
+ try:
1408
+ store = self.get_client().file_search_stores.create(config=config or None) # type: ignore[arg-type]
1409
+ log_info(f"Created File Search store: {store.name}")
1410
+ return store
1411
+ except Exception as e:
1412
+ log_error(f"Error creating File Search store: {e}")
1413
+ raise
523
1414
 
1415
+ async def async_create_file_search_store(self, display_name: Optional[str] = None) -> Any:
1416
+ """
524
1417
  Args:
525
- assistant_message (Message): The assistant message.
526
- usage (ResultGenerateContentResponse): The usage metrics.
527
- stream_usage (Optional[StreamUsageData]): The stream usage metrics.
1418
+ display_name: Optional display name for the store
1419
+
1420
+ Returns:
1421
+ FileSearchStore: The created File Search store object
528
1422
  """
529
- if usage:
530
- metrics.input_tokens = usage.prompt_token_count or 0
531
- metrics.output_tokens = usage.candidates_token_count or 0
532
- metrics.total_tokens = usage.total_token_count or 0
1423
+ config: Dict[str, Any] = {}
1424
+ if display_name:
1425
+ config["display_name"] = display_name
533
1426
 
534
- self._update_model_metrics(metrics_for_run=metrics)
535
- self._update_assistant_message_metrics(assistant_message=assistant_message, metrics_for_run=metrics)
1427
+ try:
1428
+ store = await self.get_client().aio.file_search_stores.create(config=config or None) # type: ignore[arg-type]
1429
+ log_info(f"Created File Search store: {store.name}")
1430
+ return store
1431
+ except Exception as e:
1432
+ log_error(f"Error creating File Search store: {e}")
1433
+ raise
536
1434
 
537
- def create_assistant_message(self, response: GenerateContentResponse, metrics: Metrics) -> Message:
1435
+ def list_file_search_stores(self, page_size: int = 100) -> List[Any]:
538
1436
  """
539
- Create an assistant message from the response.
1437
+ List all File Search stores.
540
1438
 
541
1439
  Args:
542
- response (GenerateContentResponse): The model response.
543
- response_timer (Timer): The response timer.
1440
+ page_size: Maximum number of stores to return per page
544
1441
 
545
1442
  Returns:
546
- Message: The assistant message.
1443
+ List: List of FileSearchStore objects
547
1444
  """
548
- message_data = MessageData()
1445
+ try:
1446
+ stores = []
1447
+ for store in self.get_client().file_search_stores.list(config={"page_size": page_size}):
1448
+ stores.append(store)
1449
+ log_debug(f"Found {len(stores)} File Search stores")
1450
+ return stores
1451
+ except Exception as e:
1452
+ log_error(f"Error listing File Search stores: {e}")
1453
+ raise
549
1454
 
550
- message_data.response_block = response.candidates[0].content
551
- message_data.response_role = message_data.response_block.role
552
- message_data.response_parts = message_data.response_block.parts
553
- message_data.response_usage = response.usage_metadata
1455
+ async def async_list_file_search_stores(self, page_size: int = 100) -> List[Any]:
1456
+ """
1457
+ Async version of list_file_search_stores.
554
1458
 
555
- if message_data.response_parts is not None:
556
- for part in message_data.response_parts:
557
- part_dict = type(part).to_dict(part)
1459
+ Args:
1460
+ page_size: Maximum number of stores to return per page
558
1461
 
559
- # Extract text if present
560
- if "text" in part_dict:
561
- message_data.response_content = part_dict.get("text")
1462
+ Returns:
1463
+ List: List of FileSearchStore objects
1464
+ """
1465
+ try:
1466
+ stores = []
1467
+ async for store in await self.get_client().aio.file_search_stores.list(config={"page_size": page_size}):
1468
+ stores.append(store)
1469
+ log_debug(f"Found {len(stores)} File Search stores")
1470
+ return stores
1471
+ except Exception as e:
1472
+ log_error(f"Error listing File Search stores: {e}")
1473
+ raise
562
1474
 
563
- # Parse function calls
564
- if "function_call" in part_dict:
565
- message_data.response_tool_calls.append(
566
- {
567
- "type": "function",
568
- "function": {
569
- "name": part_dict.get("function_call").get("name"),
570
- "arguments": json.dumps(part_dict.get("function_call").get("args")),
571
- },
572
- }
573
- )
1475
+ def get_file_search_store(self, name: str) -> Any:
1476
+ """
1477
+ Get a specific File Search store by name.
574
1478
 
575
- # -*- Create assistant message
576
- assistant_message = Message(
577
- role=message_data.response_role or "model",
578
- content=message_data.response_content,
579
- )
1479
+ Args:
1480
+ name: The name of the store (e.g., 'fileSearchStores/my-store-123')
580
1481
 
581
- # -*- Update assistant message if tool calls are present
582
- if len(message_data.response_tool_calls) > 0:
583
- assistant_message.tool_calls = message_data.response_tool_calls
1482
+ Returns:
1483
+ FileSearchStore: The File Search store object
1484
+ """
1485
+ try:
1486
+ store = self.get_client().file_search_stores.get(name=name)
1487
+ log_debug(f"Retrieved File Search store: {name}")
1488
+ return store
1489
+ except Exception as e:
1490
+ log_error(f"Error getting File Search store {name}: {e}")
1491
+ raise
584
1492
 
585
- # -*- Update usage metrics
586
- self.update_usage_metrics(assistant_message, message_data.response_usage, metrics)
587
- return assistant_message
1493
+ async def async_get_file_search_store(self, name: str) -> Any:
1494
+ """
1495
+ Async version of get_file_search_store.
+
+ Args:
1496
+ name: The name of the store
588
1497
 
589
- def format_function_call_results(
590
- self,
591
- function_call_results: List[Message],
592
- messages: List[Message],
593
- ):
1498
+ Returns:
1499
+ FileSearchStore: The File Search store object
1500
+ """
1501
+ try:
1502
+ store = await self.get_client().aio.file_search_stores.get(name=name)
1503
+ log_debug(f"Retrieved File Search store: {name}")
1504
+ return store
1505
+ except Exception as e:
1506
+ log_error(f"Error getting File Search store {name}: {e}")
1507
+ raise
1508
+
1509
+ def delete_file_search_store(self, name: str, force: bool = False) -> None:
594
1510
  """
595
- Processes the results of function calls and appends them to messages.
1511
+ Delete a File Search store.
596
1512
 
597
1513
  Args:
598
- function_call_results (List[Message]): The results from running function calls.
599
- messages (List[Message]): The list of conversation messages.
1514
+ name: The name of the store to delete
1515
+ force: If True, force delete even if store contains documents
600
1516
  """
601
- if function_call_results:
602
- combined_content: List = []
603
- combined_function_result: List = []
1517
+ try:
1518
+ self.get_client().file_search_stores.delete(name=name, config={"force": force})
1519
+ log_info(f"Deleted File Search store: {name}")
1520
+ except Exception as e:
1521
+ log_error(f"Error deleting File Search store {name}: {e}")
1522
+ raise
604
1523
 
605
- for result in function_call_results:
606
- combined_content.append(result.content)
607
- combined_function_result.append((result.tool_name, result.content))
1524
+ async def async_delete_file_search_store(self, name: str, force: bool = False) -> None:
1525
+ """
1526
+ Async version of delete_file_search_store.
608
1527
 
609
- messages.append(
610
- Message(role="tool", content=combined_content, combined_function_details=combined_function_result)
611
- )
1528
+ Args:
1529
+ name: The name of the store to delete
1530
+ force: If True, force delete even if store contains documents
1531
+ """
1532
+ try:
1533
+ await self.get_client().aio.file_search_stores.delete(name=name, config={"force": force})
1534
+ log_info(f"Deleted File Search store: {name}")
1535
+ except Exception as e:
1536
+ log_error(f"Error deleting File Search store {name}: {e}")
1537
+ raise
612
1538
 
-    def handle_tool_calls(self, assistant_message: Message, messages: List[Message], model_response: ModelResponse):
+    def wait_for_operation(self, operation: Operation, poll_interval: int = 5, max_wait: int = 600) -> Operation:
         """
-        Handle tool calls in the assistant message.
+        Wait for a long-running operation to complete.

         Args:
-            assistant_message (Message): The assistant message.
-            messages (List[Message]): A list of messages.
-            model_response (ModelResponse): The model response.
+            operation: The operation object to wait for
+            poll_interval: Seconds to wait between status checks
+            max_wait: Maximum seconds to wait before timing out

         Returns:
-            Optional[ModelResponse]: The updated model response.
-        """
-        if assistant_message.tool_calls:
-            if model_response.tool_calls is None:
-                model_response.tool_calls = []
-            model_response.content = assistant_message.get_content_string() or ""
-            function_calls_to_run = self._get_function_calls_to_run(
-                assistant_message, messages, error_response_role="tool"
-            )
-
-            if self.show_tool_calls:
-                if len(function_calls_to_run) == 1:
-                    model_response.content += f"\n - Running: {function_calls_to_run[0].get_call_str()}\n\n"
-                elif len(function_calls_to_run) > 1:
-                    model_response.content += "\nRunning:"
-                    for _f in function_calls_to_run:
-                        model_response.content += f"\n - {_f.get_call_str()}"
-                    model_response.content += "\n\n"
-
-            function_call_results: List[Message] = []
-            for function_call_response in self.run_function_calls(
-                function_calls=function_calls_to_run,
-                function_call_results=function_call_results,
-            ):
-                if (
-                    function_call_response.event == ModelResponseEvent.tool_call_completed.value
-                    and function_call_response.tool_calls is not None
-                ):
-                    model_response.tool_calls.extend(function_call_response.tool_calls)
+            Operation: The completed operation object

-            self.format_function_call_results(function_call_results, messages)
+        Raises:
+            TimeoutError: If operation doesn't complete within max_wait seconds
+        """
+        elapsed = 0
+        while not operation.done:
+            if elapsed >= max_wait:
+                raise TimeoutError(f"Operation timed out after {max_wait} seconds")
+            time.sleep(poll_interval)
+            elapsed += poll_interval
+            operation = self.get_client().operations.get(operation)
+            log_debug(f"Waiting for operation... ({elapsed}s elapsed)")
+
+        log_info("Operation completed successfully")
+        return operation
+
+    async def async_wait_for_operation(
+        self, operation: Operation, poll_interval: int = 5, max_wait: int = 600
+    ) -> Operation:
+        """
+        Async version of wait_for_operation.

-            return model_response
-        return None
+        Args:
+            operation: The operation object to wait for
+            poll_interval: Seconds to wait between status checks
+            max_wait: Maximum seconds to wait before timing out

-    def response(self, messages: List[Message]) -> ModelResponse:
+        Returns:
+            Operation: The completed operation object
         """
-        Send a generate content request to the model and return the response.
+        elapsed = 0
+        while not operation.done:
+            if elapsed >= max_wait:
+                raise TimeoutError(f"Operation timed out after {max_wait} seconds")
+            await asyncio.sleep(poll_interval)
+            elapsed += poll_interval
+            operation = await self.get_client().aio.operations.get(operation)
+            log_debug(f"Waiting for operation... ({elapsed}s elapsed)")
+
+        log_info("Operation completed successfully")
+        return operation
+
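Both polling helpers share one contract: check `operation.done`, sleep `poll_interval`, refresh the operation via the client, and raise `TimeoutError` once `max_wait` elapses. A sketch of the intended call pattern, using the upload helper introduced just below (file path and store name are placeholders):

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")

# upload_to_file_search_store() returns a long-running Operation immediately...
operation = model.upload_to_file_search_store("docs/guide.pdf", "fileSearchStores/my-store")

# ...and wait_for_operation() blocks until it finishes (or raises TimeoutError).
operation = model.wait_for_operation(operation, poll_interval=2, max_wait=120)
```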
+    def upload_to_file_search_store(
+        self,
+        file_path: Union[str, Path],
+        store_name: str,
+        display_name: Optional[str] = None,
+        chunking_config: Optional[Dict[str, Any]] = None,
+        custom_metadata: Optional[List[Dict[str, Any]]] = None,
+    ) -> Any:
+        """
+        Upload a file directly to a File Search store.

         Args:
-            messages (List[Message]): The list of messages to send to the model.
+            file_path: Path to the file to upload
+            store_name: Name of the File Search store
+            display_name: Optional display name for the file (will be visible in citations)
+            chunking_config: Optional chunking configuration
+                Example: {
+                    "white_space_config": {
+                        "max_tokens_per_chunk": 200,
+                        "max_overlap_tokens": 20
+                    }
+                }
+            custom_metadata: Optional custom metadata as list of dicts
+                Example: [
+                    {"key": "author", "string_value": "John Doe"},
+                    {"key": "year", "numeric_value": 2024}
+                ]

         Returns:
-            ModelResponse: The model response.
+            Operation: Long-running operation object. Use wait_for_operation() to wait for completion.
         """
-        logger.debug("---------- Gemini Response Start ----------")
-        self._log_messages(messages)
-        model_response = ModelResponse()
-        metrics = Metrics()
+        file_path = file_path if isinstance(file_path, Path) else Path(file_path)

-        # -*- Generate response
-        metrics.start_response_timer()
-        response: GenerateContentResponse = self.invoke(messages=messages)
-        metrics.stop_response_timer()
+        if not file_path.exists():
+            raise FileNotFoundError(f"File not found: {file_path}")

-        # -*- Create assistant message
-        assistant_message = self.create_assistant_message(response=response, metrics=metrics)
+        config: Dict[str, Any] = {}
+        if display_name:
+            config["display_name"] = display_name
+        if chunking_config:
+            config["chunking_config"] = chunking_config
+        if custom_metadata:
+            config["custom_metadata"] = custom_metadata

-        # -*- Add assistant message to messages
-        messages.append(assistant_message)
+        try:
+            log_info(f"Uploading file {file_path.name} to File Search store {store_name}")
+            operation = self.get_client().file_search_stores.upload_to_file_search_store(
+                file=file_path,
+                file_search_store_name=store_name,
+                config=config or None,  # type: ignore[arg-type]
+            )
+            log_info(f"Upload initiated for {file_path.name}")
+            return operation
+        except Exception as e:
+            log_error(f"Error uploading file to File Search store: {e}")
+            raise
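Putting the optional `config` knobs together, roughly as the docstring examples above suggest (all values are illustrative):

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")

operation = model.upload_to_file_search_store(
    file_path="docs/guide.pdf",  # placeholder path; must exist or FileNotFoundError is raised
    store_name="fileSearchStores/my-store",
    display_name="Product Guide",  # visible in citations
    chunking_config={
        "white_space_config": {
            "max_tokens_per_chunk": 200,
            "max_overlap_tokens": 20,
        }
    },
    custom_metadata=[
        {"key": "author", "string_value": "John Doe"},
        {"key": "year", "numeric_value": 2024},
    ],
)
model.wait_for_operation(operation)
```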
 
-        # -*- Log response and metrics
-        assistant_message.log()
-        metrics.log()
+    async def async_upload_to_file_search_store(
+        self,
+        file_path: Union[str, Path],
+        store_name: str,
+        display_name: Optional[str] = None,
+        chunking_config: Optional[Dict[str, Any]] = None,
+        custom_metadata: Optional[List[Dict[str, Any]]] = None,
+    ) -> Any:
+        """
+        Async version of upload_to_file_search_store.
+
+        Args:
+            file_path: Path to the file to upload
+            store_name: Name of the File Search store
+            display_name: Optional display name for the file
+            chunking_config: Optional chunking configuration
+            custom_metadata: Optional custom metadata

-        # -*- Update model response with assistant message content
-        if assistant_message.content is not None:
-            model_response.content = assistant_message.get_content_string()
+        Returns:
+            Operation: Long-running operation object
+        """
+        file_path = file_path if isinstance(file_path, Path) else Path(file_path)

-        # -*- Handle tool calls
-        if self.handle_tool_calls(assistant_message, messages, model_response) is not None:
-            response_after_tool_calls = self.response(messages=messages)
-            if response_after_tool_calls.content is not None:
-                if model_response.content is None:
-                    model_response.content = ""
-                model_response.content += response_after_tool_calls.content
+        if not file_path.exists():
+            raise FileNotFoundError(f"File not found: {file_path}")

-        return model_response
+        config: Dict[str, Any] = {}
+        if display_name:
+            config["display_name"] = display_name
+        if chunking_config:
+            config["chunking_config"] = chunking_config
+        if custom_metadata:
+            config["custom_metadata"] = custom_metadata

-        logger.debug("---------- Gemini Response End ----------")
-        return model_response
+        try:
+            log_info(f"Uploading file {file_path.name} to File Search store {store_name}")
+            operation = await self.get_client().aio.file_search_stores.upload_to_file_search_store(
+                file=file_path,
+                file_search_store_name=store_name,
+                config=config or None,  # type: ignore[arg-type]
+            )
+            log_info(f"Upload initiated for {file_path.name}")
+            return operation
+        except Exception as e:
+            log_error(f"Error uploading file to File Search store: {e}")
+            raise
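The async variant pairs naturally with async_wait_for_operation; a sketch (paths and names are placeholders):

```python
import asyncio

from agno.models.google import Gemini  # import path assumed for illustration


async def main() -> None:
    model = Gemini(id="gemini-2.5-flash")
    operation = await model.async_upload_to_file_search_store(
        file_path="docs/guide.pdf",
        store_name="fileSearchStores/my-store",
    )
    await model.async_wait_for_operation(operation)


asyncio.run(main())
```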
 
-    def handle_stream_tool_calls(self, assistant_message: Message, messages: List[Message]):
+    def import_file_to_store(
+        self,
+        file_name: str,
+        store_name: str,
+        chunking_config: Optional[Dict[str, Any]] = None,
+        custom_metadata: Optional[List[Dict[str, Any]]] = None,
+    ) -> Any:
         """
-        Parse and run function calls and append the results to messages.
+        Import an existing uploaded file (via Files API) into a File Search store.

         Args:
-            assistant_message (Message): The assistant message containing tool calls.
-            messages (List[Message]): The list of conversation messages.
+            file_name: Name of the file already uploaded via Files API
+            store_name: Name of the File Search store
+            chunking_config: Optional chunking configuration
+            custom_metadata: Optional custom metadata

-        Yields:
-            Iterator[ModelResponse]: Yields model responses during function execution.
+        Returns:
+            Operation: Long-running operation object. Use wait_for_operation() to wait for completion.
         """
-        if assistant_message.tool_calls:
-            function_calls_to_run = self._get_function_calls_to_run(
-                assistant_message, messages, error_response_role="tool"
-            )
+        config: Dict[str, Any] = {}
+        if chunking_config:
+            config["chunking_config"] = chunking_config
+        if custom_metadata:
+            config["custom_metadata"] = custom_metadata

-            if self.show_tool_calls:
-                if len(function_calls_to_run) == 1:
-                    yield ModelResponse(content=f"\n - Running: {function_calls_to_run[0].get_call_str()}\n\n")
-                elif len(function_calls_to_run) > 1:
-                    yield ModelResponse(content="\nRunning:")
-                    for _f in function_calls_to_run:
-                        yield ModelResponse(content=f"\n - {_f.get_call_str()}")
-                    yield ModelResponse(content="\n\n")
-
-            function_call_results: List[Message] = []
-            for intermediate_model_response in self.run_function_calls(
-                function_calls=function_calls_to_run, function_call_results=function_call_results
-            ):
-                yield intermediate_model_response
+        try:
+            log_info(f"Importing file {file_name} to File Search store {store_name}")
+            operation = self.get_client().file_search_stores.import_file(
+                file_search_store_name=store_name,
+                file_name=file_name,
+                config=config or None,  # type: ignore[arg-type]
+            )
+            log_info(f"Import initiated for {file_name}")
+            return operation
+        except Exception as e:
+            log_error(f"Error importing file to File Search store: {e}")
+            raise
 
-            self.format_function_call_results(function_call_results, messages)
+    async def async_import_file_to_store(
+        self,
+        file_name: str,
+        store_name: str,
+        chunking_config: Optional[Dict[str, Any]] = None,
+        custom_metadata: Optional[List[Dict[str, Any]]] = None,
+    ) -> Any:
+        """
+        Async version of import_file_to_store.
+
+        Args:
+            file_name: Name of the file already uploaded via Files API
+            store_name: Name of the File Search store
+            chunking_config: Optional chunking configuration
+            custom_metadata: Optional custom metadata

-    def response_stream(self, messages: List[Message]) -> Iterator[ModelResponse]:
+        Returns:
+            Operation: Long-running operation object
         """
-        Send a generate content request to the model and return the response as a stream.
+        config: Dict[str, Any] = {}
+        if chunking_config:
+            config["chunking_config"] = chunking_config
+        if custom_metadata:
+            config["custom_metadata"] = custom_metadata
+
+        try:
+            log_info(f"Importing file {file_name} to File Search store {store_name}")
+            operation = await self.get_client().aio.file_search_stores.import_file(
+                file_search_store_name=store_name,
+                file_name=file_name,
+                config=config or None,  # type: ignore[arg-type]
+            )
+            log_info(f"Import initiated for {file_name}")
+            return operation
+        except Exception as e:
+            log_error(f"Error importing file to File Search store: {e}")
+            raise
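Unlike the upload helpers, import_file_to_store assumes the file already exists in the Files API; the sketch below takes that file's resource name as given (the `files/...` name and store name are placeholders, and the resource-name format is an assumption here):

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")

# "files/abc123" must already exist in the Files API; it is a placeholder here.
operation = model.import_file_to_store(
    file_name="files/abc123",
    store_name="fileSearchStores/my-store",
    chunking_config={"white_space_config": {"max_tokens_per_chunk": 200, "max_overlap_tokens": 20}},
)
model.wait_for_operation(operation)
```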
 
+    def list_documents(self, store_name: str, page_size: int = 20) -> List[Any]:
+        """
+        List the documents in a File Search store.
+
         Args:
-            messages (List[Message]): The list of messages to send to the model.
+            store_name: Name of the File Search store
+            page_size: Maximum number of documents to return per page

-        Yields:
-            Iterator[ModelResponse]: The model responses
+        Returns:
+            List: List of document objects
         """
-        logger.debug("---------- Gemini Response Start ----------")
-        self._log_messages(messages)
-        message_data = MessageData()
-        metrics = Metrics()
+        try:
+            documents = []
+            for doc in self.get_client().file_search_stores.documents.list(
+                parent=store_name, config={"page_size": page_size}
+            ):
+                documents.append(doc)
+            log_debug(f"Found {len(documents)} documents in store {store_name}")
+            return documents
+        except Exception as e:
+            log_error(f"Error listing documents in store {store_name}: {e}")
+            raise
 
-        metrics.start_response_timer()
-        for response in self.invoke_stream(messages=messages):
-            message_data.response_block = response.candidates[0].content
-            message_data.response_role = message_data.response_block.role
-            message_data.response_parts = message_data.response_block.parts
-
-            if message_data.response_parts is not None:
-                for part in message_data.response_parts:
-                    part_dict = type(part).to_dict(part)
-
-                    # -*- Yield text if present
-                    if "text" in part_dict:
-                        text = part_dict.get("text")
-                        yield ModelResponse(content=text)
-                        message_data.response_content += text
-                        metrics.output_tokens += 1
-                        if metrics.output_tokens == 1:
-                            metrics.time_to_first_token = metrics.response_timer.elapsed
-            else:
-                message_data.valid_response_parts = message_data.response_parts
+    async def async_list_documents(self, store_name: str, page_size: int = 20) -> List[Any]:
+        """
+        Async version of list_documents.

-            # -*- Skip function calls if there are no parts
-            if not message_data.response_block.parts and message_data.response_parts:
-                continue
-            # -*- Parse function calls
-            if "function_call" in part_dict:
-                message_data.response_tool_calls.append(
-                    {
-                        "type": "function",
-                        "function": {
-                            "name": part_dict.get("function_call").get("name"),
-                            "arguments": json.dumps(part_dict.get("function_call").get("args")),
-                        },
-                    }
-                )
-            message_data.response_usage = response.usage_metadata
-        metrics.stop_response_timer()
+        Args:
+            store_name: Name of the File Search store
+            page_size: Maximum number of documents to return per page

-        # -*- Create assistant message
-        assistant_message = Message(
-            role=message_data.response_role or "model",
-            content=message_data.response_content,
-        )
+        Returns:
+            List: List of document objects
+        """
+        try:
+            documents = []
+            # Await the AsyncPager first, then iterate
+            async for doc in await self.get_client().aio.file_search_stores.documents.list(
+                parent=store_name, config={"page_size": page_size}
+            ):
+                documents.append(doc)
+            log_debug(f"Found {len(documents)} documents in store {store_name}")
+            return documents
+        except Exception as e:
+            log_error(f"Error listing documents in store {store_name}: {e}")
+            raise
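Listing is paginated by the underlying client; both helpers simply drain the pager into a plain list, and the async variant awaits the AsyncPager before iterating, per the inline comment above. A usage sketch (store name is a placeholder):

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")

for doc in model.list_documents("fileSearchStores/my-store", page_size=50):
    # Attribute names follow the document resource schema and are an assumption here.
    print(doc.name)
```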
 
-        # -*- Update assistant message if tool calls are present
-        if len(message_data.response_tool_calls) > 0:
-            assistant_message.tool_calls = message_data.response_tool_calls
+    def get_document(self, document_name: str) -> Any:
+        """
+        Get a specific document by name.

-        # -*- Update usage metrics
-        self.update_usage_metrics(assistant_message, message_data.response_usage, metrics)
+        Args:
+            document_name: Full name of the document
+                (e.g., 'fileSearchStores/store-123/documents/doc-456')

-        # -*- Add assistant message to messages
-        messages.append(assistant_message)
+        Returns:
+            Document object
+        """
+        try:
+            doc = self.get_client().file_search_stores.documents.get(name=document_name)
+            log_debug(f"Retrieved document: {document_name}")
+            return doc
+        except Exception as e:
+            log_error(f"Error getting document {document_name}: {e}")
+            raise

-        # -*- Log response and metrics
-        assistant_message.log()
-        metrics.log()
+    async def async_get_document(self, document_name: str) -> Any:
+        """
+        Async version of get_document.

-        if assistant_message.tool_calls is not None and len(assistant_message.tool_calls) > 0:
-            yield from self.handle_stream_tool_calls(assistant_message, messages)
-            yield from self.response_stream(messages=messages)
+        Args:
+            document_name: Full name of the document

-        logger.debug("---------- Gemini Response End ----------")
+        Returns:
+            Document object
+        """
+        try:
+            doc = await self.get_client().aio.file_search_stores.documents.get(name=document_name)
+            log_debug(f"Retrieved document: {document_name}")
+            return doc
+        except Exception as e:
+            log_error(f"Error getting document {document_name}: {e}")
+            raise
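The document helpers take the full resource name, not a bare ID; a sketch using the placeholder format from the docstring:

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")

doc = model.get_document("fileSearchStores/store-123/documents/doc-456")
```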
 
-    async def ainvoke(self, *args, **kwargs) -> Any:
-        raise NotImplementedError(f"Async not supported on {self.name}.")
+    def delete_document(self, document_name: str) -> None:
+        """
+        Delete a document from a File Search store.

-    async def ainvoke_stream(self, *args, **kwargs) -> Any:
-        raise NotImplementedError(f"Async not supported on {self.name}.")
+        Args:
+            document_name: Full name of the document to delete

-    async def aresponse(self, messages: List[Message]) -> ModelResponse:
-        raise NotImplementedError(f"Async not supported on {self.name}.")
+        Example:
+            ```python
+            model = Gemini(id="gemini-2.5-flash")
+            model.delete_document("fileSearchStores/store-123/documents/doc-456")
+            ```
+        """
+        try:
+            self.get_client().file_search_stores.documents.delete(name=document_name)
+            log_info(f"Deleted document: {document_name}")
+        except Exception as e:
+            log_error(f"Error deleting document {document_name}: {e}")
+            raise

-    async def aresponse_stream(self, messages: List[Message]) -> ModelResponse:
-        raise NotImplementedError(f"Async not supported on {self.name}.")
+    async def async_delete_document(self, document_name: str) -> None:
+        """
+        Async version of delete_document.
+
+        Args:
+            document_name: Full name of the document to delete
+        """
+        try:
+            await self.get_client().aio.file_search_stores.documents.delete(name=document_name)
+            log_info(f"Deleted document: {document_name}")
+        except Exception as e:
+            log_error(f"Error deleting document {document_name}: {e}")
+            raise
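A hedged end-to-end cleanup sketch chaining the helpers from this hunk: list the documents, delete each by its full resource name, then drop the now-empty store (store name is a placeholder):

```python
from agno.models.google import Gemini  # import path assumed for illustration

model = Gemini(id="gemini-2.5-flash")
store_name = "fileSearchStores/my-store"  # placeholder

# Remove every document, then the store itself; delete_file_search_store(..., force=True)
# would skip the per-document pass.
for doc in model.list_documents(store_name):
    model.delete_document(doc.name)  # doc.name assumed to carry the full resource name
model.delete_file_search_store(store_name)
```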