PyPI - agno - Versions diffs - 1.8.1__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

agno-1.8.1-py3-none-any.whl → agno-2.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (590)

agno/__init__.py +8 -0
agno/agent/__init__.py +19 -27
agno/agent/agent.py +3143 -4170
agno/api/agent.py +11 -67
agno/api/api.py +5 -46
agno/api/evals.py +8 -19
agno/api/os.py +17 -0
agno/api/routes.py +6 -41
agno/api/schemas/__init__.py +9 -0
agno/api/schemas/agent.py +5 -21
agno/api/schemas/evals.py +7 -16
agno/api/schemas/os.py +14 -0
agno/api/schemas/team.py +5 -21
agno/api/schemas/utils.py +21 -0
agno/api/schemas/workflows.py +11 -7
agno/api/settings.py +53 -0
agno/api/team.py +11 -66
agno/api/workflow.py +28 -0
agno/cloud/aws/base.py +214 -0
agno/cloud/aws/s3/__init__.py +2 -0
agno/cloud/aws/s3/api_client.py +43 -0
agno/cloud/aws/s3/bucket.py +195 -0
agno/cloud/aws/s3/object.py +57 -0
agno/db/__init__.py +24 -0
agno/db/base.py +245 -0
agno/db/dynamo/__init__.py +3 -0
agno/db/dynamo/dynamo.py +1743 -0
agno/db/dynamo/schemas.py +278 -0
agno/db/dynamo/utils.py +684 -0
agno/db/firestore/__init__.py +3 -0
agno/db/firestore/firestore.py +1432 -0
agno/db/firestore/schemas.py +130 -0
agno/db/firestore/utils.py +278 -0
agno/db/gcs_json/__init__.py +3 -0
agno/db/gcs_json/gcs_json_db.py +1001 -0
agno/db/gcs_json/utils.py +194 -0
agno/db/in_memory/__init__.py +3 -0
agno/db/in_memory/in_memory_db.py +882 -0
agno/db/in_memory/utils.py +172 -0
agno/db/json/__init__.py +3 -0
agno/db/json/json_db.py +1045 -0
agno/db/json/utils.py +196 -0
agno/db/migrations/v1_to_v2.py +162 -0
agno/db/mongo/__init__.py +3 -0
agno/db/mongo/mongo.py +1416 -0
agno/db/mongo/schemas.py +77 -0
agno/db/mongo/utils.py +204 -0
agno/db/mysql/__init__.py +3 -0
agno/db/mysql/mysql.py +1719 -0
agno/db/mysql/schemas.py +124 -0
agno/db/mysql/utils.py +297 -0
agno/db/postgres/__init__.py +3 -0
agno/db/postgres/postgres.py +1710 -0
agno/db/postgres/schemas.py +124 -0
agno/db/postgres/utils.py +280 -0
agno/db/redis/__init__.py +3 -0
agno/db/redis/redis.py +1367 -0
agno/db/redis/schemas.py +109 -0
agno/db/redis/utils.py +288 -0
agno/db/schemas/__init__.py +3 -0
agno/db/schemas/evals.py +33 -0
agno/db/schemas/knowledge.py +40 -0
agno/db/schemas/memory.py +46 -0
agno/db/singlestore/__init__.py +3 -0
agno/db/singlestore/schemas.py +116 -0
agno/db/singlestore/singlestore.py +1712 -0
agno/db/singlestore/utils.py +326 -0
agno/db/sqlite/__init__.py +3 -0
agno/db/sqlite/schemas.py +119 -0
agno/db/sqlite/sqlite.py +1676 -0
agno/db/sqlite/utils.py +268 -0
agno/db/utils.py +88 -0
agno/eval/__init__.py +14 -0
agno/eval/accuracy.py +154 -48
agno/eval/performance.py +88 -23
agno/eval/reliability.py +73 -20
agno/eval/utils.py +23 -13
agno/integrations/discord/__init__.py +3 -0
agno/{app → integrations}/discord/client.py +15 -11
agno/knowledge/__init__.py +2 -2
agno/{document → knowledge}/chunking/agentic.py +2 -2
agno/{document → knowledge}/chunking/document.py +2 -2
agno/{document → knowledge}/chunking/fixed.py +3 -3
agno/{document → knowledge}/chunking/markdown.py +2 -2
agno/{document → knowledge}/chunking/recursive.py +2 -2
agno/{document → knowledge}/chunking/row.py +2 -2
agno/knowledge/chunking/semantic.py +59 -0
agno/knowledge/chunking/strategy.py +121 -0
agno/knowledge/content.py +74 -0
agno/knowledge/document/__init__.py +5 -0
agno/{document → knowledge/document}/base.py +12 -2
agno/knowledge/embedder/__init__.py +5 -0
agno/{embedder → knowledge/embedder}/aws_bedrock.py +127 -1
agno/{embedder → knowledge/embedder}/azure_openai.py +65 -1
agno/{embedder → knowledge/embedder}/base.py +6 -0
agno/{embedder → knowledge/embedder}/cohere.py +72 -1
agno/{embedder → knowledge/embedder}/fastembed.py +17 -1
agno/{embedder → knowledge/embedder}/fireworks.py +1 -1
agno/{embedder → knowledge/embedder}/google.py +74 -1
agno/{embedder → knowledge/embedder}/huggingface.py +36 -2
agno/{embedder → knowledge/embedder}/jina.py +48 -2
agno/knowledge/embedder/langdb.py +22 -0
agno/knowledge/embedder/mistral.py +139 -0
agno/{embedder → knowledge/embedder}/nebius.py +1 -1
agno/{embedder → knowledge/embedder}/ollama.py +54 -3
agno/knowledge/embedder/openai.py +223 -0
agno/{embedder → knowledge/embedder}/sentence_transformer.py +16 -1
agno/{embedder → knowledge/embedder}/together.py +1 -1
agno/{embedder → knowledge/embedder}/voyageai.py +49 -1
agno/knowledge/knowledge.py +1551 -0
agno/knowledge/reader/__init__.py +7 -0
agno/{document → knowledge}/reader/arxiv_reader.py +32 -4
agno/knowledge/reader/base.py +88 -0
agno/{document → knowledge}/reader/csv_reader.py +47 -65
agno/knowledge/reader/docx_reader.py +83 -0
agno/{document → knowledge}/reader/firecrawl_reader.py +42 -21
agno/{document → knowledge}/reader/json_reader.py +30 -9
agno/{document → knowledge}/reader/markdown_reader.py +58 -9
agno/{document → knowledge}/reader/pdf_reader.py +71 -126
agno/knowledge/reader/reader_factory.py +268 -0
agno/knowledge/reader/s3_reader.py +101 -0
agno/{document → knowledge}/reader/text_reader.py +31 -10
agno/knowledge/reader/url_reader.py +128 -0
agno/knowledge/reader/web_search_reader.py +366 -0
agno/{document → knowledge}/reader/website_reader.py +37 -10
agno/knowledge/reader/wikipedia_reader.py +59 -0
agno/knowledge/reader/youtube_reader.py +78 -0
agno/knowledge/remote_content/remote_content.py +88 -0
agno/{reranker → knowledge/reranker}/base.py +1 -1
agno/{reranker → knowledge/reranker}/cohere.py +2 -2
agno/{reranker → knowledge/reranker}/infinity.py +2 -2
agno/{reranker → knowledge/reranker}/sentence_transformer.py +2 -2
agno/knowledge/types.py +30 -0
agno/knowledge/utils.py +169 -0
agno/media.py +269 -268
agno/memory/__init__.py +2 -10
agno/memory/manager.py +1003 -148
agno/models/aimlapi/__init__.py +2 -2
agno/models/aimlapi/aimlapi.py +6 -6
agno/models/anthropic/claude.py +131 -131
agno/models/aws/bedrock.py +110 -182
agno/models/aws/claude.py +64 -18
agno/models/azure/ai_foundry.py +73 -23
agno/models/base.py +346 -290
agno/models/cerebras/cerebras.py +84 -27
agno/models/cohere/chat.py +106 -98
agno/models/google/gemini.py +105 -46
agno/models/groq/groq.py +97 -35
agno/models/huggingface/huggingface.py +92 -27
agno/models/ibm/watsonx.py +72 -13
agno/models/litellm/chat.py +85 -13
agno/models/message.py +46 -151
agno/models/meta/llama.py +85 -49
agno/models/metrics.py +120 -0
agno/models/mistral/mistral.py +90 -21
agno/models/ollama/__init__.py +0 -2
agno/models/ollama/chat.py +85 -47
agno/models/openai/chat.py +154 -37
agno/models/openai/responses.py +178 -105
agno/models/perplexity/perplexity.py +26 -2
agno/models/portkey/portkey.py +0 -7
agno/models/response.py +15 -9
agno/models/utils.py +20 -0
agno/models/vercel/__init__.py +2 -2
agno/models/vercel/v0.py +1 -1
agno/models/vllm/__init__.py +2 -2
agno/models/vllm/vllm.py +3 -3
agno/models/xai/xai.py +10 -10
agno/os/__init__.py +3 -0
agno/os/app.py +497 -0
agno/os/auth.py +47 -0
agno/os/config.py +103 -0
agno/os/interfaces/agui/__init__.py +3 -0
agno/os/interfaces/agui/agui.py +31 -0
agno/{app/agui/async_router.py → os/interfaces/agui/router.py} +16 -16
agno/{app → os/interfaces}/agui/utils.py +77 -33
agno/os/interfaces/base.py +21 -0
agno/os/interfaces/slack/__init__.py +3 -0
agno/{app/slack/async_router.py → os/interfaces/slack/router.py} +3 -5
agno/os/interfaces/slack/slack.py +32 -0
agno/os/interfaces/whatsapp/__init__.py +3 -0
agno/{app/whatsapp/async_router.py → os/interfaces/whatsapp/router.py} +4 -7
agno/os/interfaces/whatsapp/whatsapp.py +29 -0
agno/os/mcp.py +235 -0
agno/os/router.py +1400 -0
agno/os/routers/__init__.py +3 -0
agno/os/routers/evals/__init__.py +3 -0
agno/os/routers/evals/evals.py +393 -0
agno/os/routers/evals/schemas.py +142 -0
agno/os/routers/evals/utils.py +161 -0
agno/os/routers/knowledge/__init__.py +3 -0
agno/os/routers/knowledge/knowledge.py +850 -0
agno/os/routers/knowledge/schemas.py +118 -0
agno/os/routers/memory/__init__.py +3 -0
agno/os/routers/memory/memory.py +410 -0
agno/os/routers/memory/schemas.py +58 -0
agno/os/routers/metrics/__init__.py +3 -0
agno/os/routers/metrics/metrics.py +178 -0
agno/os/routers/metrics/schemas.py +47 -0
agno/os/routers/session/__init__.py +3 -0
agno/os/routers/session/session.py +536 -0
agno/os/schema.py +945 -0
agno/{app/playground → os}/settings.py +7 -15
agno/os/utils.py +270 -0
agno/reasoning/azure_ai_foundry.py +4 -4
agno/reasoning/deepseek.py +4 -4
agno/reasoning/default.py +6 -11
agno/reasoning/groq.py +4 -4
agno/reasoning/helpers.py +4 -6
agno/reasoning/ollama.py +4 -4
agno/reasoning/openai.py +4 -4
agno/run/agent.py +633 -0
agno/run/base.py +53 -77
agno/run/cancel.py +81 -0
agno/run/team.py +243 -96
agno/run/workflow.py +550 -12
agno/session/__init__.py +10 -0
agno/session/agent.py +244 -0
agno/session/summary.py +225 -0
agno/session/team.py +262 -0
agno/{storage/session/v2 → session}/workflow.py +47 -24
agno/team/__init__.py +15 -16
agno/team/team.py +3260 -4824
agno/tools/agentql.py +14 -5
agno/tools/airflow.py +9 -4
agno/tools/api.py +7 -3
agno/tools/apify.py +2 -46
agno/tools/arxiv.py +8 -3
agno/tools/aws_lambda.py +7 -5
agno/tools/aws_ses.py +7 -1
agno/tools/baidusearch.py +4 -1
agno/tools/bitbucket.py +4 -4
agno/tools/brandfetch.py +14 -11
agno/tools/bravesearch.py +4 -1
agno/tools/brightdata.py +43 -23
agno/tools/browserbase.py +13 -4
agno/tools/calcom.py +12 -10
agno/tools/calculator.py +10 -27
agno/tools/cartesia.py +20 -17
agno/tools/{clickup_tool.py → clickup.py} +12 -25
agno/tools/confluence.py +8 -8
agno/tools/crawl4ai.py +7 -1
agno/tools/csv_toolkit.py +9 -8
agno/tools/dalle.py +22 -12
agno/tools/daytona.py +13 -16
agno/tools/decorator.py +6 -3
agno/tools/desi_vocal.py +17 -8
agno/tools/discord.py +11 -8
agno/tools/docker.py +30 -42
agno/tools/duckdb.py +34 -53
agno/tools/duckduckgo.py +8 -7
agno/tools/e2b.py +62 -62
agno/tools/eleven_labs.py +36 -29
agno/tools/email.py +4 -1
agno/tools/evm.py +7 -1
agno/tools/exa.py +19 -14
agno/tools/fal.py +30 -30
agno/tools/file.py +9 -8
agno/tools/financial_datasets.py +25 -44
agno/tools/firecrawl.py +22 -22
agno/tools/function.py +127 -18
agno/tools/giphy.py +23 -11
agno/tools/github.py +48 -126
agno/tools/gmail.py +45 -61
agno/tools/google_bigquery.py +7 -6
agno/tools/google_maps.py +11 -26
agno/tools/googlesearch.py +7 -2
agno/tools/googlesheets.py +21 -17
agno/tools/hackernews.py +9 -5
agno/tools/jina.py +5 -4
agno/tools/jira.py +18 -9
agno/tools/knowledge.py +31 -32
agno/tools/linear.py +19 -34
agno/tools/linkup.py +5 -1
agno/tools/local_file_system.py +8 -5
agno/tools/lumalab.py +32 -20
agno/tools/mcp.py +1 -2
agno/tools/mem0.py +18 -12
agno/tools/memori.py +14 -10
agno/tools/mlx_transcribe.py +3 -2
agno/tools/models/azure_openai.py +33 -15
agno/tools/models/gemini.py +59 -32
agno/tools/models/groq.py +30 -23
agno/tools/models/nebius.py +28 -12
agno/tools/models_labs.py +40 -16
agno/tools/moviepy_video.py +7 -6
agno/tools/neo4j.py +10 -8
agno/tools/newspaper.py +7 -2
agno/tools/newspaper4k.py +8 -3
agno/tools/openai.py +58 -32
agno/tools/openbb.py +12 -11
agno/tools/opencv.py +63 -47
agno/tools/openweather.py +14 -12
agno/tools/pandas.py +11 -3
agno/tools/postgres.py +4 -12
agno/tools/pubmed.py +4 -1
agno/tools/python.py +9 -22
agno/tools/reasoning.py +35 -27
agno/tools/reddit.py +11 -26
agno/tools/replicate.py +55 -42
agno/tools/resend.py +4 -1
agno/tools/scrapegraph.py +15 -14
agno/tools/searxng.py +10 -23
agno/tools/serpapi.py +6 -3
agno/tools/serper.py +13 -4
agno/tools/shell.py +9 -2
agno/tools/slack.py +12 -11
agno/tools/sleep.py +3 -2
agno/tools/spider.py +24 -4
agno/tools/sql.py +7 -6
agno/tools/tavily.py +6 -4
agno/tools/telegram.py +12 -4
agno/tools/todoist.py +11 -31
agno/tools/toolkit.py +1 -1
agno/tools/trafilatura.py +22 -6
agno/tools/trello.py +9 -22
agno/tools/twilio.py +10 -3
agno/tools/user_control_flow.py +6 -1
agno/tools/valyu.py +34 -5
agno/tools/visualization.py +19 -28
agno/tools/webbrowser.py +4 -3
agno/tools/webex.py +11 -7
agno/tools/website.py +15 -46
agno/tools/webtools.py +12 -4
agno/tools/whatsapp.py +5 -9
agno/tools/wikipedia.py +20 -13
agno/tools/x.py +14 -13
agno/tools/yfinance.py +13 -40
agno/tools/youtube.py +26 -20
agno/tools/zendesk.py +7 -2
agno/tools/zep.py +10 -7
agno/tools/zoom.py +10 -9
agno/utils/common.py +1 -19
agno/utils/events.py +100 -123
agno/utils/gemini.py +32 -2
agno/utils/knowledge.py +29 -0
agno/utils/log.py +54 -4
agno/utils/mcp.py +68 -10
agno/utils/media.py +39 -0
agno/utils/message.py +12 -1
agno/utils/models/aws_claude.py +1 -1
agno/utils/models/claude.py +47 -4
agno/utils/models/cohere.py +1 -1
agno/utils/models/mistral.py +8 -7
agno/utils/models/schema_utils.py +3 -3
agno/utils/models/watsonx.py +1 -1
agno/utils/openai.py +1 -1
agno/utils/pprint.py +33 -32
agno/utils/print_response/agent.py +779 -0
agno/utils/print_response/team.py +1669 -0
agno/utils/print_response/workflow.py +1451 -0
agno/utils/prompts.py +14 -14
agno/utils/reasoning.py +87 -0
agno/utils/response.py +42 -42
agno/utils/streamlit.py +481 -0
agno/utils/string.py +8 -22
agno/utils/team.py +50 -0
agno/utils/timer.py +2 -2
agno/vectordb/base.py +33 -21
agno/vectordb/cassandra/cassandra.py +287 -23
agno/vectordb/chroma/chromadb.py +482 -59
agno/vectordb/clickhouse/clickhousedb.py +270 -63
agno/vectordb/couchbase/couchbase.py +309 -29
agno/vectordb/lancedb/lance_db.py +360 -21
agno/vectordb/langchaindb/__init__.py +5 -0
agno/vectordb/langchaindb/langchaindb.py +145 -0
agno/vectordb/lightrag/__init__.py +5 -0
agno/vectordb/lightrag/lightrag.py +374 -0
agno/vectordb/llamaindex/llamaindexdb.py +127 -0
agno/vectordb/milvus/milvus.py +242 -32
agno/vectordb/mongodb/mongodb.py +200 -24
agno/vectordb/pgvector/pgvector.py +319 -37
agno/vectordb/pineconedb/pineconedb.py +221 -27
agno/vectordb/qdrant/qdrant.py +334 -14
agno/vectordb/singlestore/singlestore.py +286 -29
agno/vectordb/surrealdb/surrealdb.py +187 -7
agno/vectordb/upstashdb/upstashdb.py +342 -26
agno/vectordb/weaviate/weaviate.py +227 -165
agno/workflow/__init__.py +17 -13
agno/workflow/{v2/condition.py → condition.py} +135 -32
agno/workflow/{v2/loop.py → loop.py} +115 -28
agno/workflow/{v2/parallel.py → parallel.py} +138 -108
agno/workflow/{v2/router.py → router.py} +133 -32
agno/workflow/{v2/step.py → step.py} +207 -49
agno/workflow/{v2/steps.py → steps.py} +147 -66
agno/workflow/types.py +482 -0
agno/workflow/workflow.py +2410 -696
agno-2.0.0.dist-info/METADATA +494 -0
agno-2.0.0.dist-info/RECORD +515 -0
agno-2.0.0.dist-info/licenses/LICENSE +201 -0
agno/agent/metrics.py +0 -107
agno/api/app.py +0 -35
agno/api/playground.py +0 -92
agno/api/schemas/app.py +0 -12
agno/api/schemas/playground.py +0 -22
agno/api/schemas/user.py +0 -35
agno/api/schemas/workspace.py +0 -46
agno/api/user.py +0 -160
agno/api/workflows.py +0 -33
agno/api/workspace.py +0 -175
agno/app/agui/__init__.py +0 -3
agno/app/agui/app.py +0 -17
agno/app/agui/sync_router.py +0 -120
agno/app/base.py +0 -186
agno/app/discord/__init__.py +0 -3
agno/app/fastapi/__init__.py +0 -3
agno/app/fastapi/app.py +0 -107
agno/app/fastapi/async_router.py +0 -457
agno/app/fastapi/sync_router.py +0 -448
agno/app/playground/app.py +0 -228
agno/app/playground/async_router.py +0 -1050
agno/app/playground/deploy.py +0 -249
agno/app/playground/operator.py +0 -183
agno/app/playground/schemas.py +0 -220
agno/app/playground/serve.py +0 -55
agno/app/playground/sync_router.py +0 -1042
agno/app/playground/utils.py +0 -46
agno/app/settings.py +0 -15
agno/app/slack/__init__.py +0 -3
agno/app/slack/app.py +0 -19
agno/app/slack/sync_router.py +0 -92
agno/app/utils.py +0 -54
agno/app/whatsapp/__init__.py +0 -3
agno/app/whatsapp/app.py +0 -15
agno/app/whatsapp/sync_router.py +0 -197
agno/cli/auth_server.py +0 -249
agno/cli/config.py +0 -274
agno/cli/console.py +0 -88
agno/cli/credentials.py +0 -23
agno/cli/entrypoint.py +0 -571
agno/cli/operator.py +0 -357
agno/cli/settings.py +0 -96
agno/cli/ws/ws_cli.py +0 -817
agno/constants.py +0 -13
agno/document/__init__.py +0 -5
agno/document/chunking/semantic.py +0 -45
agno/document/chunking/strategy.py +0 -31
agno/document/reader/__init__.py +0 -5
agno/document/reader/base.py +0 -47
agno/document/reader/docx_reader.py +0 -60
agno/document/reader/gcs/pdf_reader.py +0 -44
agno/document/reader/s3/pdf_reader.py +0 -59
agno/document/reader/s3/text_reader.py +0 -63
agno/document/reader/url_reader.py +0 -59
agno/document/reader/youtube_reader.py +0 -58
agno/embedder/__init__.py +0 -5
agno/embedder/langdb.py +0 -80
agno/embedder/mistral.py +0 -82
agno/embedder/openai.py +0 -78
agno/file/__init__.py +0 -5
agno/file/file.py +0 -16
agno/file/local/csv.py +0 -32
agno/file/local/txt.py +0 -19
agno/infra/app.py +0 -240
agno/infra/base.py +0 -144
agno/infra/context.py +0 -20
agno/infra/db_app.py +0 -52
agno/infra/resource.py +0 -205
agno/infra/resources.py +0 -55
agno/knowledge/agent.py +0 -702
agno/knowledge/arxiv.py +0 -33
agno/knowledge/combined.py +0 -36
agno/knowledge/csv.py +0 -144
agno/knowledge/csv_url.py +0 -124
agno/knowledge/document.py +0 -223
agno/knowledge/docx.py +0 -137
agno/knowledge/firecrawl.py +0 -34
agno/knowledge/gcs/__init__.py +0 -0
agno/knowledge/gcs/base.py +0 -39
agno/knowledge/gcs/pdf.py +0 -125
agno/knowledge/json.py +0 -137
agno/knowledge/langchain.py +0 -71
agno/knowledge/light_rag.py +0 -273
agno/knowledge/llamaindex.py +0 -66
agno/knowledge/markdown.py +0 -154
agno/knowledge/pdf.py +0 -164
agno/knowledge/pdf_bytes.py +0 -42
agno/knowledge/pdf_url.py +0 -148
agno/knowledge/s3/__init__.py +0 -0
agno/knowledge/s3/base.py +0 -64
agno/knowledge/s3/pdf.py +0 -33
agno/knowledge/s3/text.py +0 -34
agno/knowledge/text.py +0 -141
agno/knowledge/url.py +0 -46
agno/knowledge/website.py +0 -179
agno/knowledge/wikipedia.py +0 -32
agno/knowledge/youtube.py +0 -35
agno/memory/agent.py +0 -423
agno/memory/classifier.py +0 -104
agno/memory/db/__init__.py +0 -5
agno/memory/db/base.py +0 -42
agno/memory/db/mongodb.py +0 -189
agno/memory/db/postgres.py +0 -203
agno/memory/db/sqlite.py +0 -193
agno/memory/memory.py +0 -22
agno/memory/row.py +0 -36
agno/memory/summarizer.py +0 -201
agno/memory/summary.py +0 -19
agno/memory/team.py +0 -415
agno/memory/v2/__init__.py +0 -2
agno/memory/v2/db/__init__.py +0 -1
agno/memory/v2/db/base.py +0 -42
agno/memory/v2/db/firestore.py +0 -339
agno/memory/v2/db/mongodb.py +0 -196
agno/memory/v2/db/postgres.py +0 -214
agno/memory/v2/db/redis.py +0 -187
agno/memory/v2/db/schema.py +0 -54
agno/memory/v2/db/sqlite.py +0 -209
agno/memory/v2/manager.py +0 -437
agno/memory/v2/memory.py +0 -1097
agno/memory/v2/schema.py +0 -55
agno/memory/v2/summarizer.py +0 -215
agno/memory/workflow.py +0 -38
agno/models/ollama/tools.py +0 -430
agno/models/qwen/__init__.py +0 -5
agno/playground/__init__.py +0 -10
agno/playground/deploy.py +0 -3
agno/playground/playground.py +0 -3
agno/playground/serve.py +0 -3
agno/playground/settings.py +0 -3
agno/reranker/__init__.py +0 -0
agno/run/response.py +0 -467
agno/run/v2/__init__.py +0 -0
agno/run/v2/workflow.py +0 -567
agno/storage/__init__.py +0 -0
agno/storage/agent/__init__.py +0 -0
agno/storage/agent/dynamodb.py +0 -1
agno/storage/agent/json.py +0 -1
agno/storage/agent/mongodb.py +0 -1
agno/storage/agent/postgres.py +0 -1
agno/storage/agent/singlestore.py +0 -1
agno/storage/agent/sqlite.py +0 -1
agno/storage/agent/yaml.py +0 -1
agno/storage/base.py +0 -60
agno/storage/dynamodb.py +0 -673
agno/storage/firestore.py +0 -297
agno/storage/gcs_json.py +0 -261
agno/storage/in_memory.py +0 -234
agno/storage/json.py +0 -237
agno/storage/mongodb.py +0 -328
agno/storage/mysql.py +0 -685
agno/storage/postgres.py +0 -682
agno/storage/redis.py +0 -336
agno/storage/session/__init__.py +0 -16
agno/storage/session/agent.py +0 -64
agno/storage/session/team.py +0 -63
agno/storage/session/v2/__init__.py +0 -5
agno/storage/session/workflow.py +0 -61
agno/storage/singlestore.py +0 -606
agno/storage/sqlite.py +0 -646
agno/storage/workflow/__init__.py +0 -0
agno/storage/workflow/mongodb.py +0 -1
agno/storage/workflow/postgres.py +0 -1
agno/storage/workflow/sqlite.py +0 -1
agno/storage/yaml.py +0 -241
agno/tools/thinking.py +0 -73
agno/utils/defaults.py +0 -57
agno/utils/filesystem.py +0 -39
agno/utils/git.py +0 -52
agno/utils/json_io.py +0 -30
agno/utils/load_env.py +0 -19
agno/utils/py_io.py +0 -19
agno/utils/pyproject.py +0 -18
agno/utils/resource_filter.py +0 -31
agno/workflow/v2/__init__.py +0 -21
agno/workflow/v2/types.py +0 -357
agno/workflow/v2/workflow.py +0 -3312
agno/workspace/__init__.py +0 -0
agno/workspace/config.py +0 -325
agno/workspace/enums.py +0 -6
agno/workspace/helpers.py +0 -52
agno/workspace/operator.py +0 -757
agno/workspace/settings.py +0 -158
agno-1.8.1.dist-info/METADATA +0 -982
agno-1.8.1.dist-info/RECORD +0 -566
agno-1.8.1.dist-info/entry_points.txt +0 -3
agno-1.8.1.dist-info/licenses/LICENSE +0 -375
/agno/{app → db/migrations}/__init__.py +0 -0
/agno/{app/playground/__init__.py → db/schemas/metrics.py} +0 -0
/agno/{cli → integrations}/__init__.py +0 -0
/agno/{cli/ws → knowledge/chunking}/__init__.py +0 -0
/agno/{document/chunking → knowledge/remote_content}/__init__.py +0 -0
/agno/{document/reader/gcs → knowledge/reranker}/__init__.py +0 -0
/agno/{document/reader/s3 → os/interfaces}/__init__.py +0 -0
/agno/{app → os/interfaces}/slack/security.py +0 -0
/agno/{app → os/interfaces}/whatsapp/security.py +0 -0
/agno/{file/local → utils/print_response}/__init__.py +0 -0
/agno/{infra → vectordb/llamaindex}/__init__.py +0 -0
{agno-1.8.1.dist-info → agno-2.0.0.dist-info}/WHEEL +0 -0
{agno-1.8.1.dist-info → agno-2.0.0.dist-info}/top_level.txt +0 -0

agno/models/message.py CHANGED

@@ -1,13 +1,12 @@
 import json
-from dataclasses import asdict, dataclass
 from time import time
 from typing import Any, Dict, List, Optional, Sequence, Union
 from pydantic import BaseModel, ConfigDict, Field
-from agno.media import Audio, AudioResponse, File, Image, ImageArtifact, Video
+from agno.media import Audio, File, Image, Video
+from agno.models.metrics import Metrics
 from agno.utils.log import log_debug, log_error, log_info, log_warning
-from agno.utils.timer import Timer
 class MessageReferences(BaseModel):
@@ -49,118 +48,6 @@ class Citations(BaseModel):
     documents: Optional[List[DocumentCitation]] = None
-@dataclass
-class MessageMetrics:
-    input_tokens: int = 0
-    output_tokens: int = 0
-    total_tokens: int = 0
-    audio_tokens: int = 0
-    input_audio_tokens: int = 0
-    output_audio_tokens: int = 0
-    cached_tokens: int = 0
-    cache_write_tokens: int = 0
-    reasoning_tokens: int = 0
-    prompt_tokens: int = 0
-    completion_tokens: int = 0
-    prompt_tokens_details: Optional[dict] = None
-    completion_tokens_details: Optional[dict] = None
-    additional_metrics: Optional[dict] = None
-    time: Optional[float] = None
-    time_to_first_token: Optional[float] = None
-    timer: Optional[Timer] = None
-    def to_dict(self) -> Dict[str, Any]:
-        metrics_dict = asdict(self)
-        metrics_dict.pop("timer")
-        metrics_dict = {
-            k: v
-            for k, v in metrics_dict.items()
-            if v is not None and (not isinstance(v, (int, float)) or v != 0) and (not isinstance(v, dict) or len(v) > 0)
-        }
-        return metrics_dict
-    def start_timer(self):
-        if self.timer is None:
-            self.timer = Timer()
-        self.timer.start()
-    def stop_timer(self, set_time: bool = True):
-        if self.timer is not None:
-            self.timer.stop()
-            if set_time:
-                self.time = self.timer.elapsed
-    def set_time_to_first_token(self):
-        if self.timer is not None:
-            self.time_to_first_token = self.timer.elapsed
-    def __add__(self, other: "MessageMetrics") -> "MessageMetrics":
-        # Create new instance with summed basic metrics
-        result = MessageMetrics(
-            input_tokens=self.input_tokens + other.input_tokens,
-            output_tokens=self.output_tokens + other.output_tokens,
-            total_tokens=self.total_tokens + other.total_tokens,
-            prompt_tokens=self.prompt_tokens + other.prompt_tokens,
-            completion_tokens=self.completion_tokens + other.completion_tokens,
-            audio_tokens=self.audio_tokens + other.audio_tokens,
-            input_audio_tokens=self.input_audio_tokens + other.input_audio_tokens,
-            output_audio_tokens=self.output_audio_tokens + other.output_audio_tokens,
-            cached_tokens=self.cached_tokens + other.cached_tokens,
-            cache_write_tokens=self.cache_write_tokens + other.cache_write_tokens,
-            reasoning_tokens=self.reasoning_tokens + other.reasoning_tokens,
-        )
-        # Handle prompt_tokens_details
-        if self.prompt_tokens_details or other.prompt_tokens_details:
-            result.prompt_tokens_details = {}
-            # Merge from self
-            if self.prompt_tokens_details:
-                result.prompt_tokens_details.update(self.prompt_tokens_details)
-            # Add values from other
-            if other.prompt_tokens_details:
-                for key, value in other.prompt_tokens_details.items():
-                    result.prompt_tokens_details[key] = result.prompt_tokens_details.get(key, 0) + value
-        # Handle completion_tokens_details similarly
-        if self.completion_tokens_details or other.completion_tokens_details:
-            result.completion_tokens_details = {}
-            if self.completion_tokens_details:
-                result.completion_tokens_details.update(self.completion_tokens_details)
-            if other.completion_tokens_details:
-                for key, value in other.completion_tokens_details.items():
-                    result.completion_tokens_details[key] = result.completion_tokens_details.get(key, 0) + value
-        # Handle additional metrics
-        if self.additional_metrics or other.additional_metrics:
-            result.additional_metrics = {}
-            if self.additional_metrics:
-                result.additional_metrics.update(self.additional_metrics)
-            if other.additional_metrics:
-                result.additional_metrics.update(other.additional_metrics)
-        # Sum times if both exist
-        if self.time is not None and other.time is not None:
-            result.time = self.time + other.time
-        elif self.time is not None:
-            result.time = self.time
-        elif other.time is not None:
-            result.time = other.time
-        # Handle time_to_first_token (take the first non-None value)
-        result.time_to_first_token = self.time_to_first_token or other.time_to_first_token
-        return result
-    def __radd__(self, other: "MessageMetrics") -> "MessageMetrics":
-        if other == 0:  # Handle sum() starting value
-            return self
-        return self + other
 class Message(BaseModel):
     """Message sent to the Model"""
@@ -184,12 +71,12 @@ class Message(BaseModel):
     files: Optional[Sequence[File]] = None
     # Output from the models
-    audio_output: Optional[AudioResponse] = None
-    image_output: Optional[ImageArtifact] = None
+    audio_output: Optional[Audio] = None
+    image_output: Optional[Image] = None
+    video_output: Optional[Video] = None
     # The thinking content from the model
-    thinking: Optional[str] = None
-    redacted_thinking: Optional[str] = None
+    redacted_reasoning_content: Optional[str] = None
     # Data from the provider we might need on subsequent messages
     provider_data: Optional[Dict[str, Any]] = None
@@ -213,7 +100,7 @@ class Message(BaseModel):
     # This flag is enabled when a message is fetched from the agent's memory.
     from_history: bool = False
     # Metrics for the message.
-    metrics: MessageMetrics = Field(default_factory=MessageMetrics)
+    metrics: Metrics = Field(default_factory=Metrics)
     # The references added to the message for RAG
     references: Optional[MessageReferences] = None
     # The Unix timestamp the message was created.
@@ -232,6 +119,10 @@ class Message(BaseModel):
                 return json.dumps(self.content)
         return ""
+    @classmethod
+    def from_dict(cls, data: Dict[str, Any]) -> "Message":
+        return cls(**data)
     def to_dict(self) -> Dict[str, Any]:
         """Returns the message as a dictionary."""
         message_dict = {
@@ -246,8 +137,7 @@ class Message(BaseModel):
             "tool_args": self.tool_args,
             "tool_call_error": self.tool_call_error,
             "tool_calls": self.tool_calls,
-            "thinking": self.thinking,
-            "redacted_thinking": self.redacted_thinking,
+            "redacted_reasoning_content": self.redacted_reasoning_content,
             "provider_data": self.provider_data,
         }
         # Filter out None and empty collections
@@ -316,8 +206,8 @@ class Message(BaseModel):
             _logger(f"Name: {self.name}")
         if self.tool_call_id:
             _logger(f"Tool call Id: {self.tool_call_id}")
-        if self.thinking:
-            _logger(f"<thinking>\n{self.thinking}\n</thinking>")
+        if self.reasoning_content:
+            _logger(f"<reasoning>\n{self.reasoning_content}\n</reasoning>")
         if self.content:
             if isinstance(self.content, str) or isinstance(self.content, list):
                 _logger(self.content)
@@ -338,12 +228,13 @@ class Message(BaseModel):
                             if isinstance(tool_call_arguments, dict)
                             else json.loads(tool_call_arguments)
                         )
-                        # Ensure tool_call_args is a dictionary before calling .items()
-                        if isinstance(tool_call_args, dict):
-                            arguments = ", ".join(f"{k}: {v}" for k, v in tool_call_args.items())
-                            tool_calls_list.append(f"    Arguments: '{arguments}'")
-                        else:
-                            tool_calls_list.append(f"    Arguments: '{tool_call_args}'")
+                        if tool_call_args:
+                            # Ensure tool_call_args is a dictionary before calling .items()
+                            if isinstance(tool_call_args, dict):
+                                arguments = ", ".join(f"{k}: {v}" for k, v in tool_call_args.items())
+                                tool_calls_list.append(f"    Arguments: '{arguments}'")
+                            else:
+                                tool_calls_list.append(f"    Arguments: '{tool_call_args}'")
                     except json.JSONDecodeError:
                         tool_calls_list.append("    Arguments: 'Invalid JSON format'")
             tool_calls_str = "\n".join(tool_calls_list)
@@ -359,42 +250,46 @@ class Message(BaseModel):
             _logger(f"Files added: {len(self.files)}")
         metrics_header = " TOOL METRICS " if self.role == "tool" else " METRICS "
-        if metrics and self.metrics is not None and self.metrics != MessageMetrics():
+        if metrics and self.metrics is not None and self.metrics != Metrics():
             _logger(metrics_header, center=True, symbol="*")
-            # Combine token metrics into a single line
+            # Token metrics
             token_metrics = []
-            if self.metrics.input_tokens:
+            if self.metrics.input_tokens and self.metrics.input_tokens > 0:
                 token_metrics.append(f"input={self.metrics.input_tokens}")
-            if self.metrics.output_tokens:
+            if self.metrics.output_tokens and self.metrics.output_tokens > 0:
                 token_metrics.append(f"output={self.metrics.output_tokens}")
-            if self.metrics.total_tokens:
+            if self.metrics.total_tokens and self.metrics.total_tokens > 0:
                 token_metrics.append(f"total={self.metrics.total_tokens}")
-            if self.metrics.cached_tokens:
-                token_metrics.append(f"cached={self.metrics.cached_tokens}")
-            if self.metrics.cache_write_tokens:
+            if self.metrics.cache_read_tokens and self.metrics.cache_read_tokens > 0:
+                token_metrics.append(f"cached={self.metrics.cache_read_tokens}")
+            if self.metrics.cache_write_tokens and self.metrics.cache_write_tokens > 0:
                 token_metrics.append(f"cache_write_tokens={self.metrics.cache_write_tokens}")
-            if self.metrics.reasoning_tokens:
+            if self.metrics.reasoning_tokens and self.metrics.reasoning_tokens > 0:
                 token_metrics.append(f"reasoning={self.metrics.reasoning_tokens}")
-            if self.metrics.audio_tokens:
-                token_metrics.append(f"audio={self.metrics.audio_tokens}")
+            if self.metrics.audio_total_tokens and self.metrics.audio_total_tokens > 0:
+                token_metrics.append(f"audio={self.metrics.audio_total_tokens}")
             if token_metrics:
                 _logger(f"* Tokens:                      {', '.join(token_metrics)}")
-            if self.metrics.prompt_tokens_details:
-                _logger(f"* Prompt tokens details:       {self.metrics.prompt_tokens_details}")
-            if self.metrics.completion_tokens_details:
-                _logger(f"* Completion tokens details:   {self.metrics.completion_tokens_details}")
-            if self.metrics.time is not None:
-                _logger(f"* Time:                        {self.metrics.time:.4f}s")
-            if self.metrics.output_tokens and self.metrics.time:
-                _logger(f"* Tokens per second:           {self.metrics.output_tokens / self.metrics.time:.4f} tokens/s")
-            if self.metrics.time_to_first_token is not None:
+            # Time related metrics
+            if self.metrics.duration is not None and self.metrics.duration > 0:
+                _logger(f"* Duration:                    {self.metrics.duration:.4f}s")
+            if self.metrics.output_tokens and self.metrics.duration and self.metrics.duration > 0:
+                _logger(
+                    f"* Tokens per second:           {self.metrics.output_tokens / self.metrics.duration:.4f} tokens/s"
+                )
+            if self.metrics.time_to_first_token is not None and self.metrics.time_to_first_token > 0:
                 _logger(f"* Time to first token:         {self.metrics.time_to_first_token:.4f}s")
+            # Non-generic metrics
+            if self.metrics.provider_metrics:
+                _logger(f"* Provider metrics:            {self.metrics.provider_metrics}")
             if self.metrics.additional_metrics:
                 _logger(f"* Additional metrics:          {self.metrics.additional_metrics}")
             _logger(metrics_header, center=True, symbol="*")
     def content_is_valid(self) -> bool:
         """Check if the message content is valid."""
         return self.content is not None and len(self.content) > 0

agno/models/meta/llama.py CHANGED Viewed

@@ -9,18 +9,21 @@ from pydantic import BaseModel
 from agno.exceptions import ModelProviderError
 from agno.models.base import Model
 from agno.models.message import Message
+from agno.models.metrics import Metrics
 from agno.models.response import ModelResponse
+from agno.run.agent import RunOutput
 from agno.utils.log import log_debug, log_error, log_warning
 from agno.utils.models.llama import format_message
 try:
     from llama_api_client import AsyncLlamaAPIClient, LlamaAPIClient
-    from llama_api_client.types.create_chat_completion_response import CreateChatCompletionResponse
+    from llama_api_client.types.create_chat_completion_response import CreateChatCompletionResponse, Metric
     from llama_api_client.types.create_chat_completion_response_stream_chunk import (
         CreateChatCompletionResponseStreamChunk,
         EventDeltaTextDelta,
         EventDeltaToolCallDelta,
         EventDeltaToolCallDeltaFunction,
+        EventMetric,
     )
     from llama_api_client.types.message_text_content_item import MessageTextContentItem
 except ImportError:
@@ -192,54 +195,84 @@ class Llama(Model):
     def invoke(
         self,
         messages: List[Message],
+        assistant_message: Message,
         response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
-    ) -> CreateChatCompletionResponse:
+        run_response: Optional[RunOutput] = None,
+    ) -> ModelResponse:
         """
         Send a chat completion request to the Llama API.
         """
-        return self.get_client().chat.completions.create(
+        assistant_message.metrics.start_timer()
+        provider_response = self.get_client().chat.completions.create(
             model=self.id,
             messages=[format_message(m, tool_calls=bool(tools)) for m in messages],  # type: ignore
             **self.get_request_params(tools=tools, response_format=response_format),
         )
+        assistant_message.metrics.stop_timer()
+        model_response = self._parse_provider_response(provider_response, response_format=response_format)
+        return model_response
     async def ainvoke(
         self,
         messages: List[Message],
+        assistant_message: Message,
         response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
-    ) -> CreateChatCompletionResponse:
+        run_response: Optional[RunOutput] = None,
+    ) -> ModelResponse:
         """
         Sends an asynchronous chat completion request to the Llama API.
         """
+        if run_response and run_response.metrics:
+            run_response.metrics.set_time_to_first_token()
-        return await self.get_async_client().chat.completions.create(
+        assistant_message.metrics.start_timer()
+        provider_response = await self.get_async_client().chat.completions.create(
             model=self.id,
             messages=[format_message(m, tool_calls=bool(tools)) for m in messages],  # type: ignore
             **self.get_request_params(tools=tools, response_format=response_format),
         )
+        assistant_message.metrics.stop_timer()
+        model_response = self._parse_provider_response(provider_response, response_format=response_format)
+        return model_response
     def invoke_stream(
         self,
         messages: List[Message],
+        assistant_message: Message,
         response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
-    ) -> Iterator[CreateChatCompletionResponseStreamChunk]:
+        run_response: Optional[RunOutput] = None,
+    ) -> Iterator[ModelResponse]:
         """
         Send a streaming chat completion request to the Llama API.
         """
+        if run_response and run_response.metrics:
+            run_response.metrics.set_time_to_first_token()
         try:
-            yield from self.get_client().chat.completions.create(
+            assistant_message.metrics.start_timer()
+            for chunk in self.get_client().chat.completions.create(
                 model=self.id,
                 messages=[format_message(m, tool_calls=bool(tools)) for m in messages],  # type: ignore
                 stream=True,
                 **self.get_request_params(tools=tools, response_format=response_format),
-            )  # type: ignore
+            ):
+                yield self._parse_provider_response_delta(chunk)  # type: ignore
+            assistant_message.metrics.stop_timer()
         except Exception as e:
             log_error(f"Error from Llama API: {e}")
             raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
@@ -247,29 +280,36 @@ class Llama(Model):
     async def ainvoke_stream(
         self,
         messages: List[Message],
+        assistant_message: Message,
         response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Union[str, Dict[str, Any]]] = None,
-    ) -> AsyncIterator[CreateChatCompletionResponseStreamChunk]:
+        run_response: Optional[RunOutput] = None,
+    ) -> AsyncIterator[ModelResponse]:
         """
         Sends an asynchronous streaming chat completion request to the Llama API.
         """
+        if run_response and run_response.metrics:
+            run_response.metrics.set_time_to_first_token()
+        assistant_message.metrics.start_timer()
         try:
-            async_stream = await self.get_async_client().chat.completions.create(
+            async for chunk in await self.get_async_client().chat.completions.create(
                 model=self.id,
                 messages=[format_message(m, tool_calls=bool(tools)) for m in messages],  # type: ignore
                 stream=True,
                 **self.get_request_params(tools=tools, response_format=response_format),
-            )
-            async for chunk in async_stream:  # type: ignore
-                yield chunk  # type: ignore
+            ):
+                yield self._parse_provider_response_delta(chunk)  # type: ignore
+            assistant_message.metrics.stop_timer()
         except Exception as e:
             log_error(f"Error from Llama API: {e}")
             raise ModelProviderError(message=str(e), model_name=self.name, model_id=self.id) from e
-    @staticmethod
-    def parse_tool_calls(tool_calls_data: List[EventDeltaToolCallDeltaFunction]) -> List[Dict[str, Any]]:
+    def parse_tool_calls(self, tool_calls_data: List[EventDeltaToolCallDeltaFunction]) -> List[Dict[str, Any]]:
         """
         Parse the tool calls from the Llama API.
@@ -321,7 +361,7 @@ class Llama(Model):
         return tool_calls
-    def parse_provider_response(self, response: CreateChatCompletionResponse, **kwargs) -> ModelResponse:
+    def _parse_provider_response(self, response: CreateChatCompletionResponse, **kwargs) -> ModelResponse:
         """
         Parse the Llama response into a ModelResponse.
@@ -371,26 +411,12 @@ class Llama(Model):
         # Add metrics from the metrics list
         if hasattr(response, "metrics") and response.metrics is not None:
-            usage_data = {}
-            metric_map = {
-                "num_prompt_tokens": "input_tokens",
-                "num_completion_tokens": "output_tokens",
-                "num_total_tokens": "total_tokens",
-            }
-            for metric in response.metrics:
-                key = metric_map.get(metric.metric)
-                if key:
-                    value = int(metric.value)
-                    usage_data[key] = value
-                if usage_data:
-                    model_response.response_usage = usage_data
+            model_response.response_usage = self._get_metrics(response.metrics)
         return model_response
-    def parse_provider_response_delta(
-        self, response_delta: CreateChatCompletionResponseStreamChunk, **kwargs
+    def _parse_provider_response_delta(
+        self, response: CreateChatCompletionResponseStreamChunk, **kwargs
     ) -> ModelResponse:
         """
         Parse the Llama streaming response into a ModelResponse.
@@ -403,25 +429,12 @@ class Llama(Model):
         """
         model_response = ModelResponse()
-        if response_delta is not None:
-            delta = response_delta.event
+        if response is not None:
+            delta = response.event
             # Capture metrics event
             if delta.event_type == "metrics" and delta.metrics is not None:
-                usage_data = {}
-                metric_map = {
-                    "num_prompt_tokens": "input_tokens",
-                    "num_completion_tokens": "output_tokens",
-                    "num_total_tokens": "total_tokens",
-                }
-                for metric in delta.metrics:
-                    key = metric_map.get(metric.metric)
-                    if key:
-                        usage_data[key] = int(metric.value)
-                if usage_data:
-                    model_response.response_usage = usage_data
+                model_response.response_usage = self._get_metrics(delta.metrics)
             if isinstance(delta.delta, EventDeltaTextDelta):
                 model_response.content = delta.delta.text
@@ -431,3 +444,26 @@ class Llama(Model):
                 model_response.tool_calls = delta.delta  # type: ignore
         return model_response
+    def _get_metrics(self, response_usage: Union[List[Metric], List[EventMetric]]) -> Metrics:
+        """
+        Parse the given Llama usage into an Agno Metrics object.
+        Args:
+            response_usage: Usage data from Llama
+        Returns:
+            Metrics: Parsed metrics data
+        """
+        metrics = Metrics()
+        for metric in response_usage:
+            metrics_field = metric.metric
+            if metrics_field == "num_prompt_tokens":
+                metrics.input_tokens = int(metric.value)
+            elif metrics_field == "num_completion_tokens":
+                metrics.output_tokens = int(metric.value)
+        metrics.total_tokens = metrics.input_tokens + metrics.output_tokens
+        return metrics

agno/models/metrics.py ADDED Viewed

@@ -0,0 +1,120 @@
+from dataclasses import asdict, dataclass
+from typing import Any, Dict, Optional
+from agno.utils.timer import Timer
+@dataclass
+class Metrics:
+    """All relevant metrics for a session, run or message."""
+    # Main token consumption values
+    input_tokens: int = 0
+    output_tokens: int = 0
+    total_tokens: int = 0
+    # Audio token usage
+    audio_input_tokens: int = 0
+    audio_output_tokens: int = 0
+    audio_total_tokens: int = 0
+    # Cache token usage
+    cache_read_tokens: int = 0
+    cache_write_tokens: int = 0
+    # Tokens employed in reasoning
+    reasoning_tokens: int = 0
+    # Time metrics
+    # Internal timer utility for tracking execution time
+    timer: Optional[Timer] = None
+    # Time from run start to first token generation, in seconds
+    time_to_first_token: Optional[float] = None
+    # Total run time, in seconds
+    duration: Optional[float] = None
+    # Provider-specific metrics
+    provider_metrics: Optional[dict] = None
+    # Any additional metrics
+    additional_metrics: Optional[dict] = None
+    def to_dict(self) -> Dict[str, Any]:
+        metrics_dict = asdict(self)
+        # Remove the timer util if present
+        metrics_dict.pop("timer", None)
+        metrics_dict = {
+            k: v
+            for k, v in metrics_dict.items()
+            if v is not None and (not isinstance(v, (int, float)) or v != 0) and (not isinstance(v, dict) or len(v) > 0)
+        }
+        return metrics_dict
+    def __add__(self, other: "Metrics") -> "Metrics":
+        # Create new instance of the same type as self
+        result_class = type(self)
+        result = result_class(
+            input_tokens=self.input_tokens + other.input_tokens,
+            output_tokens=self.output_tokens + other.output_tokens,
+            total_tokens=self.total_tokens + other.total_tokens,
+            audio_total_tokens=self.audio_total_tokens + other.audio_total_tokens,
+            audio_input_tokens=self.audio_input_tokens + other.audio_input_tokens,
+            audio_output_tokens=self.audio_output_tokens + other.audio_output_tokens,
+            cache_read_tokens=self.cache_read_tokens + other.cache_read_tokens,
+            cache_write_tokens=self.cache_write_tokens + other.cache_write_tokens,
+            reasoning_tokens=self.reasoning_tokens + other.reasoning_tokens,
+        )
+        # Handle provider_metrics
+        if self.provider_metrics or other.provider_metrics:
+            result.provider_metrics = {}
+            if self.provider_metrics:
+                result.provider_metrics.update(self.provider_metrics)
+            if other.provider_metrics:
+                result.provider_metrics.update(other.provider_metrics)
+        # Handle additional metrics
+        if self.additional_metrics or other.additional_metrics:
+            result.additional_metrics = {}
+            if self.additional_metrics:
+                result.additional_metrics.update(self.additional_metrics)
+            if other.additional_metrics:
+                result.additional_metrics.update(other.additional_metrics)
+        # Sum durations if both exist
+        if self.duration is not None and other.duration is not None:
+            result.duration = self.duration + other.duration
+        elif self.duration is not None:
+            result.duration = self.duration
+        elif other.duration is not None:
+            result.duration = other.duration
+        # Sum time to first token if both exist
+        if self.time_to_first_token is not None and other.time_to_first_token is not None:
+            result.time_to_first_token = self.time_to_first_token + other.time_to_first_token
+        elif self.time_to_first_token is not None:
+            result.time_to_first_token = self.time_to_first_token
+        elif other.time_to_first_token is not None:
+            result.time_to_first_token = other.time_to_first_token
+        return result
+    def __radd__(self, other: "Metrics") -> "Metrics":
+        if other == 0:  # Handle sum() starting value
+            return self
+        return self + other
+    def start_timer(self):
+        if self.timer is None:
+            self.timer = Timer()
+        self.timer.start()
+    def stop_timer(self, set_duration: bool = True):
+        if self.timer is not None:
+            self.timer.stop()
+            if set_duration:
+                self.duration = self.timer.elapsed
+    def set_time_to_first_token(self):
+        if self.timer is not None:
+            self.time_to_first_token = self.timer.elapsed

agno 1.8.1__py3-none-any.whl → 2.0.0__py3-none-any.whl

agno 1.8.1py3-none-any.whl → 2.0.0py3-none-any.whl