agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agno/agent/agent.py +5540 -2273
- agno/api/api.py +2 -0
- agno/api/os.py +1 -1
- agno/compression/__init__.py +3 -0
- agno/compression/manager.py +247 -0
- agno/culture/__init__.py +3 -0
- agno/culture/manager.py +956 -0
- agno/db/async_postgres/__init__.py +3 -0
- agno/db/base.py +689 -6
- agno/db/dynamo/dynamo.py +933 -37
- agno/db/dynamo/schemas.py +174 -10
- agno/db/dynamo/utils.py +63 -4
- agno/db/firestore/firestore.py +831 -9
- agno/db/firestore/schemas.py +51 -0
- agno/db/firestore/utils.py +102 -4
- agno/db/gcs_json/gcs_json_db.py +660 -12
- agno/db/gcs_json/utils.py +60 -26
- agno/db/in_memory/in_memory_db.py +287 -14
- agno/db/in_memory/utils.py +60 -2
- agno/db/json/json_db.py +590 -14
- agno/db/json/utils.py +60 -26
- agno/db/migrations/manager.py +199 -0
- agno/db/migrations/v1_to_v2.py +43 -13
- agno/db/migrations/versions/__init__.py +0 -0
- agno/db/migrations/versions/v2_3_0.py +938 -0
- agno/db/mongo/__init__.py +15 -1
- agno/db/mongo/async_mongo.py +2760 -0
- agno/db/mongo/mongo.py +879 -11
- agno/db/mongo/schemas.py +42 -0
- agno/db/mongo/utils.py +80 -8
- agno/db/mysql/__init__.py +2 -1
- agno/db/mysql/async_mysql.py +2912 -0
- agno/db/mysql/mysql.py +946 -68
- agno/db/mysql/schemas.py +72 -10
- agno/db/mysql/utils.py +198 -7
- agno/db/postgres/__init__.py +2 -1
- agno/db/postgres/async_postgres.py +2579 -0
- agno/db/postgres/postgres.py +942 -57
- agno/db/postgres/schemas.py +81 -18
- agno/db/postgres/utils.py +164 -2
- agno/db/redis/redis.py +671 -7
- agno/db/redis/schemas.py +50 -0
- agno/db/redis/utils.py +65 -7
- agno/db/schemas/__init__.py +2 -1
- agno/db/schemas/culture.py +120 -0
- agno/db/schemas/evals.py +1 -0
- agno/db/schemas/memory.py +17 -2
- agno/db/singlestore/schemas.py +63 -0
- agno/db/singlestore/singlestore.py +949 -83
- agno/db/singlestore/utils.py +60 -2
- agno/db/sqlite/__init__.py +2 -1
- agno/db/sqlite/async_sqlite.py +2911 -0
- agno/db/sqlite/schemas.py +62 -0
- agno/db/sqlite/sqlite.py +965 -46
- agno/db/sqlite/utils.py +169 -8
- agno/db/surrealdb/__init__.py +3 -0
- agno/db/surrealdb/metrics.py +292 -0
- agno/db/surrealdb/models.py +334 -0
- agno/db/surrealdb/queries.py +71 -0
- agno/db/surrealdb/surrealdb.py +1908 -0
- agno/db/surrealdb/utils.py +147 -0
- agno/db/utils.py +2 -0
- agno/eval/__init__.py +10 -0
- agno/eval/accuracy.py +75 -55
- agno/eval/agent_as_judge.py +861 -0
- agno/eval/base.py +29 -0
- agno/eval/performance.py +16 -7
- agno/eval/reliability.py +28 -16
- agno/eval/utils.py +35 -17
- agno/exceptions.py +27 -2
- agno/filters.py +354 -0
- agno/guardrails/prompt_injection.py +1 -0
- agno/hooks/__init__.py +3 -0
- agno/hooks/decorator.py +164 -0
- agno/integrations/discord/client.py +1 -1
- agno/knowledge/chunking/agentic.py +13 -10
- agno/knowledge/chunking/fixed.py +4 -1
- agno/knowledge/chunking/semantic.py +9 -4
- agno/knowledge/chunking/strategy.py +59 -15
- agno/knowledge/embedder/fastembed.py +1 -1
- agno/knowledge/embedder/nebius.py +1 -1
- agno/knowledge/embedder/ollama.py +8 -0
- agno/knowledge/embedder/openai.py +8 -8
- agno/knowledge/embedder/sentence_transformer.py +6 -2
- agno/knowledge/embedder/vllm.py +262 -0
- agno/knowledge/knowledge.py +1618 -318
- agno/knowledge/reader/base.py +6 -2
- agno/knowledge/reader/csv_reader.py +8 -10
- agno/knowledge/reader/docx_reader.py +5 -6
- agno/knowledge/reader/field_labeled_csv_reader.py +16 -20
- agno/knowledge/reader/json_reader.py +5 -4
- agno/knowledge/reader/markdown_reader.py +8 -8
- agno/knowledge/reader/pdf_reader.py +17 -19
- agno/knowledge/reader/pptx_reader.py +101 -0
- agno/knowledge/reader/reader_factory.py +32 -3
- agno/knowledge/reader/s3_reader.py +3 -3
- agno/knowledge/reader/tavily_reader.py +193 -0
- agno/knowledge/reader/text_reader.py +22 -10
- agno/knowledge/reader/web_search_reader.py +1 -48
- agno/knowledge/reader/website_reader.py +10 -10
- agno/knowledge/reader/wikipedia_reader.py +33 -1
- agno/knowledge/types.py +1 -0
- agno/knowledge/utils.py +72 -7
- agno/media.py +22 -6
- agno/memory/__init__.py +14 -1
- agno/memory/manager.py +544 -83
- agno/memory/strategies/__init__.py +15 -0
- agno/memory/strategies/base.py +66 -0
- agno/memory/strategies/summarize.py +196 -0
- agno/memory/strategies/types.py +37 -0
- agno/models/aimlapi/aimlapi.py +17 -0
- agno/models/anthropic/claude.py +515 -40
- agno/models/aws/bedrock.py +102 -21
- agno/models/aws/claude.py +131 -274
- agno/models/azure/ai_foundry.py +41 -19
- agno/models/azure/openai_chat.py +39 -8
- agno/models/base.py +1249 -525
- agno/models/cerebras/cerebras.py +91 -21
- agno/models/cerebras/cerebras_openai.py +21 -2
- agno/models/cohere/chat.py +40 -6
- agno/models/cometapi/cometapi.py +18 -1
- agno/models/dashscope/dashscope.py +2 -3
- agno/models/deepinfra/deepinfra.py +18 -1
- agno/models/deepseek/deepseek.py +69 -3
- agno/models/fireworks/fireworks.py +18 -1
- agno/models/google/gemini.py +877 -80
- agno/models/google/utils.py +22 -0
- agno/models/groq/groq.py +51 -18
- agno/models/huggingface/huggingface.py +17 -6
- agno/models/ibm/watsonx.py +16 -6
- agno/models/internlm/internlm.py +18 -1
- agno/models/langdb/langdb.py +13 -1
- agno/models/litellm/chat.py +44 -9
- agno/models/litellm/litellm_openai.py +18 -1
- agno/models/message.py +28 -5
- agno/models/meta/llama.py +47 -14
- agno/models/meta/llama_openai.py +22 -17
- agno/models/mistral/mistral.py +8 -4
- agno/models/nebius/nebius.py +6 -7
- agno/models/nvidia/nvidia.py +20 -3
- agno/models/ollama/chat.py +24 -8
- agno/models/openai/chat.py +104 -29
- agno/models/openai/responses.py +101 -81
- agno/models/openrouter/openrouter.py +60 -3
- agno/models/perplexity/perplexity.py +17 -1
- agno/models/portkey/portkey.py +7 -6
- agno/models/requesty/requesty.py +24 -4
- agno/models/response.py +73 -2
- agno/models/sambanova/sambanova.py +20 -3
- agno/models/siliconflow/siliconflow.py +19 -2
- agno/models/together/together.py +20 -3
- agno/models/utils.py +254 -8
- agno/models/vercel/v0.py +20 -3
- agno/models/vertexai/__init__.py +0 -0
- agno/models/vertexai/claude.py +190 -0
- agno/models/vllm/vllm.py +19 -14
- agno/models/xai/xai.py +19 -2
- agno/os/app.py +549 -152
- agno/os/auth.py +190 -3
- agno/os/config.py +23 -0
- agno/os/interfaces/a2a/router.py +8 -11
- agno/os/interfaces/a2a/utils.py +1 -1
- agno/os/interfaces/agui/router.py +18 -3
- agno/os/interfaces/agui/utils.py +152 -39
- agno/os/interfaces/slack/router.py +55 -37
- agno/os/interfaces/slack/slack.py +9 -1
- agno/os/interfaces/whatsapp/router.py +0 -1
- agno/os/interfaces/whatsapp/security.py +3 -1
- agno/os/mcp.py +110 -52
- agno/os/middleware/__init__.py +2 -0
- agno/os/middleware/jwt.py +676 -112
- agno/os/router.py +40 -1478
- agno/os/routers/agents/__init__.py +3 -0
- agno/os/routers/agents/router.py +599 -0
- agno/os/routers/agents/schema.py +261 -0
- agno/os/routers/evals/evals.py +96 -39
- agno/os/routers/evals/schemas.py +65 -33
- agno/os/routers/evals/utils.py +80 -10
- agno/os/routers/health.py +10 -4
- agno/os/routers/knowledge/knowledge.py +196 -38
- agno/os/routers/knowledge/schemas.py +82 -22
- agno/os/routers/memory/memory.py +279 -52
- agno/os/routers/memory/schemas.py +46 -17
- agno/os/routers/metrics/metrics.py +20 -8
- agno/os/routers/metrics/schemas.py +16 -16
- agno/os/routers/session/session.py +462 -34
- agno/os/routers/teams/__init__.py +3 -0
- agno/os/routers/teams/router.py +512 -0
- agno/os/routers/teams/schema.py +257 -0
- agno/os/routers/traces/__init__.py +3 -0
- agno/os/routers/traces/schemas.py +414 -0
- agno/os/routers/traces/traces.py +499 -0
- agno/os/routers/workflows/__init__.py +3 -0
- agno/os/routers/workflows/router.py +624 -0
- agno/os/routers/workflows/schema.py +75 -0
- agno/os/schema.py +256 -693
- agno/os/scopes.py +469 -0
- agno/os/utils.py +514 -36
- agno/reasoning/anthropic.py +80 -0
- agno/reasoning/gemini.py +73 -0
- agno/reasoning/openai.py +5 -0
- agno/reasoning/vertexai.py +76 -0
- agno/run/__init__.py +6 -0
- agno/run/agent.py +155 -32
- agno/run/base.py +55 -3
- agno/run/requirement.py +181 -0
- agno/run/team.py +125 -38
- agno/run/workflow.py +72 -18
- agno/session/agent.py +102 -89
- agno/session/summary.py +56 -15
- agno/session/team.py +164 -90
- agno/session/workflow.py +405 -40
- agno/table.py +10 -0
- agno/team/team.py +3974 -1903
- agno/tools/dalle.py +2 -4
- agno/tools/eleven_labs.py +23 -25
- agno/tools/exa.py +21 -16
- agno/tools/file.py +153 -23
- agno/tools/file_generation.py +16 -10
- agno/tools/firecrawl.py +15 -7
- agno/tools/function.py +193 -38
- agno/tools/gmail.py +238 -14
- agno/tools/google_drive.py +271 -0
- agno/tools/googlecalendar.py +36 -8
- agno/tools/googlesheets.py +20 -5
- agno/tools/jira.py +20 -0
- agno/tools/mcp/__init__.py +10 -0
- agno/tools/mcp/mcp.py +331 -0
- agno/tools/mcp/multi_mcp.py +347 -0
- agno/tools/mcp/params.py +24 -0
- agno/tools/mcp_toolbox.py +3 -3
- agno/tools/models/nebius.py +5 -5
- agno/tools/models_labs.py +20 -10
- agno/tools/nano_banana.py +151 -0
- agno/tools/notion.py +204 -0
- agno/tools/parallel.py +314 -0
- agno/tools/postgres.py +76 -36
- agno/tools/redshift.py +406 -0
- agno/tools/scrapegraph.py +1 -1
- agno/tools/shopify.py +1519 -0
- agno/tools/slack.py +18 -3
- agno/tools/spotify.py +919 -0
- agno/tools/tavily.py +146 -0
- agno/tools/toolkit.py +25 -0
- agno/tools/workflow.py +8 -1
- agno/tools/yfinance.py +12 -11
- agno/tracing/__init__.py +12 -0
- agno/tracing/exporter.py +157 -0
- agno/tracing/schemas.py +276 -0
- agno/tracing/setup.py +111 -0
- agno/utils/agent.py +938 -0
- agno/utils/cryptography.py +22 -0
- agno/utils/dttm.py +33 -0
- agno/utils/events.py +151 -3
- agno/utils/gemini.py +15 -5
- agno/utils/hooks.py +118 -4
- agno/utils/http.py +113 -2
- agno/utils/knowledge.py +12 -5
- agno/utils/log.py +1 -0
- agno/utils/mcp.py +92 -2
- agno/utils/media.py +187 -1
- agno/utils/merge_dict.py +3 -3
- agno/utils/message.py +60 -0
- agno/utils/models/ai_foundry.py +9 -2
- agno/utils/models/claude.py +49 -14
- agno/utils/models/cohere.py +9 -2
- agno/utils/models/llama.py +9 -2
- agno/utils/models/mistral.py +4 -2
- agno/utils/print_response/agent.py +109 -16
- agno/utils/print_response/team.py +223 -30
- agno/utils/print_response/workflow.py +251 -34
- agno/utils/streamlit.py +1 -1
- agno/utils/team.py +98 -9
- agno/utils/tokens.py +657 -0
- agno/vectordb/base.py +39 -7
- agno/vectordb/cassandra/cassandra.py +21 -5
- agno/vectordb/chroma/chromadb.py +43 -12
- agno/vectordb/clickhouse/clickhousedb.py +21 -5
- agno/vectordb/couchbase/couchbase.py +29 -5
- agno/vectordb/lancedb/lance_db.py +92 -181
- agno/vectordb/langchaindb/langchaindb.py +24 -4
- agno/vectordb/lightrag/lightrag.py +17 -3
- agno/vectordb/llamaindex/llamaindexdb.py +25 -5
- agno/vectordb/milvus/milvus.py +50 -37
- agno/vectordb/mongodb/__init__.py +7 -1
- agno/vectordb/mongodb/mongodb.py +36 -30
- agno/vectordb/pgvector/pgvector.py +201 -77
- agno/vectordb/pineconedb/pineconedb.py +41 -23
- agno/vectordb/qdrant/qdrant.py +67 -54
- agno/vectordb/redis/__init__.py +9 -0
- agno/vectordb/redis/redisdb.py +682 -0
- agno/vectordb/singlestore/singlestore.py +50 -29
- agno/vectordb/surrealdb/surrealdb.py +31 -41
- agno/vectordb/upstashdb/upstashdb.py +34 -6
- agno/vectordb/weaviate/weaviate.py +53 -14
- agno/workflow/__init__.py +2 -0
- agno/workflow/agent.py +299 -0
- agno/workflow/condition.py +120 -18
- agno/workflow/loop.py +77 -10
- agno/workflow/parallel.py +231 -143
- agno/workflow/router.py +118 -17
- agno/workflow/step.py +609 -170
- agno/workflow/steps.py +73 -6
- agno/workflow/types.py +96 -21
- agno/workflow/workflow.py +2039 -262
- {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/METADATA +201 -66
- agno-2.3.13.dist-info/RECORD +613 -0
- agno/tools/googlesearch.py +0 -98
- agno/tools/mcp.py +0 -679
- agno/tools/memori.py +0 -339
- agno-2.1.2.dist-info/RECORD +0 -543
- {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +0 -0
- {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/licenses/LICENSE +0 -0
- {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,190 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from os import getenv
|
|
3
|
+
from typing import Any, Dict, List, Optional, Type, Union
|
|
4
|
+
|
|
5
|
+
import httpx
|
|
6
|
+
from pydantic import BaseModel
|
|
7
|
+
|
|
8
|
+
from agno.models.anthropic import Claude as AnthropicClaude
|
|
9
|
+
from agno.utils.http import get_default_async_client, get_default_sync_client
|
|
10
|
+
from agno.utils.log import log_debug, log_warning
|
|
11
|
+
from agno.utils.models.claude import format_tools_for_model
|
|
12
|
+
|
|
13
|
+
try:
|
|
14
|
+
from anthropic import AnthropicVertex, AsyncAnthropicVertex
|
|
15
|
+
except ImportError as e:
|
|
16
|
+
raise ImportError("`anthropic` not installed. Please install it with `pip install anthropic`") from e
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@dataclass
|
|
20
|
+
class Claude(AnthropicClaude):
|
|
21
|
+
"""
|
|
22
|
+
A class representing Anthropic Claude model.
|
|
23
|
+
|
|
24
|
+
For more information, see: https://docs.anthropic.com/en/api/messages
|
|
25
|
+
"""
|
|
26
|
+
|
|
27
|
+
id: str = "claude-sonnet-4@20250514"
|
|
28
|
+
name: str = "Claude"
|
|
29
|
+
provider: str = "VertexAI"
|
|
30
|
+
|
|
31
|
+
# Client parameters
|
|
32
|
+
region: Optional[str] = None
|
|
33
|
+
project_id: Optional[str] = None
|
|
34
|
+
base_url: Optional[str] = None
|
|
35
|
+
|
|
36
|
+
client: Optional[AnthropicVertex] = None # type: ignore
|
|
37
|
+
async_client: Optional[AsyncAnthropicVertex] = None # type: ignore
|
|
38
|
+
|
|
39
|
+
def __post_init__(self):
|
|
40
|
+
"""Validate model configuration after initialization"""
|
|
41
|
+
# Validate thinking support immediately at model creation
|
|
42
|
+
if self.thinking:
|
|
43
|
+
self._validate_thinking_support()
|
|
44
|
+
# Overwrite output schema support for VertexAI Claude
|
|
45
|
+
self.supports_native_structured_outputs = False
|
|
46
|
+
self.supports_json_schema_outputs = False
|
|
47
|
+
|
|
48
|
+
def _get_client_params(self) -> Dict[str, Any]:
|
|
49
|
+
client_params: Dict[str, Any] = {}
|
|
50
|
+
|
|
51
|
+
# Add API key to client parameters
|
|
52
|
+
client_params["region"] = self.region or getenv("CLOUD_ML_REGION")
|
|
53
|
+
client_params["project_id"] = self.project_id or getenv("ANTHROPIC_VERTEX_PROJECT_ID")
|
|
54
|
+
client_params["base_url"] = self.base_url or getenv("ANTHROPIC_VERTEX_BASE_URL")
|
|
55
|
+
if self.timeout is not None:
|
|
56
|
+
client_params["timeout"] = self.timeout
|
|
57
|
+
|
|
58
|
+
# Add additional client parameters
|
|
59
|
+
if self.client_params is not None:
|
|
60
|
+
client_params.update(self.client_params)
|
|
61
|
+
if self.default_headers is not None:
|
|
62
|
+
client_params["default_headers"] = self.default_headers
|
|
63
|
+
return client_params
|
|
64
|
+
|
|
65
|
+
def get_client(self):
|
|
66
|
+
"""
|
|
67
|
+
Returns an instance of the Anthropic client.
|
|
68
|
+
"""
|
|
69
|
+
if self.client and not self.client.is_closed():
|
|
70
|
+
return self.client
|
|
71
|
+
|
|
72
|
+
_client_params = self._get_client_params()
|
|
73
|
+
if self.http_client:
|
|
74
|
+
if isinstance(self.http_client, httpx.Client):
|
|
75
|
+
_client_params["http_client"] = self.http_client
|
|
76
|
+
else:
|
|
77
|
+
log_warning("http_client is not an instance of httpx.Client. Using default global httpx.Client.")
|
|
78
|
+
# Use global sync client when user http_client is invalid
|
|
79
|
+
_client_params["http_client"] = get_default_sync_client()
|
|
80
|
+
else:
|
|
81
|
+
# Use global sync client when no custom http_client is provided
|
|
82
|
+
_client_params["http_client"] = get_default_sync_client()
|
|
83
|
+
self.client = AnthropicVertex(**_client_params)
|
|
84
|
+
return self.client
|
|
85
|
+
|
|
86
|
+
def get_async_client(self):
|
|
87
|
+
"""
|
|
88
|
+
Returns an instance of the async Anthropic client.
|
|
89
|
+
"""
|
|
90
|
+
if self.async_client and not self.async_client.is_closed():
|
|
91
|
+
return self.async_client
|
|
92
|
+
|
|
93
|
+
_client_params = self._get_client_params()
|
|
94
|
+
if self.http_client:
|
|
95
|
+
if isinstance(self.http_client, httpx.AsyncClient):
|
|
96
|
+
_client_params["http_client"] = self.http_client
|
|
97
|
+
else:
|
|
98
|
+
log_warning(
|
|
99
|
+
"http_client is not an instance of httpx.AsyncClient. Using default global httpx.AsyncClient."
|
|
100
|
+
)
|
|
101
|
+
# Use global async client when user http_client is invalid
|
|
102
|
+
_client_params["http_client"] = get_default_async_client()
|
|
103
|
+
else:
|
|
104
|
+
# Use global async client when no custom http_client is provided
|
|
105
|
+
_client_params["http_client"] = get_default_async_client()
|
|
106
|
+
self.async_client = AsyncAnthropicVertex(**_client_params)
|
|
107
|
+
return self.async_client
|
|
108
|
+
|
|
109
|
+
def get_request_params(
|
|
110
|
+
self,
|
|
111
|
+
response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
|
|
112
|
+
tools: Optional[List[Dict[str, Any]]] = None,
|
|
113
|
+
) -> Dict[str, Any]:
|
|
114
|
+
"""
|
|
115
|
+
Generate keyword arguments for API requests.
|
|
116
|
+
|
|
117
|
+
Returns:
|
|
118
|
+
Dict[str, Any]: The keyword arguments for API requests.
|
|
119
|
+
"""
|
|
120
|
+
# Validate thinking support if thinking is enabled
|
|
121
|
+
if self.thinking:
|
|
122
|
+
self._validate_thinking_support()
|
|
123
|
+
|
|
124
|
+
_request_params: Dict[str, Any] = {}
|
|
125
|
+
if self.max_tokens:
|
|
126
|
+
_request_params["max_tokens"] = self.max_tokens
|
|
127
|
+
if self.thinking:
|
|
128
|
+
_request_params["thinking"] = self.thinking
|
|
129
|
+
if self.temperature:
|
|
130
|
+
_request_params["temperature"] = self.temperature
|
|
131
|
+
if self.stop_sequences:
|
|
132
|
+
_request_params["stop_sequences"] = self.stop_sequences
|
|
133
|
+
if self.top_p:
|
|
134
|
+
_request_params["top_p"] = self.top_p
|
|
135
|
+
if self.top_k:
|
|
136
|
+
_request_params["top_k"] = self.top_k
|
|
137
|
+
if self.timeout:
|
|
138
|
+
_request_params["timeout"] = self.timeout
|
|
139
|
+
|
|
140
|
+
# Build betas list - include existing betas and add new one if needed
|
|
141
|
+
betas_list = list(self.betas) if self.betas else []
|
|
142
|
+
|
|
143
|
+
# Include betas if any are present
|
|
144
|
+
if betas_list:
|
|
145
|
+
_request_params["betas"] = betas_list
|
|
146
|
+
|
|
147
|
+
if self.request_params:
|
|
148
|
+
_request_params.update(self.request_params)
|
|
149
|
+
|
|
150
|
+
if _request_params:
|
|
151
|
+
log_debug(f"Calling {self.provider} with request parameters: {_request_params}", log_level=2)
|
|
152
|
+
return _request_params
|
|
153
|
+
|
|
154
|
+
def _prepare_request_kwargs(
|
|
155
|
+
self,
|
|
156
|
+
system_message: str,
|
|
157
|
+
tools: Optional[List[Dict[str, Any]]] = None,
|
|
158
|
+
response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
|
|
159
|
+
) -> Dict[str, Any]:
|
|
160
|
+
"""
|
|
161
|
+
Prepare the request keyword arguments for the API call.
|
|
162
|
+
|
|
163
|
+
Args:
|
|
164
|
+
system_message (str): The concatenated system messages.
|
|
165
|
+
tools: Optional list of tools
|
|
166
|
+
response_format: Optional response format (Pydantic model or dict)
|
|
167
|
+
|
|
168
|
+
Returns:
|
|
169
|
+
Dict[str, Any]: The request keyword arguments.
|
|
170
|
+
"""
|
|
171
|
+
# Pass response_format and tools to get_request_params for beta header handling
|
|
172
|
+
request_kwargs = self.get_request_params(response_format=response_format, tools=tools).copy()
|
|
173
|
+
if system_message:
|
|
174
|
+
if self.cache_system_prompt:
|
|
175
|
+
cache_control = (
|
|
176
|
+
{"type": "ephemeral", "ttl": "1h"}
|
|
177
|
+
if self.extended_cache_time is not None and self.extended_cache_time is True
|
|
178
|
+
else {"type": "ephemeral"}
|
|
179
|
+
)
|
|
180
|
+
request_kwargs["system"] = [{"text": system_message, "type": "text", "cache_control": cache_control}]
|
|
181
|
+
else:
|
|
182
|
+
request_kwargs["system"] = [{"text": system_message, "type": "text"}]
|
|
183
|
+
|
|
184
|
+
# Format tools (this will handle strict mode)
|
|
185
|
+
if tools:
|
|
186
|
+
request_kwargs["tools"] = format_tools_for_model(tools)
|
|
187
|
+
|
|
188
|
+
if request_kwargs:
|
|
189
|
+
log_debug(f"Calling {self.provider} with request parameters: {request_kwargs}", log_level=2)
|
|
190
|
+
return request_kwargs
|
agno/models/vllm/vllm.py
CHANGED
|
@@ -4,6 +4,7 @@ from typing import Any, Dict, List, Optional, Type, Union
|
|
|
4
4
|
|
|
5
5
|
from pydantic import BaseModel
|
|
6
6
|
|
|
7
|
+
from agno.exceptions import ModelAuthenticationError
|
|
7
8
|
from agno.models.openai.like import OpenAILike
|
|
8
9
|
from agno.utils.log import log_debug
|
|
9
10
|
|
|
@@ -29,8 +30,8 @@ class VLLM(OpenAILike):
|
|
|
29
30
|
name: str = "VLLM"
|
|
30
31
|
provider: str = "VLLM"
|
|
31
32
|
|
|
32
|
-
api_key: Optional[str] =
|
|
33
|
-
base_url: Optional[str] =
|
|
33
|
+
api_key: Optional[str] = None
|
|
34
|
+
base_url: Optional[str] = None
|
|
34
35
|
|
|
35
36
|
temperature: float = 0.7
|
|
36
37
|
top_p: float = 0.8
|
|
@@ -38,19 +39,23 @@ class VLLM(OpenAILike):
|
|
|
38
39
|
top_k: Optional[int] = None
|
|
39
40
|
enable_thinking: Optional[bool] = None
|
|
40
41
|
|
|
41
|
-
def
|
|
42
|
-
"""
|
|
43
|
-
|
|
44
|
-
raise ValueError("VLLM_BASE_URL must be set via environment variable or explicit initialization")
|
|
45
|
-
if self.id == "not-set":
|
|
46
|
-
raise ValueError("Model ID must be set via environment variable or explicit initialization")
|
|
42
|
+
def _get_client_params(self) -> Dict[str, Any]:
|
|
43
|
+
"""
|
|
44
|
+
Returns client parameters for API requests, checking for VLLM_API_KEY.
|
|
47
45
|
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
if self.
|
|
52
|
-
|
|
53
|
-
|
|
46
|
+
Returns:
|
|
47
|
+
Dict[str, Any]: A dictionary of client parameters for API requests.
|
|
48
|
+
"""
|
|
49
|
+
if not self.api_key:
|
|
50
|
+
self.api_key = getenv("VLLM_API_KEY")
|
|
51
|
+
if not self.api_key:
|
|
52
|
+
raise ModelAuthenticationError(
|
|
53
|
+
message="VLLM_API_KEY not set. Please set the VLLM_API_KEY environment variable.",
|
|
54
|
+
model_name=self.name,
|
|
55
|
+
)
|
|
56
|
+
if not self.base_url:
|
|
57
|
+
self.base_url = getenv("VLLM_BASE_URL", "http://localhost:8000/v1/")
|
|
58
|
+
return super()._get_client_params()
|
|
54
59
|
|
|
55
60
|
def get_request_params(
|
|
56
61
|
self,
|
agno/models/xai/xai.py
CHANGED
|
@@ -1,9 +1,10 @@
|
|
|
1
|
-
from dataclasses import dataclass
|
|
1
|
+
from dataclasses import dataclass
|
|
2
2
|
from os import getenv
|
|
3
3
|
from typing import Any, Dict, List, Optional, Type, Union
|
|
4
4
|
|
|
5
5
|
from pydantic import BaseModel
|
|
6
6
|
|
|
7
|
+
from agno.exceptions import ModelAuthenticationError
|
|
7
8
|
from agno.models.message import Citations, UrlCitation
|
|
8
9
|
from agno.models.openai.like import OpenAILike
|
|
9
10
|
from agno.models.response import ModelResponse
|
|
@@ -34,11 +35,27 @@ class xAI(OpenAILike):
|
|
|
34
35
|
name: str = "xAI"
|
|
35
36
|
provider: str = "xAI"
|
|
36
37
|
|
|
37
|
-
api_key: Optional[str] =
|
|
38
|
+
api_key: Optional[str] = None
|
|
38
39
|
base_url: str = "https://api.x.ai/v1"
|
|
39
40
|
|
|
40
41
|
search_parameters: Optional[Dict[str, Any]] = None
|
|
41
42
|
|
|
43
|
+
def _get_client_params(self) -> Dict[str, Any]:
|
|
44
|
+
"""
|
|
45
|
+
Returns client parameters for API requests, checking for XAI_API_KEY.
|
|
46
|
+
|
|
47
|
+
Returns:
|
|
48
|
+
Dict[str, Any]: A dictionary of client parameters for API requests.
|
|
49
|
+
"""
|
|
50
|
+
if not self.api_key:
|
|
51
|
+
self.api_key = getenv("XAI_API_KEY")
|
|
52
|
+
if not self.api_key:
|
|
53
|
+
raise ModelAuthenticationError(
|
|
54
|
+
message="XAI_API_KEY not set. Please set the XAI_API_KEY environment variable.",
|
|
55
|
+
model_name=self.name,
|
|
56
|
+
)
|
|
57
|
+
return super()._get_client_params()
|
|
58
|
+
|
|
42
59
|
def get_request_params(
|
|
43
60
|
self,
|
|
44
61
|
response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
|