agno 2.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314) hide show
  1. agno/agent/agent.py +5540 -2273
  2. agno/api/api.py +2 -0
  3. agno/api/os.py +1 -1
  4. agno/compression/__init__.py +3 -0
  5. agno/compression/manager.py +247 -0
  6. agno/culture/__init__.py +3 -0
  7. agno/culture/manager.py +956 -0
  8. agno/db/async_postgres/__init__.py +3 -0
  9. agno/db/base.py +689 -6
  10. agno/db/dynamo/dynamo.py +933 -37
  11. agno/db/dynamo/schemas.py +174 -10
  12. agno/db/dynamo/utils.py +63 -4
  13. agno/db/firestore/firestore.py +831 -9
  14. agno/db/firestore/schemas.py +51 -0
  15. agno/db/firestore/utils.py +102 -4
  16. agno/db/gcs_json/gcs_json_db.py +660 -12
  17. agno/db/gcs_json/utils.py +60 -26
  18. agno/db/in_memory/in_memory_db.py +287 -14
  19. agno/db/in_memory/utils.py +60 -2
  20. agno/db/json/json_db.py +590 -14
  21. agno/db/json/utils.py +60 -26
  22. agno/db/migrations/manager.py +199 -0
  23. agno/db/migrations/v1_to_v2.py +43 -13
  24. agno/db/migrations/versions/__init__.py +0 -0
  25. agno/db/migrations/versions/v2_3_0.py +938 -0
  26. agno/db/mongo/__init__.py +15 -1
  27. agno/db/mongo/async_mongo.py +2760 -0
  28. agno/db/mongo/mongo.py +879 -11
  29. agno/db/mongo/schemas.py +42 -0
  30. agno/db/mongo/utils.py +80 -8
  31. agno/db/mysql/__init__.py +2 -1
  32. agno/db/mysql/async_mysql.py +2912 -0
  33. agno/db/mysql/mysql.py +946 -68
  34. agno/db/mysql/schemas.py +72 -10
  35. agno/db/mysql/utils.py +198 -7
  36. agno/db/postgres/__init__.py +2 -1
  37. agno/db/postgres/async_postgres.py +2579 -0
  38. agno/db/postgres/postgres.py +942 -57
  39. agno/db/postgres/schemas.py +81 -18
  40. agno/db/postgres/utils.py +164 -2
  41. agno/db/redis/redis.py +671 -7
  42. agno/db/redis/schemas.py +50 -0
  43. agno/db/redis/utils.py +65 -7
  44. agno/db/schemas/__init__.py +2 -1
  45. agno/db/schemas/culture.py +120 -0
  46. agno/db/schemas/evals.py +1 -0
  47. agno/db/schemas/memory.py +17 -2
  48. agno/db/singlestore/schemas.py +63 -0
  49. agno/db/singlestore/singlestore.py +949 -83
  50. agno/db/singlestore/utils.py +60 -2
  51. agno/db/sqlite/__init__.py +2 -1
  52. agno/db/sqlite/async_sqlite.py +2911 -0
  53. agno/db/sqlite/schemas.py +62 -0
  54. agno/db/sqlite/sqlite.py +965 -46
  55. agno/db/sqlite/utils.py +169 -8
  56. agno/db/surrealdb/__init__.py +3 -0
  57. agno/db/surrealdb/metrics.py +292 -0
  58. agno/db/surrealdb/models.py +334 -0
  59. agno/db/surrealdb/queries.py +71 -0
  60. agno/db/surrealdb/surrealdb.py +1908 -0
  61. agno/db/surrealdb/utils.py +147 -0
  62. agno/db/utils.py +2 -0
  63. agno/eval/__init__.py +10 -0
  64. agno/eval/accuracy.py +75 -55
  65. agno/eval/agent_as_judge.py +861 -0
  66. agno/eval/base.py +29 -0
  67. agno/eval/performance.py +16 -7
  68. agno/eval/reliability.py +28 -16
  69. agno/eval/utils.py +35 -17
  70. agno/exceptions.py +27 -2
  71. agno/filters.py +354 -0
  72. agno/guardrails/prompt_injection.py +1 -0
  73. agno/hooks/__init__.py +3 -0
  74. agno/hooks/decorator.py +164 -0
  75. agno/integrations/discord/client.py +1 -1
  76. agno/knowledge/chunking/agentic.py +13 -10
  77. agno/knowledge/chunking/fixed.py +4 -1
  78. agno/knowledge/chunking/semantic.py +9 -4
  79. agno/knowledge/chunking/strategy.py +59 -15
  80. agno/knowledge/embedder/fastembed.py +1 -1
  81. agno/knowledge/embedder/nebius.py +1 -1
  82. agno/knowledge/embedder/ollama.py +8 -0
  83. agno/knowledge/embedder/openai.py +8 -8
  84. agno/knowledge/embedder/sentence_transformer.py +6 -2
  85. agno/knowledge/embedder/vllm.py +262 -0
  86. agno/knowledge/knowledge.py +1618 -318
  87. agno/knowledge/reader/base.py +6 -2
  88. agno/knowledge/reader/csv_reader.py +8 -10
  89. agno/knowledge/reader/docx_reader.py +5 -6
  90. agno/knowledge/reader/field_labeled_csv_reader.py +16 -20
  91. agno/knowledge/reader/json_reader.py +5 -4
  92. agno/knowledge/reader/markdown_reader.py +8 -8
  93. agno/knowledge/reader/pdf_reader.py +17 -19
  94. agno/knowledge/reader/pptx_reader.py +101 -0
  95. agno/knowledge/reader/reader_factory.py +32 -3
  96. agno/knowledge/reader/s3_reader.py +3 -3
  97. agno/knowledge/reader/tavily_reader.py +193 -0
  98. agno/knowledge/reader/text_reader.py +22 -10
  99. agno/knowledge/reader/web_search_reader.py +1 -48
  100. agno/knowledge/reader/website_reader.py +10 -10
  101. agno/knowledge/reader/wikipedia_reader.py +33 -1
  102. agno/knowledge/types.py +1 -0
  103. agno/knowledge/utils.py +72 -7
  104. agno/media.py +22 -6
  105. agno/memory/__init__.py +14 -1
  106. agno/memory/manager.py +544 -83
  107. agno/memory/strategies/__init__.py +15 -0
  108. agno/memory/strategies/base.py +66 -0
  109. agno/memory/strategies/summarize.py +196 -0
  110. agno/memory/strategies/types.py +37 -0
  111. agno/models/aimlapi/aimlapi.py +17 -0
  112. agno/models/anthropic/claude.py +515 -40
  113. agno/models/aws/bedrock.py +102 -21
  114. agno/models/aws/claude.py +131 -274
  115. agno/models/azure/ai_foundry.py +41 -19
  116. agno/models/azure/openai_chat.py +39 -8
  117. agno/models/base.py +1249 -525
  118. agno/models/cerebras/cerebras.py +91 -21
  119. agno/models/cerebras/cerebras_openai.py +21 -2
  120. agno/models/cohere/chat.py +40 -6
  121. agno/models/cometapi/cometapi.py +18 -1
  122. agno/models/dashscope/dashscope.py +2 -3
  123. agno/models/deepinfra/deepinfra.py +18 -1
  124. agno/models/deepseek/deepseek.py +69 -3
  125. agno/models/fireworks/fireworks.py +18 -1
  126. agno/models/google/gemini.py +877 -80
  127. agno/models/google/utils.py +22 -0
  128. agno/models/groq/groq.py +51 -18
  129. agno/models/huggingface/huggingface.py +17 -6
  130. agno/models/ibm/watsonx.py +16 -6
  131. agno/models/internlm/internlm.py +18 -1
  132. agno/models/langdb/langdb.py +13 -1
  133. agno/models/litellm/chat.py +44 -9
  134. agno/models/litellm/litellm_openai.py +18 -1
  135. agno/models/message.py +28 -5
  136. agno/models/meta/llama.py +47 -14
  137. agno/models/meta/llama_openai.py +22 -17
  138. agno/models/mistral/mistral.py +8 -4
  139. agno/models/nebius/nebius.py +6 -7
  140. agno/models/nvidia/nvidia.py +20 -3
  141. agno/models/ollama/chat.py +24 -8
  142. agno/models/openai/chat.py +104 -29
  143. agno/models/openai/responses.py +101 -81
  144. agno/models/openrouter/openrouter.py +60 -3
  145. agno/models/perplexity/perplexity.py +17 -1
  146. agno/models/portkey/portkey.py +7 -6
  147. agno/models/requesty/requesty.py +24 -4
  148. agno/models/response.py +73 -2
  149. agno/models/sambanova/sambanova.py +20 -3
  150. agno/models/siliconflow/siliconflow.py +19 -2
  151. agno/models/together/together.py +20 -3
  152. agno/models/utils.py +254 -8
  153. agno/models/vercel/v0.py +20 -3
  154. agno/models/vertexai/__init__.py +0 -0
  155. agno/models/vertexai/claude.py +190 -0
  156. agno/models/vllm/vllm.py +19 -14
  157. agno/models/xai/xai.py +19 -2
  158. agno/os/app.py +549 -152
  159. agno/os/auth.py +190 -3
  160. agno/os/config.py +23 -0
  161. agno/os/interfaces/a2a/router.py +8 -11
  162. agno/os/interfaces/a2a/utils.py +1 -1
  163. agno/os/interfaces/agui/router.py +18 -3
  164. agno/os/interfaces/agui/utils.py +152 -39
  165. agno/os/interfaces/slack/router.py +55 -37
  166. agno/os/interfaces/slack/slack.py +9 -1
  167. agno/os/interfaces/whatsapp/router.py +0 -1
  168. agno/os/interfaces/whatsapp/security.py +3 -1
  169. agno/os/mcp.py +110 -52
  170. agno/os/middleware/__init__.py +2 -0
  171. agno/os/middleware/jwt.py +676 -112
  172. agno/os/router.py +40 -1478
  173. agno/os/routers/agents/__init__.py +3 -0
  174. agno/os/routers/agents/router.py +599 -0
  175. agno/os/routers/agents/schema.py +261 -0
  176. agno/os/routers/evals/evals.py +96 -39
  177. agno/os/routers/evals/schemas.py +65 -33
  178. agno/os/routers/evals/utils.py +80 -10
  179. agno/os/routers/health.py +10 -4
  180. agno/os/routers/knowledge/knowledge.py +196 -38
  181. agno/os/routers/knowledge/schemas.py +82 -22
  182. agno/os/routers/memory/memory.py +279 -52
  183. agno/os/routers/memory/schemas.py +46 -17
  184. agno/os/routers/metrics/metrics.py +20 -8
  185. agno/os/routers/metrics/schemas.py +16 -16
  186. agno/os/routers/session/session.py +462 -34
  187. agno/os/routers/teams/__init__.py +3 -0
  188. agno/os/routers/teams/router.py +512 -0
  189. agno/os/routers/teams/schema.py +257 -0
  190. agno/os/routers/traces/__init__.py +3 -0
  191. agno/os/routers/traces/schemas.py +414 -0
  192. agno/os/routers/traces/traces.py +499 -0
  193. agno/os/routers/workflows/__init__.py +3 -0
  194. agno/os/routers/workflows/router.py +624 -0
  195. agno/os/routers/workflows/schema.py +75 -0
  196. agno/os/schema.py +256 -693
  197. agno/os/scopes.py +469 -0
  198. agno/os/utils.py +514 -36
  199. agno/reasoning/anthropic.py +80 -0
  200. agno/reasoning/gemini.py +73 -0
  201. agno/reasoning/openai.py +5 -0
  202. agno/reasoning/vertexai.py +76 -0
  203. agno/run/__init__.py +6 -0
  204. agno/run/agent.py +155 -32
  205. agno/run/base.py +55 -3
  206. agno/run/requirement.py +181 -0
  207. agno/run/team.py +125 -38
  208. agno/run/workflow.py +72 -18
  209. agno/session/agent.py +102 -89
  210. agno/session/summary.py +56 -15
  211. agno/session/team.py +164 -90
  212. agno/session/workflow.py +405 -40
  213. agno/table.py +10 -0
  214. agno/team/team.py +3974 -1903
  215. agno/tools/dalle.py +2 -4
  216. agno/tools/eleven_labs.py +23 -25
  217. agno/tools/exa.py +21 -16
  218. agno/tools/file.py +153 -23
  219. agno/tools/file_generation.py +16 -10
  220. agno/tools/firecrawl.py +15 -7
  221. agno/tools/function.py +193 -38
  222. agno/tools/gmail.py +238 -14
  223. agno/tools/google_drive.py +271 -0
  224. agno/tools/googlecalendar.py +36 -8
  225. agno/tools/googlesheets.py +20 -5
  226. agno/tools/jira.py +20 -0
  227. agno/tools/mcp/__init__.py +10 -0
  228. agno/tools/mcp/mcp.py +331 -0
  229. agno/tools/mcp/multi_mcp.py +347 -0
  230. agno/tools/mcp/params.py +24 -0
  231. agno/tools/mcp_toolbox.py +3 -3
  232. agno/tools/models/nebius.py +5 -5
  233. agno/tools/models_labs.py +20 -10
  234. agno/tools/nano_banana.py +151 -0
  235. agno/tools/notion.py +204 -0
  236. agno/tools/parallel.py +314 -0
  237. agno/tools/postgres.py +76 -36
  238. agno/tools/redshift.py +406 -0
  239. agno/tools/scrapegraph.py +1 -1
  240. agno/tools/shopify.py +1519 -0
  241. agno/tools/slack.py +18 -3
  242. agno/tools/spotify.py +919 -0
  243. agno/tools/tavily.py +146 -0
  244. agno/tools/toolkit.py +25 -0
  245. agno/tools/workflow.py +8 -1
  246. agno/tools/yfinance.py +12 -11
  247. agno/tracing/__init__.py +12 -0
  248. agno/tracing/exporter.py +157 -0
  249. agno/tracing/schemas.py +276 -0
  250. agno/tracing/setup.py +111 -0
  251. agno/utils/agent.py +938 -0
  252. agno/utils/cryptography.py +22 -0
  253. agno/utils/dttm.py +33 -0
  254. agno/utils/events.py +151 -3
  255. agno/utils/gemini.py +15 -5
  256. agno/utils/hooks.py +118 -4
  257. agno/utils/http.py +113 -2
  258. agno/utils/knowledge.py +12 -5
  259. agno/utils/log.py +1 -0
  260. agno/utils/mcp.py +92 -2
  261. agno/utils/media.py +187 -1
  262. agno/utils/merge_dict.py +3 -3
  263. agno/utils/message.py +60 -0
  264. agno/utils/models/ai_foundry.py +9 -2
  265. agno/utils/models/claude.py +49 -14
  266. agno/utils/models/cohere.py +9 -2
  267. agno/utils/models/llama.py +9 -2
  268. agno/utils/models/mistral.py +4 -2
  269. agno/utils/print_response/agent.py +109 -16
  270. agno/utils/print_response/team.py +223 -30
  271. agno/utils/print_response/workflow.py +251 -34
  272. agno/utils/streamlit.py +1 -1
  273. agno/utils/team.py +98 -9
  274. agno/utils/tokens.py +657 -0
  275. agno/vectordb/base.py +39 -7
  276. agno/vectordb/cassandra/cassandra.py +21 -5
  277. agno/vectordb/chroma/chromadb.py +43 -12
  278. agno/vectordb/clickhouse/clickhousedb.py +21 -5
  279. agno/vectordb/couchbase/couchbase.py +29 -5
  280. agno/vectordb/lancedb/lance_db.py +92 -181
  281. agno/vectordb/langchaindb/langchaindb.py +24 -4
  282. agno/vectordb/lightrag/lightrag.py +17 -3
  283. agno/vectordb/llamaindex/llamaindexdb.py +25 -5
  284. agno/vectordb/milvus/milvus.py +50 -37
  285. agno/vectordb/mongodb/__init__.py +7 -1
  286. agno/vectordb/mongodb/mongodb.py +36 -30
  287. agno/vectordb/pgvector/pgvector.py +201 -77
  288. agno/vectordb/pineconedb/pineconedb.py +41 -23
  289. agno/vectordb/qdrant/qdrant.py +67 -54
  290. agno/vectordb/redis/__init__.py +9 -0
  291. agno/vectordb/redis/redisdb.py +682 -0
  292. agno/vectordb/singlestore/singlestore.py +50 -29
  293. agno/vectordb/surrealdb/surrealdb.py +31 -41
  294. agno/vectordb/upstashdb/upstashdb.py +34 -6
  295. agno/vectordb/weaviate/weaviate.py +53 -14
  296. agno/workflow/__init__.py +2 -0
  297. agno/workflow/agent.py +299 -0
  298. agno/workflow/condition.py +120 -18
  299. agno/workflow/loop.py +77 -10
  300. agno/workflow/parallel.py +231 -143
  301. agno/workflow/router.py +118 -17
  302. agno/workflow/step.py +609 -170
  303. agno/workflow/steps.py +73 -6
  304. agno/workflow/types.py +96 -21
  305. agno/workflow/workflow.py +2039 -262
  306. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/METADATA +201 -66
  307. agno-2.3.13.dist-info/RECORD +613 -0
  308. agno/tools/googlesearch.py +0 -98
  309. agno/tools/mcp.py +0 -679
  310. agno/tools/memori.py +0 -339
  311. agno-2.1.2.dist-info/RECORD +0 -543
  312. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +0 -0
  313. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/licenses/LICENSE +0 -0
  314. {agno-2.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,190 @@
1
+ from dataclasses import dataclass
2
+ from os import getenv
3
+ from typing import Any, Dict, List, Optional, Type, Union
4
+
5
+ import httpx
6
+ from pydantic import BaseModel
7
+
8
+ from agno.models.anthropic import Claude as AnthropicClaude
9
+ from agno.utils.http import get_default_async_client, get_default_sync_client
10
+ from agno.utils.log import log_debug, log_warning
11
+ from agno.utils.models.claude import format_tools_for_model
12
+
13
+ try:
14
+ from anthropic import AnthropicVertex, AsyncAnthropicVertex
15
+ except ImportError as e:
16
+ raise ImportError("`anthropic` not installed. Please install it with `pip install anthropic`") from e
17
+
18
+
@dataclass
class Claude(AnthropicClaude):
    """
    Anthropic Claude model served through Google Cloud Vertex AI.

    Builds on ``AnthropicClaude`` but creates ``AnthropicVertex`` /
    ``AsyncAnthropicVertex`` clients, which are configured with a region,
    a project ID and an optional base URL instead of an API key.

    For more information, see: https://docs.anthropic.com/en/api/messages
    """

    id: str = "claude-sonnet-4@20250514"
    name: str = "Claude"
    provider: str = "VertexAI"

    # Client parameters. Each one falls back to an environment variable in
    # `_get_client_params` when left as None.
    region: Optional[str] = None
    project_id: Optional[str] = None
    base_url: Optional[str] = None

    # Lazily created (and cached) SDK clients.
    client: Optional[AnthropicVertex] = None  # type: ignore
    async_client: Optional[AsyncAnthropicVertex] = None  # type: ignore

    def __post_init__(self):
        """Validate model configuration after initialization."""
        # Validate thinking support immediately at model creation
        if self.thinking:
            self._validate_thinking_support()
        # Overwrite output schema support for VertexAI Claude
        self.supports_native_structured_outputs = False
        self.supports_json_schema_outputs = False

    def _get_client_params(self) -> Dict[str, Any]:
        """
        Assemble the keyword arguments used to construct the Vertex clients.

        Explicit attributes take precedence over the ``CLOUD_ML_REGION``,
        ``ANTHROPIC_VERTEX_PROJECT_ID`` and ``ANTHROPIC_VERTEX_BASE_URL``
        environment variables. Entries in ``self.client_params`` override
        those values, and ``self.default_headers`` is applied last.

        Returns:
            Dict[str, Any]: The client constructor keyword arguments.
        """
        client_params: Dict[str, Any] = {}

        resolved: Dict[str, Optional[str]] = {
            "region": self.region or getenv("CLOUD_ML_REGION"),
            "project_id": self.project_id or getenv("ANTHROPIC_VERTEX_PROJECT_ID"),
            "base_url": self.base_url or getenv("ANTHROPIC_VERTEX_BASE_URL"),
        }
        # Only forward values that were actually resolved. Passing an explicit
        # None would presumably be treated by the SDK as "given" and skip its
        # own validation/defaults -- NOTE(review): confirm against the
        # AnthropicVertex constructor.
        for key, value in resolved.items():
            if value is not None:
                client_params[key] = value

        if self.timeout is not None:
            client_params["timeout"] = self.timeout

        # Add additional client parameters
        if self.client_params is not None:
            client_params.update(self.client_params)
        if self.default_headers is not None:
            client_params["default_headers"] = self.default_headers
        return client_params

    def get_client(self) -> AnthropicVertex:
        """
        Return the synchronous Vertex client, creating it when necessary.

        A cached client is reused as long as it has not been closed. A
        user-supplied ``http_client`` is honoured only when it is an
        ``httpx.Client``; otherwise the shared default sync client is used.
        """
        if self.client and not self.client.is_closed():
            return self.client

        _client_params = self._get_client_params()
        if isinstance(self.http_client, httpx.Client):
            _client_params["http_client"] = self.http_client
        else:
            if self.http_client:
                log_warning("http_client is not an instance of httpx.Client. Using default global httpx.Client.")
            # Use the global sync client when no valid custom client is provided
            _client_params["http_client"] = get_default_sync_client()
        self.client = AnthropicVertex(**_client_params)
        return self.client

    def get_async_client(self) -> AsyncAnthropicVertex:
        """
        Return the asynchronous Vertex client, creating it when necessary.

        A cached client is reused as long as it has not been closed. A
        user-supplied ``http_client`` is honoured only when it is an
        ``httpx.AsyncClient``; otherwise the shared default async client is used.
        """
        if self.async_client and not self.async_client.is_closed():
            return self.async_client

        _client_params = self._get_client_params()
        if isinstance(self.http_client, httpx.AsyncClient):
            _client_params["http_client"] = self.http_client
        else:
            if self.http_client:
                log_warning(
                    "http_client is not an instance of httpx.AsyncClient. Using default global httpx.AsyncClient."
                )
            # Use the global async client when no valid custom client is provided
            _client_params["http_client"] = get_default_async_client()
        self.async_client = AsyncAnthropicVertex(**_client_params)
        return self.async_client

    def get_request_params(
        self,
        response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
        tools: Optional[List[Dict[str, Any]]] = None,
    ) -> Dict[str, Any]:
        """
        Generate keyword arguments for API requests.

        Args:
            response_format: Accepted for signature compatibility; not used here.
            tools: Accepted for signature compatibility; not used here.

        Returns:
            Dict[str, Any]: The keyword arguments for API requests.
        """
        # Validate thinking support if thinking is enabled
        if self.thinking:
            self._validate_thinking_support()

        _request_params: Dict[str, Any] = {}
        if self.max_tokens:
            _request_params["max_tokens"] = self.max_tokens
        if self.thinking:
            _request_params["thinking"] = self.thinking
        # Sampling parameters are compared against None rather than tested for
        # truthiness so that an explicit 0 (e.g. temperature=0) is sent.
        if self.temperature is not None:
            _request_params["temperature"] = self.temperature
        if self.stop_sequences:
            _request_params["stop_sequences"] = self.stop_sequences
        if self.top_p is not None:
            _request_params["top_p"] = self.top_p
        if self.top_k is not None:
            _request_params["top_k"] = self.top_k
        if self.timeout:
            _request_params["timeout"] = self.timeout

        # Forward any configured betas (copied so the caller's list is not shared)
        if self.betas:
            _request_params["betas"] = list(self.betas)

        # User-supplied request parameters override everything above
        if self.request_params:
            _request_params.update(self.request_params)

        if _request_params:
            log_debug(f"Calling {self.provider} with request parameters: {_request_params}", log_level=2)
        return _request_params

    def _prepare_request_kwargs(
        self,
        system_message: str,
        tools: Optional[List[Dict[str, Any]]] = None,
        response_format: Optional[Union[Dict, Type[BaseModel]]] = None,
    ) -> Dict[str, Any]:
        """
        Prepare the request keyword arguments for the API call.

        Args:
            system_message (str): The concatenated system messages.
            tools: Optional list of tools
            response_format: Optional response format (Pydantic model or dict)

        Returns:
            Dict[str, Any]: The request keyword arguments.
        """
        # Copy so additions below never mutate the dict returned by get_request_params
        request_kwargs = self.get_request_params(response_format=response_format, tools=tools).copy()

        if system_message:
            system_block: Dict[str, Any] = {"text": system_message, "type": "text"}
            if self.cache_system_prompt:
                # Extended caching asks for a one-hour TTL; otherwise no TTL is sent
                if self.extended_cache_time is True:
                    system_block["cache_control"] = {"type": "ephemeral", "ttl": "1h"}
                else:
                    system_block["cache_control"] = {"type": "ephemeral"}
            request_kwargs["system"] = [system_block]

        # Convert tool definitions into the format expected by the model
        if tools:
            request_kwargs["tools"] = format_tools_for_model(tools)

        if request_kwargs:
            log_debug(f"Calling {self.provider} with request parameters: {request_kwargs}", log_level=2)
        return request_kwargs
agno/models/vllm/vllm.py CHANGED
@@ -4,6 +4,7 @@ from typing import Any, Dict, List, Optional, Type, Union
4
4
 
5
5
  from pydantic import BaseModel
6
6
 
7
+ from agno.exceptions import ModelAuthenticationError
7
8
  from agno.models.openai.like import OpenAILike
8
9
  from agno.utils.log import log_debug
9
10
 
@@ -29,8 +30,8 @@ class VLLM(OpenAILike):
29
30
  name: str = "VLLM"
30
31
  provider: str = "VLLM"
31
32
 
32
- api_key: Optional[str] = getenv("VLLM_API_KEY") or "EMPTY"
33
- base_url: Optional[str] = getenv("VLLM_BASE_URL", "http://localhost:8000/v1/")
33
+ api_key: Optional[str] = None
34
+ base_url: Optional[str] = None
34
35
 
35
36
  temperature: float = 0.7
36
37
  top_p: float = 0.8
@@ -38,19 +39,23 @@ class VLLM(OpenAILike):
38
39
  top_k: Optional[int] = None
39
40
  enable_thinking: Optional[bool] = None
40
41
 
41
- def __post_init__(self):
42
- """Validate required configuration"""
43
- if not self.base_url:
44
- raise ValueError("VLLM_BASE_URL must be set via environment variable or explicit initialization")
45
- if self.id == "not-set":
46
- raise ValueError("Model ID must be set via environment variable or explicit initialization")
42
+ def _get_client_params(self) -> Dict[str, Any]:
43
+ """
44
+ Returns client parameters for API requests, checking for VLLM_API_KEY.
47
45
 
48
- body: Dict[str, Any] = {}
49
- if self.top_k is not None:
50
- body["top_k"] = self.top_k
51
- if self.enable_thinking is not None:
52
- body["chat_template_kwargs"] = {"enable_thinking": self.enable_thinking}
53
- self.extra_body = body or None
46
+ Returns:
47
+ Dict[str, Any]: A dictionary of client parameters for API requests.
48
+ """
49
+ if not self.api_key:
50
+ self.api_key = getenv("VLLM_API_KEY")
51
+ if not self.api_key:
52
+ raise ModelAuthenticationError(
53
+ message="VLLM_API_KEY not set. Please set the VLLM_API_KEY environment variable.",
54
+ model_name=self.name,
55
+ )
56
+ if not self.base_url:
57
+ self.base_url = getenv("VLLM_BASE_URL", "http://localhost:8000/v1/")
58
+ return super()._get_client_params()
54
59
 
55
60
  def get_request_params(
56
61
  self,
agno/models/xai/xai.py CHANGED
@@ -1,9 +1,10 @@
1
- from dataclasses import dataclass, field
1
+ from dataclasses import dataclass
2
2
  from os import getenv
3
3
  from typing import Any, Dict, List, Optional, Type, Union
4
4
 
5
5
  from pydantic import BaseModel
6
6
 
7
+ from agno.exceptions import ModelAuthenticationError
7
8
  from agno.models.message import Citations, UrlCitation
8
9
  from agno.models.openai.like import OpenAILike
9
10
  from agno.models.response import ModelResponse
@@ -34,11 +35,27 @@ class xAI(OpenAILike):
34
35
  name: str = "xAI"
35
36
  provider: str = "xAI"
36
37
 
37
- api_key: Optional[str] = field(default_factory=lambda: getenv("XAI_API_KEY"))
38
+ api_key: Optional[str] = None
38
39
  base_url: str = "https://api.x.ai/v1"
39
40
 
40
41
  search_parameters: Optional[Dict[str, Any]] = None
41
42
 
def _get_client_params(self) -> Dict[str, Any]:
    """
    Resolve the xAI API key, then delegate to the parent implementation.

    An ``api_key`` already set on the model is used as-is; otherwise the
    ``XAI_API_KEY`` environment variable is consulted.

    Returns:
        Dict[str, Any]: A dictionary of client parameters for API requests.

    Raises:
        ModelAuthenticationError: If no API key is set on the model or in
            the environment.
    """
    resolved_key = self.api_key or getenv("XAI_API_KEY")
    self.api_key = resolved_key
    if not resolved_key:
        raise ModelAuthenticationError(
            message="XAI_API_KEY not set. Please set the XAI_API_KEY environment variable.",
            model_name=self.name,
        )
    return super()._get_client_params()
58
+
42
59
  def get_request_params(
43
60
  self,
44
61
  response_format: Optional[Union[Dict, Type[BaseModel]]] = None,