agno 2.0.0rc2__py3-none-any.whl → 2.3.0__py3-none-any.whl

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Files changed (331)
  1. agno/agent/agent.py +6009 -2874
  2. agno/api/api.py +2 -0
  3. agno/api/os.py +1 -1
  4. agno/culture/__init__.py +3 -0
  5. agno/culture/manager.py +956 -0
  6. agno/db/async_postgres/__init__.py +3 -0
  7. agno/db/base.py +385 -6
  8. agno/db/dynamo/dynamo.py +388 -81
  9. agno/db/dynamo/schemas.py +47 -10
  10. agno/db/dynamo/utils.py +63 -4
  11. agno/db/firestore/firestore.py +435 -64
  12. agno/db/firestore/schemas.py +11 -0
  13. agno/db/firestore/utils.py +102 -4
  14. agno/db/gcs_json/gcs_json_db.py +384 -42
  15. agno/db/gcs_json/utils.py +60 -26
  16. agno/db/in_memory/in_memory_db.py +351 -66
  17. agno/db/in_memory/utils.py +60 -2
  18. agno/db/json/json_db.py +339 -48
  19. agno/db/json/utils.py +60 -26
  20. agno/db/migrations/manager.py +199 -0
  21. agno/db/migrations/v1_to_v2.py +510 -37
  22. agno/db/migrations/versions/__init__.py +0 -0
  23. agno/db/migrations/versions/v2_3_0.py +938 -0
  24. agno/db/mongo/__init__.py +15 -1
  25. agno/db/mongo/async_mongo.py +2036 -0
  26. agno/db/mongo/mongo.py +653 -76
  27. agno/db/mongo/schemas.py +13 -0
  28. agno/db/mongo/utils.py +80 -8
  29. agno/db/mysql/mysql.py +687 -25
  30. agno/db/mysql/schemas.py +61 -37
  31. agno/db/mysql/utils.py +60 -2
  32. agno/db/postgres/__init__.py +2 -1
  33. agno/db/postgres/async_postgres.py +2001 -0
  34. agno/db/postgres/postgres.py +676 -57
  35. agno/db/postgres/schemas.py +43 -18
  36. agno/db/postgres/utils.py +164 -2
  37. agno/db/redis/redis.py +344 -38
  38. agno/db/redis/schemas.py +18 -0
  39. agno/db/redis/utils.py +60 -2
  40. agno/db/schemas/__init__.py +2 -1
  41. agno/db/schemas/culture.py +120 -0
  42. agno/db/schemas/memory.py +13 -0
  43. agno/db/singlestore/schemas.py +26 -1
  44. agno/db/singlestore/singlestore.py +687 -53
  45. agno/db/singlestore/utils.py +60 -2
  46. agno/db/sqlite/__init__.py +2 -1
  47. agno/db/sqlite/async_sqlite.py +2371 -0
  48. agno/db/sqlite/schemas.py +24 -0
  49. agno/db/sqlite/sqlite.py +774 -85
  50. agno/db/sqlite/utils.py +168 -5
  51. agno/db/surrealdb/__init__.py +3 -0
  52. agno/db/surrealdb/metrics.py +292 -0
  53. agno/db/surrealdb/models.py +309 -0
  54. agno/db/surrealdb/queries.py +71 -0
  55. agno/db/surrealdb/surrealdb.py +1361 -0
  56. agno/db/surrealdb/utils.py +147 -0
  57. agno/db/utils.py +50 -22
  58. agno/eval/accuracy.py +50 -43
  59. agno/eval/performance.py +6 -3
  60. agno/eval/reliability.py +6 -3
  61. agno/eval/utils.py +33 -16
  62. agno/exceptions.py +68 -1
  63. agno/filters.py +354 -0
  64. agno/guardrails/__init__.py +6 -0
  65. agno/guardrails/base.py +19 -0
  66. agno/guardrails/openai.py +144 -0
  67. agno/guardrails/pii.py +94 -0
  68. agno/guardrails/prompt_injection.py +52 -0
  69. agno/integrations/discord/client.py +1 -0
  70. agno/knowledge/chunking/agentic.py +13 -10
  71. agno/knowledge/chunking/fixed.py +1 -1
  72. agno/knowledge/chunking/semantic.py +40 -8
  73. agno/knowledge/chunking/strategy.py +59 -15
  74. agno/knowledge/embedder/aws_bedrock.py +9 -4
  75. agno/knowledge/embedder/azure_openai.py +54 -0
  76. agno/knowledge/embedder/base.py +2 -0
  77. agno/knowledge/embedder/cohere.py +184 -5
  78. agno/knowledge/embedder/fastembed.py +1 -1
  79. agno/knowledge/embedder/google.py +79 -1
  80. agno/knowledge/embedder/huggingface.py +9 -4
  81. agno/knowledge/embedder/jina.py +63 -0
  82. agno/knowledge/embedder/mistral.py +78 -11
  83. agno/knowledge/embedder/nebius.py +1 -1
  84. agno/knowledge/embedder/ollama.py +13 -0
  85. agno/knowledge/embedder/openai.py +37 -65
  86. agno/knowledge/embedder/sentence_transformer.py +8 -4
  87. agno/knowledge/embedder/vllm.py +262 -0
  88. agno/knowledge/embedder/voyageai.py +69 -16
  89. agno/knowledge/knowledge.py +595 -187
  90. agno/knowledge/reader/base.py +9 -2
  91. agno/knowledge/reader/csv_reader.py +8 -10
  92. agno/knowledge/reader/docx_reader.py +5 -6
  93. agno/knowledge/reader/field_labeled_csv_reader.py +290 -0
  94. agno/knowledge/reader/json_reader.py +6 -5
  95. agno/knowledge/reader/markdown_reader.py +13 -13
  96. agno/knowledge/reader/pdf_reader.py +43 -68
  97. agno/knowledge/reader/pptx_reader.py +101 -0
  98. agno/knowledge/reader/reader_factory.py +51 -6
  99. agno/knowledge/reader/s3_reader.py +3 -15
  100. agno/knowledge/reader/tavily_reader.py +194 -0
  101. agno/knowledge/reader/text_reader.py +13 -13
  102. agno/knowledge/reader/web_search_reader.py +2 -43
  103. agno/knowledge/reader/website_reader.py +43 -25
  104. agno/knowledge/reranker/__init__.py +3 -0
  105. agno/knowledge/types.py +9 -0
  106. agno/knowledge/utils.py +20 -0
  107. agno/media.py +339 -266
  108. agno/memory/manager.py +336 -82
  109. agno/models/aimlapi/aimlapi.py +2 -2
  110. agno/models/anthropic/claude.py +183 -37
  111. agno/models/aws/bedrock.py +52 -112
  112. agno/models/aws/claude.py +33 -1
  113. agno/models/azure/ai_foundry.py +33 -15
  114. agno/models/azure/openai_chat.py +25 -8
  115. agno/models/base.py +1011 -566
  116. agno/models/cerebras/cerebras.py +19 -13
  117. agno/models/cerebras/cerebras_openai.py +8 -5
  118. agno/models/cohere/chat.py +27 -1
  119. agno/models/cometapi/__init__.py +5 -0
  120. agno/models/cometapi/cometapi.py +57 -0
  121. agno/models/dashscope/dashscope.py +1 -0
  122. agno/models/deepinfra/deepinfra.py +2 -2
  123. agno/models/deepseek/deepseek.py +2 -2
  124. agno/models/fireworks/fireworks.py +2 -2
  125. agno/models/google/gemini.py +110 -37
  126. agno/models/groq/groq.py +28 -11
  127. agno/models/huggingface/huggingface.py +2 -1
  128. agno/models/internlm/internlm.py +2 -2
  129. agno/models/langdb/langdb.py +4 -4
  130. agno/models/litellm/chat.py +18 -1
  131. agno/models/litellm/litellm_openai.py +2 -2
  132. agno/models/llama_cpp/__init__.py +5 -0
  133. agno/models/llama_cpp/llama_cpp.py +22 -0
  134. agno/models/message.py +143 -4
  135. agno/models/meta/llama.py +27 -10
  136. agno/models/meta/llama_openai.py +5 -17
  137. agno/models/nebius/nebius.py +6 -6
  138. agno/models/nexus/__init__.py +3 -0
  139. agno/models/nexus/nexus.py +22 -0
  140. agno/models/nvidia/nvidia.py +2 -2
  141. agno/models/ollama/chat.py +60 -6
  142. agno/models/openai/chat.py +102 -43
  143. agno/models/openai/responses.py +103 -106
  144. agno/models/openrouter/openrouter.py +41 -3
  145. agno/models/perplexity/perplexity.py +4 -5
  146. agno/models/portkey/portkey.py +3 -3
  147. agno/models/requesty/__init__.py +5 -0
  148. agno/models/requesty/requesty.py +52 -0
  149. agno/models/response.py +81 -5
  150. agno/models/sambanova/sambanova.py +2 -2
  151. agno/models/siliconflow/__init__.py +5 -0
  152. agno/models/siliconflow/siliconflow.py +25 -0
  153. agno/models/together/together.py +2 -2
  154. agno/models/utils.py +254 -8
  155. agno/models/vercel/v0.py +2 -2
  156. agno/models/vertexai/__init__.py +0 -0
  157. agno/models/vertexai/claude.py +96 -0
  158. agno/models/vllm/vllm.py +1 -0
  159. agno/models/xai/xai.py +3 -2
  160. agno/os/app.py +543 -175
  161. agno/os/auth.py +24 -14
  162. agno/os/config.py +1 -0
  163. agno/os/interfaces/__init__.py +1 -0
  164. agno/os/interfaces/a2a/__init__.py +3 -0
  165. agno/os/interfaces/a2a/a2a.py +42 -0
  166. agno/os/interfaces/a2a/router.py +250 -0
  167. agno/os/interfaces/a2a/utils.py +924 -0
  168. agno/os/interfaces/agui/agui.py +23 -7
  169. agno/os/interfaces/agui/router.py +27 -3
  170. agno/os/interfaces/agui/utils.py +242 -142
  171. agno/os/interfaces/base.py +6 -2
  172. agno/os/interfaces/slack/router.py +81 -23
  173. agno/os/interfaces/slack/slack.py +29 -14
  174. agno/os/interfaces/whatsapp/router.py +11 -4
  175. agno/os/interfaces/whatsapp/whatsapp.py +14 -7
  176. agno/os/mcp.py +111 -54
  177. agno/os/middleware/__init__.py +7 -0
  178. agno/os/middleware/jwt.py +233 -0
  179. agno/os/router.py +556 -139
  180. agno/os/routers/evals/evals.py +71 -34
  181. agno/os/routers/evals/schemas.py +31 -31
  182. agno/os/routers/evals/utils.py +6 -5
  183. agno/os/routers/health.py +31 -0
  184. agno/os/routers/home.py +52 -0
  185. agno/os/routers/knowledge/knowledge.py +185 -38
  186. agno/os/routers/knowledge/schemas.py +82 -22
  187. agno/os/routers/memory/memory.py +158 -53
  188. agno/os/routers/memory/schemas.py +20 -16
  189. agno/os/routers/metrics/metrics.py +20 -8
  190. agno/os/routers/metrics/schemas.py +16 -16
  191. agno/os/routers/session/session.py +499 -38
  192. agno/os/schema.py +308 -198
  193. agno/os/utils.py +401 -41
  194. agno/reasoning/anthropic.py +80 -0
  195. agno/reasoning/azure_ai_foundry.py +2 -2
  196. agno/reasoning/deepseek.py +2 -2
  197. agno/reasoning/default.py +3 -1
  198. agno/reasoning/gemini.py +73 -0
  199. agno/reasoning/groq.py +2 -2
  200. agno/reasoning/ollama.py +2 -2
  201. agno/reasoning/openai.py +7 -2
  202. agno/reasoning/vertexai.py +76 -0
  203. agno/run/__init__.py +6 -0
  204. agno/run/agent.py +266 -112
  205. agno/run/base.py +53 -24
  206. agno/run/team.py +252 -111
  207. agno/run/workflow.py +156 -45
  208. agno/session/agent.py +105 -89
  209. agno/session/summary.py +65 -25
  210. agno/session/team.py +176 -96
  211. agno/session/workflow.py +406 -40
  212. agno/team/team.py +3854 -1692
  213. agno/tools/brightdata.py +3 -3
  214. agno/tools/cartesia.py +3 -5
  215. agno/tools/dalle.py +9 -8
  216. agno/tools/decorator.py +4 -2
  217. agno/tools/desi_vocal.py +2 -2
  218. agno/tools/duckduckgo.py +15 -11
  219. agno/tools/e2b.py +20 -13
  220. agno/tools/eleven_labs.py +26 -28
  221. agno/tools/exa.py +21 -16
  222. agno/tools/fal.py +4 -4
  223. agno/tools/file.py +153 -23
  224. agno/tools/file_generation.py +350 -0
  225. agno/tools/firecrawl.py +4 -4
  226. agno/tools/function.py +257 -37
  227. agno/tools/giphy.py +2 -2
  228. agno/tools/gmail.py +238 -14
  229. agno/tools/google_drive.py +270 -0
  230. agno/tools/googlecalendar.py +36 -8
  231. agno/tools/googlesheets.py +20 -5
  232. agno/tools/jira.py +20 -0
  233. agno/tools/knowledge.py +3 -3
  234. agno/tools/lumalab.py +3 -3
  235. agno/tools/mcp/__init__.py +10 -0
  236. agno/tools/mcp/mcp.py +331 -0
  237. agno/tools/mcp/multi_mcp.py +347 -0
  238. agno/tools/mcp/params.py +24 -0
  239. agno/tools/mcp_toolbox.py +284 -0
  240. agno/tools/mem0.py +11 -17
  241. agno/tools/memori.py +1 -53
  242. agno/tools/memory.py +419 -0
  243. agno/tools/models/azure_openai.py +2 -2
  244. agno/tools/models/gemini.py +3 -3
  245. agno/tools/models/groq.py +3 -5
  246. agno/tools/models/nebius.py +7 -7
  247. agno/tools/models_labs.py +25 -15
  248. agno/tools/notion.py +204 -0
  249. agno/tools/openai.py +4 -9
  250. agno/tools/opencv.py +3 -3
  251. agno/tools/parallel.py +314 -0
  252. agno/tools/replicate.py +7 -7
  253. agno/tools/scrapegraph.py +58 -31
  254. agno/tools/searxng.py +2 -2
  255. agno/tools/serper.py +2 -2
  256. agno/tools/slack.py +18 -3
  257. agno/tools/spider.py +2 -2
  258. agno/tools/tavily.py +146 -0
  259. agno/tools/whatsapp.py +1 -1
  260. agno/tools/workflow.py +278 -0
  261. agno/tools/yfinance.py +12 -11
  262. agno/utils/agent.py +820 -0
  263. agno/utils/audio.py +27 -0
  264. agno/utils/common.py +90 -1
  265. agno/utils/events.py +222 -7
  266. agno/utils/gemini.py +181 -23
  267. agno/utils/hooks.py +57 -0
  268. agno/utils/http.py +111 -0
  269. agno/utils/knowledge.py +12 -5
  270. agno/utils/log.py +1 -0
  271. agno/utils/mcp.py +95 -5
  272. agno/utils/media.py +188 -10
  273. agno/utils/merge_dict.py +22 -1
  274. agno/utils/message.py +60 -0
  275. agno/utils/models/claude.py +40 -11
  276. agno/utils/models/cohere.py +1 -1
  277. agno/utils/models/watsonx.py +1 -1
  278. agno/utils/openai.py +1 -1
  279. agno/utils/print_response/agent.py +105 -21
  280. agno/utils/print_response/team.py +103 -38
  281. agno/utils/print_response/workflow.py +251 -34
  282. agno/utils/reasoning.py +22 -1
  283. agno/utils/serialize.py +32 -0
  284. agno/utils/streamlit.py +16 -10
  285. agno/utils/string.py +41 -0
  286. agno/utils/team.py +98 -9
  287. agno/utils/tools.py +1 -1
  288. agno/vectordb/base.py +23 -4
  289. agno/vectordb/cassandra/cassandra.py +65 -9
  290. agno/vectordb/chroma/chromadb.py +182 -38
  291. agno/vectordb/clickhouse/clickhousedb.py +64 -11
  292. agno/vectordb/couchbase/couchbase.py +105 -10
  293. agno/vectordb/lancedb/lance_db.py +183 -135
  294. agno/vectordb/langchaindb/langchaindb.py +25 -7
  295. agno/vectordb/lightrag/lightrag.py +17 -3
  296. agno/vectordb/llamaindex/__init__.py +3 -0
  297. agno/vectordb/llamaindex/llamaindexdb.py +46 -7
  298. agno/vectordb/milvus/milvus.py +126 -9
  299. agno/vectordb/mongodb/__init__.py +7 -1
  300. agno/vectordb/mongodb/mongodb.py +112 -7
  301. agno/vectordb/pgvector/pgvector.py +142 -21
  302. agno/vectordb/pineconedb/pineconedb.py +80 -8
  303. agno/vectordb/qdrant/qdrant.py +125 -39
  304. agno/vectordb/redis/__init__.py +9 -0
  305. agno/vectordb/redis/redisdb.py +694 -0
  306. agno/vectordb/singlestore/singlestore.py +111 -25
  307. agno/vectordb/surrealdb/surrealdb.py +31 -5
  308. agno/vectordb/upstashdb/upstashdb.py +76 -8
  309. agno/vectordb/weaviate/weaviate.py +86 -15
  310. agno/workflow/__init__.py +2 -0
  311. agno/workflow/agent.py +299 -0
  312. agno/workflow/condition.py +112 -18
  313. agno/workflow/loop.py +69 -10
  314. agno/workflow/parallel.py +266 -118
  315. agno/workflow/router.py +110 -17
  316. agno/workflow/step.py +645 -136
  317. agno/workflow/steps.py +65 -6
  318. agno/workflow/types.py +71 -33
  319. agno/workflow/workflow.py +2113 -300
  320. agno-2.3.0.dist-info/METADATA +618 -0
  321. agno-2.3.0.dist-info/RECORD +577 -0
  322. agno-2.3.0.dist-info/licenses/LICENSE +201 -0
  323. agno/knowledge/reader/url_reader.py +0 -128
  324. agno/tools/googlesearch.py +0 -98
  325. agno/tools/mcp.py +0 -610
  326. agno/utils/models/aws_claude.py +0 -170
  327. agno-2.0.0rc2.dist-info/METADATA +0 -355
  328. agno-2.0.0rc2.dist-info/RECORD +0 -515
  329. agno-2.0.0rc2.dist-info/licenses/LICENSE +0 -375
  330. {agno-2.0.0rc2.dist-info → agno-2.3.0.dist-info}/WHEEL +0 -0
  331. {agno-2.0.0rc2.dist-info → agno-2.3.0.dist-info}/top_level.txt +0 -0
agno/knowledge/reader/text_reader.py CHANGED
@@ -8,7 +8,7 @@ from agno.knowledge.chunking.strategy import ChunkingStrategy, ChunkingStrategyT
8
8
  from agno.knowledge.document.base import Document
9
9
  from agno.knowledge.reader.base import Reader
10
10
  from agno.knowledge.types import ContentType
11
- from agno.utils.log import log_info, logger
11
+ from agno.utils.log import log_debug, log_error, log_warning
12
12
 
13
13
 
14
14
  class TextReader(Reader):
@@ -37,14 +37,14 @@ class TextReader(Reader):
37
37
  if isinstance(file, Path):
38
38
  if not file.exists():
39
39
  raise FileNotFoundError(f"Could not find file: {file}")
40
- log_info(f"Reading: {file}")
40
+ log_debug(f"Reading: {file}")
41
41
  file_name = name or file.stem
42
- file_contents = file.read_text("utf-8")
42
+ file_contents = file.read_text(self.encoding or "utf-8")
43
43
  else:
44
44
  file_name = name or file.name.split(".")[0]
45
- log_info(f"Reading uploaded file: {file_name}")
45
+ log_debug(f"Reading uploaded file: {file_name}")
46
46
  file.seek(0)
47
- file_contents = file.read().decode("utf-8")
47
+ file_contents = file.read().decode(self.encoding or "utf-8")
48
48
 
49
49
  documents = [
50
50
  Document(
@@ -60,7 +60,7 @@ class TextReader(Reader):
60
60
  return chunked_documents
61
61
  return documents
62
62
  except Exception as e:
63
- logger.error(f"Error reading: {file}: {e}")
63
+ log_error(f"Error reading: {file}: {e}")
64
64
  return []
65
65
 
66
66
  async def async_read(self, file: Union[Path, IO[Any]], name: Optional[str] = None) -> List[Document]:
@@ -69,22 +69,22 @@ class TextReader(Reader):
69
69
  if not file.exists():
70
70
  raise FileNotFoundError(f"Could not find file: {file}")
71
71
 
72
- log_info(f"Reading asynchronously: {file}")
72
+ log_debug(f"Reading asynchronously: {file}")
73
73
  file_name = name or file.stem
74
74
 
75
75
  try:
76
76
  import aiofiles
77
77
 
78
- async with aiofiles.open(file, "r", encoding="utf-8") as f:
78
+ async with aiofiles.open(file, "r", encoding=self.encoding or "utf-8") as f:
79
79
  file_contents = await f.read()
80
80
  except ImportError:
81
- logger.warning("aiofiles not installed, using synchronous file I/O")
82
- file_contents = file.read_text("utf-8")
81
+ log_warning("aiofiles not installed, using synchronous file I/O")
82
+ file_contents = file.read_text(self.encoding or "utf-8")
83
83
  else:
84
- log_info(f"Reading uploaded file asynchronously: {file.name}")
84
+ log_debug(f"Reading uploaded file asynchronously: {file.name}")
85
85
  file_name = name or file.name.split(".")[0]
86
86
  file.seek(0)
87
- file_contents = file.read().decode("utf-8")
87
+ file_contents = file.read().decode(self.encoding or "utf-8")
88
88
 
89
89
  document = Document(
90
90
  name=file_name,
@@ -96,7 +96,7 @@ class TextReader(Reader):
96
96
  return await self._async_chunk_document(document)
97
97
  return [document]
98
98
  except Exception as e:
99
- logger.error(f"Error reading asynchronously: {file}: {e}")
99
+ log_error(f"Error reading asynchronously: {file}: {e}")
100
100
  return []
101
101
 
102
102
  async def _async_chunk_document(self, document: Document) -> List[Document]:
agno/knowledge/reader/web_search_reader.py CHANGED
@@ -37,7 +37,7 @@ class WebSearchReader(Reader):
37
37
  user_agent: str = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
38
38
 
39
39
  # Search engine configuration
40
- search_engine: Literal["duckduckgo", "google"] = "duckduckgo"
40
+ search_engine: Literal["duckduckgo"] = "duckduckgo"
41
41
  search_delay: float = 3.0 # Delay between search requests
42
42
  max_search_retries: int = 2 # Retries for search operations
43
43
 
@@ -96,7 +96,7 @@ class WebSearchReader(Reader):
96
96
  results.append(
97
97
  {
98
98
  "title": result.get("title", ""),
99
- "url": result.get("link", ""),
99
+ "url": result.get("href", ""),
100
100
  "description": result.get("body", ""),
101
101
  }
102
102
  )
@@ -121,51 +121,10 @@ class WebSearchReader(Reader):
121
121
  return []
122
122
  return []
123
123
 
124
- def _perform_google_search(self, query: str) -> List[Dict[str, str]]:
125
- """Perform web search using Google (requires googlesearch-python)"""
126
- log_debug(f"Performing Google search for: {query}")
127
-
128
- try:
129
- from googlesearch import search
130
- except ImportError:
131
- logger.error("Google search requires 'googlesearch-python'. Install with: pip install googlesearch-python")
132
- return []
133
-
134
- for attempt in range(self.max_search_retries):
135
- try:
136
- self._respect_rate_limits()
137
-
138
- results = []
139
- search_results = search(query, num_results=self.max_results, stop=self.max_results)
140
-
141
- for result in search_results:
142
- results.append(
143
- {
144
- "title": getattr(result, "title", ""),
145
- "url": getattr(result, "url", ""),
146
- "description": getattr(result, "description", ""),
147
- }
148
- )
149
-
150
- log_debug(f"Found {len(results)} Google search results")
151
- return results
152
-
153
- except Exception as e:
154
- logger.warning(f"Google search attempt {attempt + 1} failed: {e}")
155
- if attempt < self.max_search_retries - 1:
156
- time.sleep(self.search_delay)
157
- else:
158
- logger.error(f"All Google search attempts failed: {e}")
159
- return []
160
-
161
- return []
162
-
163
124
  def _perform_web_search(self, query: str) -> List[Dict[str, str]]:
164
125
  """Perform web search using the configured search engine"""
165
126
  if self.search_engine == "duckduckgo":
166
127
  return self._perform_duckduckgo_search(query)
167
- elif self.search_engine == "google":
168
- return self._perform_google_search(query)
169
128
  else:
170
129
  logger.error(f"Unsupported search engine: {self.search_engine}")
171
130
  return []
agno/knowledge/reader/website_reader.py CHANGED
@@ -12,7 +12,7 @@ from agno.knowledge.chunking.strategy import ChunkingStrategy, ChunkingStrategyT
12
12
  from agno.knowledge.document.base import Document
13
13
  from agno.knowledge.reader.base import Reader
14
14
  from agno.knowledge.types import ContentType
15
- from agno.utils.log import log_debug, logger
15
+ from agno.utils.log import log_debug, log_error, log_warning
16
16
 
17
17
  try:
18
18
  from bs4 import BeautifulSoup, Tag # noqa: F401
@@ -106,23 +106,36 @@ class WebsiteReader(Reader):
106
106
  """
107
107
  Check if the tag matches any of the relevant tags or class names
108
108
  """
109
- if tag.name in ["article", "main"]:
109
+ if not isinstance(tag, Tag):
110
+ return False
111
+
112
+ if tag.name in ["article", "main", "section"]:
113
+ return True
114
+
115
+ classes_attr = tag.get("class")
116
+ classes: List[str] = classes_attr if isinstance(classes_attr, list) else []
117
+ content_classes = ["content", "main-content", "post-content", "entry-content", "article-body"]
118
+ if any(cls in content_classes for cls in classes):
110
119
  return True
111
- if any(cls in ["content", "main-content", "post-content"] for cls in tag.get("class", [])): # type: ignore
120
+
121
+ # Check for common content IDs
122
+ tag_id = tag.get("id", "")
123
+ if tag_id in ["content", "main", "article"]:
112
124
  return True
125
+
113
126
  return False
114
127
 
115
- # Use a single call to 'find' with a custom function to match tags or classes
128
+ # Try to find main content element
116
129
  element = soup.find(match)
117
- if element:
130
+ if element and hasattr(element, "find_all"):
131
+ # Remove common unwanted elements from the found content
132
+ for unwanted in element.find_all(["script", "style", "nav", "header", "footer"]):
133
+ unwanted.decompose()
118
134
  return element.get_text(strip=True, separator=" ")
119
135
 
120
- # If we only have a div without specific content classes, return empty string
121
- if soup.find("div") and not any(
122
- soup.find(class_=class_name) for class_name in ["content", "main-content", "post-content"]
123
- ):
124
- return ""
125
-
136
+ # Fallback: get full page content
137
+ for unwanted in soup.find_all(["script", "style", "nav", "header", "footer"]):
138
+ unwanted.decompose()
126
139
  return soup.get_text(strip=True, separator=" ")
127
140
 
128
141
  def crawl(self, url: str, starting_depth: int = 1) -> Dict[str, str]:
@@ -164,7 +177,7 @@ class WebsiteReader(Reader):
164
177
  if (
165
178
  current_url in self._visited
166
179
  or not urlparse(current_url).netloc.endswith(primary_domain)
167
- or current_depth > self.max_depth
180
+ or (current_depth > self.max_depth and current_url != url)
168
181
  or num_links >= self.max_links
169
182
  ):
170
183
  continue
@@ -174,13 +187,14 @@ class WebsiteReader(Reader):
174
187
 
175
188
  try:
176
189
  log_debug(f"Crawling: {current_url}")
190
+
177
191
  response = (
178
- httpx.get(current_url, timeout=self.timeout, proxy=self.proxy)
192
+ httpx.get(current_url, timeout=self.timeout, proxy=self.proxy, follow_redirects=True)
179
193
  if self.proxy
180
- else httpx.get(current_url, timeout=self.timeout)
194
+ else httpx.get(current_url, timeout=self.timeout, follow_redirects=True)
181
195
  )
182
-
183
196
  response.raise_for_status()
197
+
184
198
  soup = BeautifulSoup(response.content, "html.parser")
185
199
 
186
200
  # Extract main content
@@ -213,19 +227,23 @@ class WebsiteReader(Reader):
213
227
 
214
228
  except httpx.HTTPStatusError as e:
215
229
  # Log HTTP status errors but continue crawling other pages
216
- logger.warning(f"HTTP status error while crawling {current_url}: {e}")
217
- # For the initial URL, we should raise the error
218
- if current_url == url and not crawler_result:
230
+ # Skip redirect errors (3xx) as they should be handled by follow_redirects
231
+ if e.response.status_code >= 300 and e.response.status_code < 400:
232
+ log_debug(f"Redirect encountered for {current_url}, skipping: {e}")
233
+ else:
234
+ log_warning(f"HTTP status error while crawling {current_url}: {e}")
235
+ # For the initial URL, we should raise the error only if it's not a redirect
236
+ if current_url == url and not crawler_result and not (300 <= e.response.status_code < 400):
219
237
  raise
220
238
  except httpx.RequestError as e:
221
239
  # Log request errors but continue crawling other pages
222
- logger.warning(f"Request error while crawling {current_url}: {e}")
240
+ log_warning(f"Request error while crawling {current_url}: {e}")
223
241
  # For the initial URL, we should raise the error
224
242
  if current_url == url and not crawler_result:
225
243
  raise
226
244
  except Exception as e:
227
245
  # Log other exceptions but continue crawling other pages
228
- logger.warning(f"Failed to crawl {current_url}: {e}")
246
+ log_warning(f"Failed to crawl {current_url}: {e}")
229
247
  # For the initial URL, we should raise the error
230
248
  if current_url == url and not crawler_result:
231
249
  # Wrap non-HTTP exceptions in a RequestError
@@ -314,19 +332,19 @@ class WebsiteReader(Reader):
314
332
 
315
333
  except httpx.HTTPStatusError as e:
316
334
  # Log HTTP status errors but continue crawling other pages
317
- logger.warning(f"HTTP status error while crawling asynchronously {current_url}: {e}")
335
+ log_warning(f"HTTP status error while crawling asynchronously {current_url}: {e}")
318
336
  # For the initial URL, we should raise the error
319
337
  if current_url == url and not crawler_result:
320
338
  raise
321
339
  except httpx.RequestError as e:
322
340
  # Log request errors but continue crawling other pages
323
- logger.warning(f"Request error while crawling asynchronously {current_url}: {e}")
341
+ log_warning(f"Request error while crawling asynchronously {current_url}: {e}")
324
342
  # For the initial URL, we should raise the error
325
343
  if current_url == url and not crawler_result:
326
344
  raise
327
345
  except Exception as e:
328
346
  # Log other exceptions but continue crawling other pages
329
- logger.warning(f"Failed to crawl asynchronously {current_url}: {e}")
347
+ log_warning(f"Failed to crawl asynchronously {current_url}: {e}")
330
348
  # For the initial URL, we should raise the error
331
349
  if current_url == url and not crawler_result:
332
350
  # Wrap non-HTTP exceptions in a RequestError
@@ -380,7 +398,7 @@ class WebsiteReader(Reader):
380
398
  )
381
399
  return documents
382
400
  except (httpx.HTTPStatusError, httpx.RequestError) as e:
383
- logger.error(f"Error reading website {url}: {e}")
401
+ log_error(f"Error reading website {url}: {e}")
384
402
  raise
385
403
 
386
404
  async def async_read(self, url: str, name: Optional[str] = None) -> List[Document]:
@@ -433,5 +451,5 @@ class WebsiteReader(Reader):
433
451
 
434
452
  return documents
435
453
  except (httpx.HTTPStatusError, httpx.RequestError) as e:
436
- logger.error(f"Error reading website asynchronously {url}: {e}")
454
+ log_error(f"Error reading website asynchronously {url}: {e}")
437
455
  raise
agno/knowledge/reranker/__init__.py ADDED
@@ -0,0 +1,3 @@
1
+ from agno.knowledge.reranker.base import Reranker
2
+
3
+ __all__ = ["Reranker"]
agno/knowledge/types.py CHANGED
@@ -1,4 +1,7 @@
1
1
  from enum import Enum
2
+ from typing import Any
3
+
4
+ from pydantic import BaseModel
2
5
 
3
6
 
4
7
  class ContentType(str, Enum):
@@ -17,6 +20,7 @@ class ContentType(str, Enum):
17
20
  MARKDOWN = ".md"
18
21
  DOCX = ".docx"
19
22
  DOC = ".doc"
23
+ PPTX = ".pptx"
20
24
  JSON = ".json"
21
25
 
22
26
  # Spreadsheet file extensions
@@ -28,3 +32,8 @@ class ContentType(str, Enum):
28
32
  def get_content_type_enum(content_type_str: str) -> ContentType:
29
33
  """Convert a content type string to ContentType enum."""
30
34
  return ContentType(content_type_str)
35
+
36
+
37
+ class KnowledgeFilter(BaseModel):
38
+ key: str
39
+ value: Any
agno/knowledge/utils.py CHANGED
@@ -129,12 +129,32 @@ def get_chunker_info(chunker_key: str) -> Dict:
129
129
  class_name = chunker_class.__name__
130
130
  docstring = chunker_class.__doc__ or f"{class_name} chunking strategy"
131
131
 
132
+ # Check class __init__ signature for chunk_size and overlap parameters
133
+ metadata = {}
134
+ import inspect
135
+
136
+ try:
137
+ sig = inspect.signature(chunker_class.__init__)
138
+ param_names = set(sig.parameters.keys())
139
+
140
+ # If class has chunk_size or max_chunk_size parameter, set default chunk_size
141
+ if "chunk_size" in param_names or "max_chunk_size" in param_names:
142
+ metadata["chunk_size"] = 5000
143
+
144
+ # If class has overlap parameter, set default overlap
145
+ if "overlap" in param_names:
146
+ metadata["chunk_overlap"] = 0
147
+ except Exception:
148
+ # If we can't inspect, skip metadata
149
+ pass
150
+
132
151
  return {
133
152
  "key": chunker_key,
134
153
  "class_name": class_name,
135
154
  "name": chunker_key,
136
155
  "description": docstring.strip(),
137
156
  "strategy_type": strategy_type.value,
157
+ "metadata": metadata,
138
158
  }
139
159
  except ValueError:
140
160
  raise ValueError(f"Unknown chunker key: {chunker_key}")