agno 0.1.2__py3-none-any.whl → 2.3.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (723)
  1. agno/__init__.py +8 -0
  2. agno/agent/__init__.py +44 -5
  3. agno/agent/agent.py +10531 -2975
  4. agno/api/agent.py +14 -53
  5. agno/api/api.py +7 -46
  6. agno/api/evals.py +22 -0
  7. agno/api/os.py +17 -0
  8. agno/api/routes.py +6 -25
  9. agno/api/schemas/__init__.py +9 -0
  10. agno/api/schemas/agent.py +6 -9
  11. agno/api/schemas/evals.py +16 -0
  12. agno/api/schemas/os.py +14 -0
  13. agno/api/schemas/team.py +10 -10
  14. agno/api/schemas/utils.py +21 -0
  15. agno/api/schemas/workflows.py +16 -0
  16. agno/api/settings.py +53 -0
  17. agno/api/team.py +22 -26
  18. agno/api/workflow.py +28 -0
  19. agno/cloud/aws/base.py +214 -0
  20. agno/cloud/aws/s3/__init__.py +2 -0
  21. agno/cloud/aws/s3/api_client.py +43 -0
  22. agno/cloud/aws/s3/bucket.py +195 -0
  23. agno/cloud/aws/s3/object.py +57 -0
  24. agno/compression/__init__.py +3 -0
  25. agno/compression/manager.py +247 -0
  26. agno/culture/__init__.py +3 -0
  27. agno/culture/manager.py +956 -0
  28. agno/db/__init__.py +24 -0
  29. agno/db/async_postgres/__init__.py +3 -0
  30. agno/db/base.py +946 -0
  31. agno/db/dynamo/__init__.py +3 -0
  32. agno/db/dynamo/dynamo.py +2781 -0
  33. agno/db/dynamo/schemas.py +442 -0
  34. agno/db/dynamo/utils.py +743 -0
  35. agno/db/firestore/__init__.py +3 -0
  36. agno/db/firestore/firestore.py +2379 -0
  37. agno/db/firestore/schemas.py +181 -0
  38. agno/db/firestore/utils.py +376 -0
  39. agno/db/gcs_json/__init__.py +3 -0
  40. agno/db/gcs_json/gcs_json_db.py +1791 -0
  41. agno/db/gcs_json/utils.py +228 -0
  42. agno/db/in_memory/__init__.py +3 -0
  43. agno/db/in_memory/in_memory_db.py +1312 -0
  44. agno/db/in_memory/utils.py +230 -0
  45. agno/db/json/__init__.py +3 -0
  46. agno/db/json/json_db.py +1777 -0
  47. agno/db/json/utils.py +230 -0
  48. agno/db/migrations/manager.py +199 -0
  49. agno/db/migrations/v1_to_v2.py +635 -0
  50. agno/db/migrations/versions/v2_3_0.py +938 -0
  51. agno/db/mongo/__init__.py +17 -0
  52. agno/db/mongo/async_mongo.py +2760 -0
  53. agno/db/mongo/mongo.py +2597 -0
  54. agno/db/mongo/schemas.py +119 -0
  55. agno/db/mongo/utils.py +276 -0
  56. agno/db/mysql/__init__.py +4 -0
  57. agno/db/mysql/async_mysql.py +2912 -0
  58. agno/db/mysql/mysql.py +2923 -0
  59. agno/db/mysql/schemas.py +186 -0
  60. agno/db/mysql/utils.py +488 -0
  61. agno/db/postgres/__init__.py +4 -0
  62. agno/db/postgres/async_postgres.py +2579 -0
  63. agno/db/postgres/postgres.py +2870 -0
  64. agno/db/postgres/schemas.py +187 -0
  65. agno/db/postgres/utils.py +442 -0
  66. agno/db/redis/__init__.py +3 -0
  67. agno/db/redis/redis.py +2141 -0
  68. agno/db/redis/schemas.py +159 -0
  69. agno/db/redis/utils.py +346 -0
  70. agno/db/schemas/__init__.py +4 -0
  71. agno/db/schemas/culture.py +120 -0
  72. agno/db/schemas/evals.py +34 -0
  73. agno/db/schemas/knowledge.py +40 -0
  74. agno/db/schemas/memory.py +61 -0
  75. agno/db/singlestore/__init__.py +3 -0
  76. agno/db/singlestore/schemas.py +179 -0
  77. agno/db/singlestore/singlestore.py +2877 -0
  78. agno/db/singlestore/utils.py +384 -0
  79. agno/db/sqlite/__init__.py +4 -0
  80. agno/db/sqlite/async_sqlite.py +2911 -0
  81. agno/db/sqlite/schemas.py +181 -0
  82. agno/db/sqlite/sqlite.py +2908 -0
  83. agno/db/sqlite/utils.py +429 -0
  84. agno/db/surrealdb/__init__.py +3 -0
  85. agno/db/surrealdb/metrics.py +292 -0
  86. agno/db/surrealdb/models.py +334 -0
  87. agno/db/surrealdb/queries.py +71 -0
  88. agno/db/surrealdb/surrealdb.py +1908 -0
  89. agno/db/surrealdb/utils.py +147 -0
  90. agno/db/utils.py +118 -0
  91. agno/eval/__init__.py +24 -0
  92. agno/eval/accuracy.py +666 -276
  93. agno/eval/agent_as_judge.py +861 -0
  94. agno/eval/base.py +29 -0
  95. agno/eval/performance.py +779 -0
  96. agno/eval/reliability.py +241 -62
  97. agno/eval/utils.py +120 -0
  98. agno/exceptions.py +143 -1
  99. agno/filters.py +354 -0
  100. agno/guardrails/__init__.py +6 -0
  101. agno/guardrails/base.py +19 -0
  102. agno/guardrails/openai.py +144 -0
  103. agno/guardrails/pii.py +94 -0
  104. agno/guardrails/prompt_injection.py +52 -0
  105. agno/hooks/__init__.py +3 -0
  106. agno/hooks/decorator.py +164 -0
  107. agno/integrations/discord/__init__.py +3 -0
  108. agno/integrations/discord/client.py +203 -0
  109. agno/knowledge/__init__.py +5 -1
  110. agno/{document → knowledge}/chunking/agentic.py +22 -14
  111. agno/{document → knowledge}/chunking/document.py +2 -2
  112. agno/{document → knowledge}/chunking/fixed.py +7 -6
  113. agno/knowledge/chunking/markdown.py +151 -0
  114. agno/{document → knowledge}/chunking/recursive.py +15 -3
  115. agno/knowledge/chunking/row.py +39 -0
  116. agno/knowledge/chunking/semantic.py +91 -0
  117. agno/knowledge/chunking/strategy.py +165 -0
  118. agno/knowledge/content.py +74 -0
  119. agno/knowledge/document/__init__.py +5 -0
  120. agno/{document → knowledge/document}/base.py +12 -2
  121. agno/knowledge/embedder/__init__.py +5 -0
  122. agno/knowledge/embedder/aws_bedrock.py +343 -0
  123. agno/knowledge/embedder/azure_openai.py +210 -0
  124. agno/{embedder → knowledge/embedder}/base.py +8 -0
  125. agno/knowledge/embedder/cohere.py +323 -0
  126. agno/knowledge/embedder/fastembed.py +62 -0
  127. agno/{embedder → knowledge/embedder}/fireworks.py +1 -1
  128. agno/knowledge/embedder/google.py +258 -0
  129. agno/knowledge/embedder/huggingface.py +94 -0
  130. agno/knowledge/embedder/jina.py +182 -0
  131. agno/knowledge/embedder/langdb.py +22 -0
  132. agno/knowledge/embedder/mistral.py +206 -0
  133. agno/knowledge/embedder/nebius.py +13 -0
  134. agno/knowledge/embedder/ollama.py +154 -0
  135. agno/knowledge/embedder/openai.py +195 -0
  136. agno/knowledge/embedder/sentence_transformer.py +63 -0
  137. agno/{embedder → knowledge/embedder}/together.py +1 -1
  138. agno/knowledge/embedder/vllm.py +262 -0
  139. agno/knowledge/embedder/voyageai.py +165 -0
  140. agno/knowledge/knowledge.py +3006 -0
  141. agno/knowledge/reader/__init__.py +7 -0
  142. agno/knowledge/reader/arxiv_reader.py +81 -0
  143. agno/knowledge/reader/base.py +95 -0
  144. agno/knowledge/reader/csv_reader.py +164 -0
  145. agno/knowledge/reader/docx_reader.py +82 -0
  146. agno/knowledge/reader/field_labeled_csv_reader.py +290 -0
  147. agno/knowledge/reader/firecrawl_reader.py +201 -0
  148. agno/knowledge/reader/json_reader.py +88 -0
  149. agno/knowledge/reader/markdown_reader.py +137 -0
  150. agno/knowledge/reader/pdf_reader.py +431 -0
  151. agno/knowledge/reader/pptx_reader.py +101 -0
  152. agno/knowledge/reader/reader_factory.py +313 -0
  153. agno/knowledge/reader/s3_reader.py +89 -0
  154. agno/knowledge/reader/tavily_reader.py +193 -0
  155. agno/knowledge/reader/text_reader.py +127 -0
  156. agno/knowledge/reader/web_search_reader.py +325 -0
  157. agno/knowledge/reader/website_reader.py +455 -0
  158. agno/knowledge/reader/wikipedia_reader.py +91 -0
  159. agno/knowledge/reader/youtube_reader.py +78 -0
  160. agno/knowledge/remote_content/remote_content.py +88 -0
  161. agno/knowledge/reranker/__init__.py +3 -0
  162. agno/{reranker → knowledge/reranker}/base.py +1 -1
  163. agno/{reranker → knowledge/reranker}/cohere.py +2 -2
  164. agno/knowledge/reranker/infinity.py +195 -0
  165. agno/knowledge/reranker/sentence_transformer.py +54 -0
  166. agno/knowledge/types.py +39 -0
  167. agno/knowledge/utils.py +234 -0
  168. agno/media.py +439 -95
  169. agno/memory/__init__.py +16 -3
  170. agno/memory/manager.py +1474 -123
  171. agno/memory/strategies/__init__.py +15 -0
  172. agno/memory/strategies/base.py +66 -0
  173. agno/memory/strategies/summarize.py +196 -0
  174. agno/memory/strategies/types.py +37 -0
  175. agno/models/aimlapi/__init__.py +5 -0
  176. agno/models/aimlapi/aimlapi.py +62 -0
  177. agno/models/anthropic/__init__.py +4 -0
  178. agno/models/anthropic/claude.py +960 -496
  179. agno/models/aws/__init__.py +15 -0
  180. agno/models/aws/bedrock.py +686 -451
  181. agno/models/aws/claude.py +190 -183
  182. agno/models/azure/__init__.py +18 -1
  183. agno/models/azure/ai_foundry.py +489 -0
  184. agno/models/azure/openai_chat.py +89 -40
  185. agno/models/base.py +2477 -550
  186. agno/models/cerebras/__init__.py +12 -0
  187. agno/models/cerebras/cerebras.py +565 -0
  188. agno/models/cerebras/cerebras_openai.py +131 -0
  189. agno/models/cohere/__init__.py +4 -0
  190. agno/models/cohere/chat.py +306 -492
  191. agno/models/cometapi/__init__.py +5 -0
  192. agno/models/cometapi/cometapi.py +74 -0
  193. agno/models/dashscope/__init__.py +5 -0
  194. agno/models/dashscope/dashscope.py +90 -0
  195. agno/models/deepinfra/__init__.py +5 -0
  196. agno/models/deepinfra/deepinfra.py +45 -0
  197. agno/models/deepseek/__init__.py +4 -0
  198. agno/models/deepseek/deepseek.py +110 -9
  199. agno/models/fireworks/__init__.py +4 -0
  200. agno/models/fireworks/fireworks.py +19 -22
  201. agno/models/google/__init__.py +3 -7
  202. agno/models/google/gemini.py +1717 -662
  203. agno/models/google/utils.py +22 -0
  204. agno/models/groq/__init__.py +4 -0
  205. agno/models/groq/groq.py +391 -666
  206. agno/models/huggingface/__init__.py +4 -0
  207. agno/models/huggingface/huggingface.py +266 -538
  208. agno/models/ibm/__init__.py +5 -0
  209. agno/models/ibm/watsonx.py +432 -0
  210. agno/models/internlm/__init__.py +3 -0
  211. agno/models/internlm/internlm.py +20 -3
  212. agno/models/langdb/__init__.py +1 -0
  213. agno/models/langdb/langdb.py +60 -0
  214. agno/models/litellm/__init__.py +14 -0
  215. agno/models/litellm/chat.py +503 -0
  216. agno/models/litellm/litellm_openai.py +42 -0
  217. agno/models/llama_cpp/__init__.py +5 -0
  218. agno/models/llama_cpp/llama_cpp.py +22 -0
  219. agno/models/lmstudio/__init__.py +5 -0
  220. agno/models/lmstudio/lmstudio.py +25 -0
  221. agno/models/message.py +361 -39
  222. agno/models/meta/__init__.py +12 -0
  223. agno/models/meta/llama.py +502 -0
  224. agno/models/meta/llama_openai.py +79 -0
  225. agno/models/metrics.py +120 -0
  226. agno/models/mistral/__init__.py +4 -0
  227. agno/models/mistral/mistral.py +293 -393
  228. agno/models/nebius/__init__.py +3 -0
  229. agno/models/nebius/nebius.py +53 -0
  230. agno/models/nexus/__init__.py +3 -0
  231. agno/models/nexus/nexus.py +22 -0
  232. agno/models/nvidia/__init__.py +4 -0
  233. agno/models/nvidia/nvidia.py +22 -3
  234. agno/models/ollama/__init__.py +4 -2
  235. agno/models/ollama/chat.py +257 -492
  236. agno/models/openai/__init__.py +7 -0
  237. agno/models/openai/chat.py +725 -770
  238. agno/models/openai/like.py +16 -2
  239. agno/models/openai/responses.py +1121 -0
  240. agno/models/openrouter/__init__.py +4 -0
  241. agno/models/openrouter/openrouter.py +62 -5
  242. agno/models/perplexity/__init__.py +5 -0
  243. agno/models/perplexity/perplexity.py +203 -0
  244. agno/models/portkey/__init__.py +3 -0
  245. agno/models/portkey/portkey.py +82 -0
  246. agno/models/requesty/__init__.py +5 -0
  247. agno/models/requesty/requesty.py +69 -0
  248. agno/models/response.py +177 -7
  249. agno/models/sambanova/__init__.py +4 -0
  250. agno/models/sambanova/sambanova.py +23 -4
  251. agno/models/siliconflow/__init__.py +5 -0
  252. agno/models/siliconflow/siliconflow.py +42 -0
  253. agno/models/together/__init__.py +4 -0
  254. agno/models/together/together.py +21 -164
  255. agno/models/utils.py +266 -0
  256. agno/models/vercel/__init__.py +3 -0
  257. agno/models/vercel/v0.py +43 -0
  258. agno/models/vertexai/__init__.py +0 -1
  259. agno/models/vertexai/claude.py +190 -0
  260. agno/models/vllm/__init__.py +3 -0
  261. agno/models/vllm/vllm.py +83 -0
  262. agno/models/xai/__init__.py +2 -0
  263. agno/models/xai/xai.py +111 -7
  264. agno/os/__init__.py +3 -0
  265. agno/os/app.py +1027 -0
  266. agno/os/auth.py +244 -0
  267. agno/os/config.py +126 -0
  268. agno/os/interfaces/__init__.py +1 -0
  269. agno/os/interfaces/a2a/__init__.py +3 -0
  270. agno/os/interfaces/a2a/a2a.py +42 -0
  271. agno/os/interfaces/a2a/router.py +249 -0
  272. agno/os/interfaces/a2a/utils.py +924 -0
  273. agno/os/interfaces/agui/__init__.py +3 -0
  274. agno/os/interfaces/agui/agui.py +47 -0
  275. agno/os/interfaces/agui/router.py +147 -0
  276. agno/os/interfaces/agui/utils.py +574 -0
  277. agno/os/interfaces/base.py +25 -0
  278. agno/os/interfaces/slack/__init__.py +3 -0
  279. agno/os/interfaces/slack/router.py +148 -0
  280. agno/os/interfaces/slack/security.py +30 -0
  281. agno/os/interfaces/slack/slack.py +47 -0
  282. agno/os/interfaces/whatsapp/__init__.py +3 -0
  283. agno/os/interfaces/whatsapp/router.py +210 -0
  284. agno/os/interfaces/whatsapp/security.py +55 -0
  285. agno/os/interfaces/whatsapp/whatsapp.py +36 -0
  286. agno/os/mcp.py +293 -0
  287. agno/os/middleware/__init__.py +9 -0
  288. agno/os/middleware/jwt.py +797 -0
  289. agno/os/router.py +258 -0
  290. agno/os/routers/__init__.py +3 -0
  291. agno/os/routers/agents/__init__.py +3 -0
  292. agno/os/routers/agents/router.py +599 -0
  293. agno/os/routers/agents/schema.py +261 -0
  294. agno/os/routers/evals/__init__.py +3 -0
  295. agno/os/routers/evals/evals.py +450 -0
  296. agno/os/routers/evals/schemas.py +174 -0
  297. agno/os/routers/evals/utils.py +231 -0
  298. agno/os/routers/health.py +31 -0
  299. agno/os/routers/home.py +52 -0
  300. agno/os/routers/knowledge/__init__.py +3 -0
  301. agno/os/routers/knowledge/knowledge.py +1008 -0
  302. agno/os/routers/knowledge/schemas.py +178 -0
  303. agno/os/routers/memory/__init__.py +3 -0
  304. agno/os/routers/memory/memory.py +661 -0
  305. agno/os/routers/memory/schemas.py +88 -0
  306. agno/os/routers/metrics/__init__.py +3 -0
  307. agno/os/routers/metrics/metrics.py +190 -0
  308. agno/os/routers/metrics/schemas.py +47 -0
  309. agno/os/routers/session/__init__.py +3 -0
  310. agno/os/routers/session/session.py +997 -0
  311. agno/os/routers/teams/__init__.py +3 -0
  312. agno/os/routers/teams/router.py +512 -0
  313. agno/os/routers/teams/schema.py +257 -0
  314. agno/os/routers/traces/__init__.py +3 -0
  315. agno/os/routers/traces/schemas.py +414 -0
  316. agno/os/routers/traces/traces.py +499 -0
  317. agno/os/routers/workflows/__init__.py +3 -0
  318. agno/os/routers/workflows/router.py +624 -0
  319. agno/os/routers/workflows/schema.py +75 -0
  320. agno/os/schema.py +534 -0
  321. agno/os/scopes.py +469 -0
  322. agno/{playground → os}/settings.py +7 -15
  323. agno/os/utils.py +973 -0
  324. agno/reasoning/anthropic.py +80 -0
  325. agno/reasoning/azure_ai_foundry.py +67 -0
  326. agno/reasoning/deepseek.py +63 -0
  327. agno/reasoning/default.py +97 -0
  328. agno/reasoning/gemini.py +73 -0
  329. agno/reasoning/groq.py +71 -0
  330. agno/reasoning/helpers.py +24 -1
  331. agno/reasoning/ollama.py +67 -0
  332. agno/reasoning/openai.py +86 -0
  333. agno/reasoning/step.py +2 -1
  334. agno/reasoning/vertexai.py +76 -0
  335. agno/run/__init__.py +6 -0
  336. agno/run/agent.py +822 -0
  337. agno/run/base.py +247 -0
  338. agno/run/cancel.py +81 -0
  339. agno/run/requirement.py +181 -0
  340. agno/run/team.py +767 -0
  341. agno/run/workflow.py +708 -0
  342. agno/session/__init__.py +10 -0
  343. agno/session/agent.py +260 -0
  344. agno/session/summary.py +265 -0
  345. agno/session/team.py +342 -0
  346. agno/session/workflow.py +501 -0
  347. agno/table.py +10 -0
  348. agno/team/__init__.py +37 -0
  349. agno/team/team.py +9536 -0
  350. agno/tools/__init__.py +7 -0
  351. agno/tools/agentql.py +120 -0
  352. agno/tools/airflow.py +22 -12
  353. agno/tools/api.py +122 -0
  354. agno/tools/apify.py +276 -83
  355. agno/tools/{arxiv_toolkit.py → arxiv.py} +20 -12
  356. agno/tools/aws_lambda.py +28 -7
  357. agno/tools/aws_ses.py +66 -0
  358. agno/tools/baidusearch.py +11 -4
  359. agno/tools/bitbucket.py +292 -0
  360. agno/tools/brandfetch.py +213 -0
  361. agno/tools/bravesearch.py +106 -0
  362. agno/tools/brightdata.py +367 -0
  363. agno/tools/browserbase.py +209 -0
  364. agno/tools/calcom.py +32 -23
  365. agno/tools/calculator.py +24 -37
  366. agno/tools/cartesia.py +187 -0
  367. agno/tools/{clickup_tool.py → clickup.py} +17 -28
  368. agno/tools/confluence.py +91 -26
  369. agno/tools/crawl4ai.py +139 -43
  370. agno/tools/csv_toolkit.py +28 -22
  371. agno/tools/dalle.py +36 -22
  372. agno/tools/daytona.py +475 -0
  373. agno/tools/decorator.py +169 -14
  374. agno/tools/desi_vocal.py +23 -11
  375. agno/tools/discord.py +32 -29
  376. agno/tools/docker.py +716 -0
  377. agno/tools/duckdb.py +76 -81
  378. agno/tools/duckduckgo.py +43 -40
  379. agno/tools/e2b.py +703 -0
  380. agno/tools/eleven_labs.py +65 -54
  381. agno/tools/email.py +13 -5
  382. agno/tools/evm.py +129 -0
  383. agno/tools/exa.py +324 -42
  384. agno/tools/fal.py +39 -35
  385. agno/tools/file.py +196 -30
  386. agno/tools/file_generation.py +356 -0
  387. agno/tools/financial_datasets.py +288 -0
  388. agno/tools/firecrawl.py +108 -33
  389. agno/tools/function.py +960 -122
  390. agno/tools/giphy.py +34 -12
  391. agno/tools/github.py +1294 -97
  392. agno/tools/gmail.py +922 -0
  393. agno/tools/google_bigquery.py +117 -0
  394. agno/tools/google_drive.py +271 -0
  395. agno/tools/google_maps.py +253 -0
  396. agno/tools/googlecalendar.py +607 -107
  397. agno/tools/googlesheets.py +377 -0
  398. agno/tools/hackernews.py +20 -12
  399. agno/tools/jina.py +24 -14
  400. agno/tools/jira.py +48 -19
  401. agno/tools/knowledge.py +218 -0
  402. agno/tools/linear.py +82 -43
  403. agno/tools/linkup.py +58 -0
  404. agno/tools/local_file_system.py +15 -7
  405. agno/tools/lumalab.py +41 -26
  406. agno/tools/mcp/__init__.py +10 -0
  407. agno/tools/mcp/mcp.py +331 -0
  408. agno/tools/mcp/multi_mcp.py +347 -0
  409. agno/tools/mcp/params.py +24 -0
  410. agno/tools/mcp_toolbox.py +284 -0
  411. agno/tools/mem0.py +193 -0
  412. agno/tools/memory.py +419 -0
  413. agno/tools/mlx_transcribe.py +11 -9
  414. agno/tools/models/azure_openai.py +190 -0
  415. agno/tools/models/gemini.py +203 -0
  416. agno/tools/models/groq.py +158 -0
  417. agno/tools/models/morph.py +186 -0
  418. agno/tools/models/nebius.py +124 -0
  419. agno/tools/models_labs.py +163 -82
  420. agno/tools/moviepy_video.py +18 -13
  421. agno/tools/nano_banana.py +151 -0
  422. agno/tools/neo4j.py +134 -0
  423. agno/tools/newspaper.py +15 -4
  424. agno/tools/newspaper4k.py +19 -6
  425. agno/tools/notion.py +204 -0
  426. agno/tools/openai.py +181 -17
  427. agno/tools/openbb.py +27 -20
  428. agno/tools/opencv.py +321 -0
  429. agno/tools/openweather.py +233 -0
  430. agno/tools/oxylabs.py +385 -0
  431. agno/tools/pandas.py +25 -15
  432. agno/tools/parallel.py +314 -0
  433. agno/tools/postgres.py +238 -185
  434. agno/tools/pubmed.py +125 -13
  435. agno/tools/python.py +48 -35
  436. agno/tools/reasoning.py +283 -0
  437. agno/tools/reddit.py +207 -29
  438. agno/tools/redshift.py +406 -0
  439. agno/tools/replicate.py +69 -26
  440. agno/tools/resend.py +11 -6
  441. agno/tools/scrapegraph.py +179 -19
  442. agno/tools/searxng.py +23 -31
  443. agno/tools/serpapi.py +15 -10
  444. agno/tools/serper.py +255 -0
  445. agno/tools/shell.py +23 -12
  446. agno/tools/shopify.py +1519 -0
  447. agno/tools/slack.py +56 -14
  448. agno/tools/sleep.py +8 -6
  449. agno/tools/spider.py +35 -11
  450. agno/tools/spotify.py +919 -0
  451. agno/tools/sql.py +34 -19
  452. agno/tools/tavily.py +158 -8
  453. agno/tools/telegram.py +18 -8
  454. agno/tools/todoist.py +218 -0
  455. agno/tools/toolkit.py +134 -9
  456. agno/tools/trafilatura.py +388 -0
  457. agno/tools/trello.py +25 -28
  458. agno/tools/twilio.py +18 -9
  459. agno/tools/user_control_flow.py +78 -0
  460. agno/tools/valyu.py +228 -0
  461. agno/tools/visualization.py +467 -0
  462. agno/tools/webbrowser.py +28 -0
  463. agno/tools/webex.py +76 -0
  464. agno/tools/website.py +23 -19
  465. agno/tools/webtools.py +45 -0
  466. agno/tools/whatsapp.py +286 -0
  467. agno/tools/wikipedia.py +28 -19
  468. agno/tools/workflow.py +285 -0
  469. agno/tools/{twitter.py → x.py} +142 -46
  470. agno/tools/yfinance.py +41 -39
  471. agno/tools/youtube.py +34 -17
  472. agno/tools/zendesk.py +15 -5
  473. agno/tools/zep.py +454 -0
  474. agno/tools/zoom.py +86 -37
  475. agno/tracing/__init__.py +12 -0
  476. agno/tracing/exporter.py +157 -0
  477. agno/tracing/schemas.py +276 -0
  478. agno/tracing/setup.py +111 -0
  479. agno/utils/agent.py +938 -0
  480. agno/utils/audio.py +37 -1
  481. agno/utils/certs.py +27 -0
  482. agno/utils/code_execution.py +11 -0
  483. agno/utils/common.py +103 -20
  484. agno/utils/cryptography.py +22 -0
  485. agno/utils/dttm.py +33 -0
  486. agno/utils/events.py +700 -0
  487. agno/utils/functions.py +107 -37
  488. agno/utils/gemini.py +426 -0
  489. agno/utils/hooks.py +171 -0
  490. agno/utils/http.py +185 -0
  491. agno/utils/json_schema.py +159 -37
  492. agno/utils/knowledge.py +36 -0
  493. agno/utils/location.py +19 -0
  494. agno/utils/log.py +221 -8
  495. agno/utils/mcp.py +214 -0
  496. agno/utils/media.py +335 -14
  497. agno/utils/merge_dict.py +22 -1
  498. agno/utils/message.py +77 -2
  499. agno/utils/models/ai_foundry.py +50 -0
  500. agno/utils/models/claude.py +373 -0
  501. agno/utils/models/cohere.py +94 -0
  502. agno/utils/models/llama.py +85 -0
  503. agno/utils/models/mistral.py +100 -0
  504. agno/utils/models/openai_responses.py +140 -0
  505. agno/utils/models/schema_utils.py +153 -0
  506. agno/utils/models/watsonx.py +41 -0
  507. agno/utils/openai.py +257 -0
  508. agno/utils/pickle.py +1 -1
  509. agno/utils/pprint.py +124 -8
  510. agno/utils/print_response/agent.py +930 -0
  511. agno/utils/print_response/team.py +1914 -0
  512. agno/utils/print_response/workflow.py +1668 -0
  513. agno/utils/prompts.py +111 -0
  514. agno/utils/reasoning.py +108 -0
  515. agno/utils/response.py +163 -0
  516. agno/utils/serialize.py +32 -0
  517. agno/utils/shell.py +4 -4
  518. agno/utils/streamlit.py +487 -0
  519. agno/utils/string.py +204 -51
  520. agno/utils/team.py +139 -0
  521. agno/utils/timer.py +9 -2
  522. agno/utils/tokens.py +657 -0
  523. agno/utils/tools.py +19 -1
  524. agno/utils/whatsapp.py +305 -0
  525. agno/utils/yaml_io.py +3 -3
  526. agno/vectordb/__init__.py +2 -0
  527. agno/vectordb/base.py +87 -9
  528. agno/vectordb/cassandra/__init__.py +5 -1
  529. agno/vectordb/cassandra/cassandra.py +383 -27
  530. agno/vectordb/chroma/__init__.py +4 -0
  531. agno/vectordb/chroma/chromadb.py +748 -83
  532. agno/vectordb/clickhouse/__init__.py +7 -1
  533. agno/vectordb/clickhouse/clickhousedb.py +554 -53
  534. agno/vectordb/couchbase/__init__.py +3 -0
  535. agno/vectordb/couchbase/couchbase.py +1446 -0
  536. agno/vectordb/lancedb/__init__.py +5 -0
  537. agno/vectordb/lancedb/lance_db.py +730 -98
  538. agno/vectordb/langchaindb/__init__.py +5 -0
  539. agno/vectordb/langchaindb/langchaindb.py +163 -0
  540. agno/vectordb/lightrag/__init__.py +5 -0
  541. agno/vectordb/lightrag/lightrag.py +388 -0
  542. agno/vectordb/llamaindex/__init__.py +3 -0
  543. agno/vectordb/llamaindex/llamaindexdb.py +166 -0
  544. agno/vectordb/milvus/__init__.py +3 -0
  545. agno/vectordb/milvus/milvus.py +966 -78
  546. agno/vectordb/mongodb/__init__.py +9 -1
  547. agno/vectordb/mongodb/mongodb.py +1175 -172
  548. agno/vectordb/pgvector/__init__.py +8 -0
  549. agno/vectordb/pgvector/pgvector.py +599 -115
  550. agno/vectordb/pineconedb/__init__.py +5 -1
  551. agno/vectordb/pineconedb/pineconedb.py +406 -43
  552. agno/vectordb/qdrant/__init__.py +4 -0
  553. agno/vectordb/qdrant/qdrant.py +914 -61
  554. agno/vectordb/redis/__init__.py +9 -0
  555. agno/vectordb/redis/redisdb.py +682 -0
  556. agno/vectordb/singlestore/__init__.py +8 -1
  557. agno/vectordb/singlestore/singlestore.py +771 -0
  558. agno/vectordb/surrealdb/__init__.py +3 -0
  559. agno/vectordb/surrealdb/surrealdb.py +663 -0
  560. agno/vectordb/upstashdb/__init__.py +5 -0
  561. agno/vectordb/upstashdb/upstashdb.py +718 -0
  562. agno/vectordb/weaviate/__init__.py +8 -0
  563. agno/vectordb/weaviate/index.py +15 -0
  564. agno/vectordb/weaviate/weaviate.py +1009 -0
  565. agno/workflow/__init__.py +23 -1
  566. agno/workflow/agent.py +299 -0
  567. agno/workflow/condition.py +759 -0
  568. agno/workflow/loop.py +756 -0
  569. agno/workflow/parallel.py +853 -0
  570. agno/workflow/router.py +723 -0
  571. agno/workflow/step.py +1564 -0
  572. agno/workflow/steps.py +613 -0
  573. agno/workflow/types.py +556 -0
  574. agno/workflow/workflow.py +4327 -514
  575. agno-2.3.13.dist-info/METADATA +639 -0
  576. agno-2.3.13.dist-info/RECORD +613 -0
  577. {agno-0.1.2.dist-info → agno-2.3.13.dist-info}/WHEEL +1 -1
  578. agno-2.3.13.dist-info/licenses/LICENSE +201 -0
  579. agno/api/playground.py +0 -91
  580. agno/api/schemas/playground.py +0 -22
  581. agno/api/schemas/user.py +0 -22
  582. agno/api/schemas/workspace.py +0 -46
  583. agno/api/user.py +0 -160
  584. agno/api/workspace.py +0 -151
  585. agno/cli/auth_server.py +0 -118
  586. agno/cli/config.py +0 -275
  587. agno/cli/console.py +0 -88
  588. agno/cli/credentials.py +0 -23
  589. agno/cli/entrypoint.py +0 -571
  590. agno/cli/operator.py +0 -355
  591. agno/cli/settings.py +0 -85
  592. agno/cli/ws/ws_cli.py +0 -817
  593. agno/constants.py +0 -13
  594. agno/document/__init__.py +0 -1
  595. agno/document/chunking/semantic.py +0 -47
  596. agno/document/chunking/strategy.py +0 -31
  597. agno/document/reader/__init__.py +0 -1
  598. agno/document/reader/arxiv_reader.py +0 -41
  599. agno/document/reader/base.py +0 -22
  600. agno/document/reader/csv_reader.py +0 -84
  601. agno/document/reader/docx_reader.py +0 -46
  602. agno/document/reader/firecrawl_reader.py +0 -99
  603. agno/document/reader/json_reader.py +0 -43
  604. agno/document/reader/pdf_reader.py +0 -219
  605. agno/document/reader/s3/pdf_reader.py +0 -46
  606. agno/document/reader/s3/text_reader.py +0 -51
  607. agno/document/reader/text_reader.py +0 -41
  608. agno/document/reader/website_reader.py +0 -175
  609. agno/document/reader/youtube_reader.py +0 -50
  610. agno/embedder/__init__.py +0 -1
  611. agno/embedder/azure_openai.py +0 -86
  612. agno/embedder/cohere.py +0 -72
  613. agno/embedder/fastembed.py +0 -37
  614. agno/embedder/google.py +0 -73
  615. agno/embedder/huggingface.py +0 -54
  616. agno/embedder/mistral.py +0 -80
  617. agno/embedder/ollama.py +0 -57
  618. agno/embedder/openai.py +0 -74
  619. agno/embedder/sentence_transformer.py +0 -38
  620. agno/embedder/voyageai.py +0 -64
  621. agno/eval/perf.py +0 -201
  622. agno/file/__init__.py +0 -1
  623. agno/file/file.py +0 -16
  624. agno/file/local/csv.py +0 -32
  625. agno/file/local/txt.py +0 -19
  626. agno/infra/app.py +0 -240
  627. agno/infra/base.py +0 -144
  628. agno/infra/context.py +0 -20
  629. agno/infra/db_app.py +0 -52
  630. agno/infra/resource.py +0 -205
  631. agno/infra/resources.py +0 -55
  632. agno/knowledge/agent.py +0 -230
  633. agno/knowledge/arxiv.py +0 -22
  634. agno/knowledge/combined.py +0 -22
  635. agno/knowledge/csv.py +0 -28
  636. agno/knowledge/csv_url.py +0 -19
  637. agno/knowledge/document.py +0 -20
  638. agno/knowledge/docx.py +0 -30
  639. agno/knowledge/json.py +0 -28
  640. agno/knowledge/langchain.py +0 -71
  641. agno/knowledge/llamaindex.py +0 -66
  642. agno/knowledge/pdf.py +0 -28
  643. agno/knowledge/pdf_url.py +0 -26
  644. agno/knowledge/s3/base.py +0 -60
  645. agno/knowledge/s3/pdf.py +0 -21
  646. agno/knowledge/s3/text.py +0 -23
  647. agno/knowledge/text.py +0 -30
  648. agno/knowledge/website.py +0 -88
  649. agno/knowledge/wikipedia.py +0 -31
  650. agno/knowledge/youtube.py +0 -22
  651. agno/memory/agent.py +0 -392
  652. agno/memory/classifier.py +0 -104
  653. agno/memory/db/__init__.py +0 -1
  654. agno/memory/db/base.py +0 -42
  655. agno/memory/db/mongodb.py +0 -189
  656. agno/memory/db/postgres.py +0 -203
  657. agno/memory/db/sqlite.py +0 -193
  658. agno/memory/memory.py +0 -15
  659. agno/memory/row.py +0 -36
  660. agno/memory/summarizer.py +0 -192
  661. agno/memory/summary.py +0 -19
  662. agno/memory/workflow.py +0 -38
  663. agno/models/google/gemini_openai.py +0 -26
  664. agno/models/ollama/hermes.py +0 -221
  665. agno/models/ollama/tools.py +0 -362
  666. agno/models/vertexai/gemini.py +0 -595
  667. agno/playground/__init__.py +0 -3
  668. agno/playground/async_router.py +0 -421
  669. agno/playground/deploy.py +0 -249
  670. agno/playground/operator.py +0 -92
  671. agno/playground/playground.py +0 -91
  672. agno/playground/schemas.py +0 -76
  673. agno/playground/serve.py +0 -55
  674. agno/playground/sync_router.py +0 -405
  675. agno/reasoning/agent.py +0 -68
  676. agno/run/response.py +0 -112
  677. agno/storage/agent/__init__.py +0 -0
  678. agno/storage/agent/base.py +0 -38
  679. agno/storage/agent/dynamodb.py +0 -350
  680. agno/storage/agent/json.py +0 -92
  681. agno/storage/agent/mongodb.py +0 -228
  682. agno/storage/agent/postgres.py +0 -367
  683. agno/storage/agent/session.py +0 -79
  684. agno/storage/agent/singlestore.py +0 -303
  685. agno/storage/agent/sqlite.py +0 -357
  686. agno/storage/agent/yaml.py +0 -93
  687. agno/storage/workflow/__init__.py +0 -0
  688. agno/storage/workflow/base.py +0 -40
  689. agno/storage/workflow/mongodb.py +0 -233
  690. agno/storage/workflow/postgres.py +0 -366
  691. agno/storage/workflow/session.py +0 -60
  692. agno/storage/workflow/sqlite.py +0 -359
  693. agno/tools/googlesearch.py +0 -88
  694. agno/utils/defaults.py +0 -57
  695. agno/utils/filesystem.py +0 -39
  696. agno/utils/git.py +0 -52
  697. agno/utils/json_io.py +0 -30
  698. agno/utils/load_env.py +0 -19
  699. agno/utils/py_io.py +0 -19
  700. agno/utils/pyproject.py +0 -18
  701. agno/utils/resource_filter.py +0 -31
  702. agno/vectordb/singlestore/s2vectordb.py +0 -390
  703. agno/vectordb/singlestore/s2vectordb2.py +0 -355
  704. agno/workspace/__init__.py +0 -0
  705. agno/workspace/config.py +0 -325
  706. agno/workspace/enums.py +0 -6
  707. agno/workspace/helpers.py +0 -48
  708. agno/workspace/operator.py +0 -758
  709. agno/workspace/settings.py +0 -63
  710. agno-0.1.2.dist-info/LICENSE +0 -375
  711. agno-0.1.2.dist-info/METADATA +0 -502
  712. agno-0.1.2.dist-info/RECORD +0 -352
  713. agno-0.1.2.dist-info/entry_points.txt +0 -3
  714. /agno/{cli → db/migrations}/__init__.py +0 -0
  715. /agno/{cli/ws → db/migrations/versions}/__init__.py +0 -0
  716. /agno/{document/chunking/__init__.py → db/schemas/metrics.py} +0 -0
  717. /agno/{document/reader/s3 → integrations}/__init__.py +0 -0
  718. /agno/{file/local → knowledge/chunking}/__init__.py +0 -0
  719. /agno/{infra → knowledge/remote_content}/__init__.py +0 -0
  720. /agno/{knowledge/s3 → tools/models}/__init__.py +0 -0
  721. /agno/{reranker → utils/models}/__init__.py +0 -0
  722. /agno/{storage → utils/print_response}/__init__.py +0 -0
  723. {agno-0.1.2.dist-info → agno-2.3.13.dist-info}/top_level.txt +0 -0
@@ -1,15 +1,21 @@
1
+ import asyncio
1
2
  from hashlib import md5
2
3
  from math import sqrt
3
4
  from typing import Any, Dict, List, Optional, Union, cast
4
5
 
6
+ from agno.utils.string import generate_id
7
+
5
8
  try:
9
+ from sqlalchemy import and_, not_, or_, update
6
10
  from sqlalchemy.dialects import postgresql
7
11
  from sqlalchemy.engine import Engine, create_engine
8
12
  from sqlalchemy.inspection import inspect
9
13
  from sqlalchemy.orm import Session, scoped_session, sessionmaker
10
14
  from sqlalchemy.schema import Column, Index, MetaData, Table
15
+ from sqlalchemy.sql.elements import ColumnElement
11
16
  from sqlalchemy.sql.expression import bindparam, desc, func, select, text
12
- from sqlalchemy.types import DateTime, String
17
+ from sqlalchemy.types import DateTime, Integer, String
18
+
13
19
  except ImportError:
14
20
  raise ImportError("`sqlalchemy` not installed. Please install using `pip install sqlalchemy psycopg`")
15
21
 
@@ -18,10 +24,11 @@ try:
18
24
  except ImportError:
19
25
  raise ImportError("`pgvector` not installed. Please install using `pip install pgvector`")
20
26
 
21
- from agno.document import Document
22
- from agno.embedder import Embedder
23
- from agno.reranker.base import Reranker
24
- from agno.utils.log import logger
27
+ from agno.filters import FilterExpr
28
+ from agno.knowledge.document import Document
29
+ from agno.knowledge.embedder import Embedder
30
+ from agno.knowledge.reranker.base import Reranker
31
+ from agno.utils.log import log_debug, log_error, log_info, log_warning
25
32
  from agno.vectordb.base import VectorDb
26
33
  from agno.vectordb.distance import Distance
27
34
  from agno.vectordb.pgvector.index import HNSW, Ivfflat
@@ -40,6 +47,9 @@ class PgVector(VectorDb):
40
47
  self,
41
48
  table_name: str,
42
49
  schema: str = "ai",
50
+ name: Optional[str] = None,
51
+ description: Optional[str] = None,
52
+ id: Optional[str] = None,
43
53
  db_url: Optional[str] = None,
44
54
  db_engine: Optional[Engine] = None,
45
55
  embedder: Optional[Embedder] = None,
@@ -52,6 +62,7 @@ class PgVector(VectorDb):
52
62
  schema_version: int = 1,
53
63
  auto_upgrade_schema: bool = False,
54
64
  reranker: Optional[Reranker] = None,
65
+ create_schema: bool = True,
55
66
  ):
56
67
  """
57
68
  Initialize the PgVector instance.
@@ -59,6 +70,8 @@ class PgVector(VectorDb):
59
70
  Args:
60
71
  table_name (str): Name of the table to store vector data.
61
72
  schema (str): Database schema name.
73
+ name (Optional[str]): Name of the vector database.
74
+ description (Optional[str]): Description of the vector database.
62
75
  db_url (Optional[str]): Database connection URL.
63
76
  db_engine (Optional[Engine]): SQLAlchemy database engine.
64
77
  embedder (Optional[Embedder]): Embedder instance for creating embeddings.
@@ -70,6 +83,8 @@ class PgVector(VectorDb):
70
83
  content_language (str): Language for full-text search.
71
84
  schema_version (int): Version of the database schema.
72
85
  auto_upgrade_schema (bool): Automatically upgrade schema if True.
86
+ create_schema (bool): Whether to automatically create the database schema if it doesn't exist.
87
+ Set to False if schema is managed externally (e.g., via migrations). Defaults to True.
73
88
  """
74
89
  if not table_name:
75
90
  raise ValueError("Table name must be provided.")
@@ -77,13 +92,22 @@ class PgVector(VectorDb):
77
92
  if db_engine is None and db_url is None:
78
93
  raise ValueError("Either 'db_url' or 'db_engine' must be provided.")
79
94
 
95
+ if id is None:
96
+ base_seed = db_url or str(db_engine.url) # type: ignore
97
+ schema_suffix = table_name if table_name is not None else "ai"
98
+ seed = f"{base_seed}#{schema_suffix}"
99
+ id = generate_id(seed)
100
+
101
+ # Initialize base class with name and description
102
+ super().__init__(id=id, name=name, description=description)
103
+
80
104
  if db_engine is None:
81
105
  if db_url is None:
82
106
  raise ValueError("Must provide 'db_url' if 'db_engine' is None.")
83
107
  try:
84
108
  db_engine = create_engine(db_url)
85
109
  except Exception as e:
86
- logger.error(f"Failed to create engine from 'db_url': {e}")
110
+ log_error(f"Failed to create engine from 'db_url': {e}")
87
111
  raise
88
112
 
89
113
  # Database settings
@@ -95,9 +119,10 @@ class PgVector(VectorDb):
95
119
 
96
120
  # Embedder for embedding the document contents
97
121
  if embedder is None:
98
- from agno.embedder.openai import OpenAIEmbedder
122
+ from agno.knowledge.embedder.openai import OpenAIEmbedder
99
123
 
100
124
  embedder = OpenAIEmbedder()
125
+ log_info("Embedder not provided, using OpenAIEmbedder as default.")
101
126
  self.embedder: Embedder = embedder
102
127
  self.dimensions: Optional[int] = self.embedder.dimensions
103
128
 
@@ -125,11 +150,14 @@ class PgVector(VectorDb):
125
150
  # Reranker instance
126
151
  self.reranker: Optional[Reranker] = reranker
127
152
 
153
+ # Schema creation flag
154
+ self.create_schema: bool = create_schema
155
+
128
156
  # Database session
129
157
  self.Session: scoped_session = scoped_session(sessionmaker(bind=self.db_engine))
130
158
  # Database table
131
159
  self.table: Table = self.get_table()
132
- logger.debug(f"Initialized PgVector with table '{self.schema}.{self.table_name}'")
160
+ log_debug(f"Initialized PgVector with table '{self.schema}.{self.table_name}'")
133
161
 
134
162
  def get_table_v1(self) -> Table:
135
163
  """
@@ -153,6 +181,7 @@ class PgVector(VectorDb):
153
181
  Column("created_at", DateTime(timezone=True), server_default=func.now()),
154
182
  Column("updated_at", DateTime(timezone=True), onupdate=func.now()),
155
183
  Column("content_hash", String),
184
+ Column("content_id", String),
156
185
  extend_existing=True,
157
186
  )
158
187
 
@@ -160,7 +189,7 @@ class PgVector(VectorDb):
160
189
  Index(f"idx_{self.table_name}_id", table.c.id)
161
190
  Index(f"idx_{self.table_name}_name", table.c.name)
162
191
  Index(f"idx_{self.table_name}_content_hash", table.c.content_hash)
163
-
192
+ Index(f"idx_{self.table_name}_content_id", table.c.content_id)
164
193
  return table
165
194
 
166
195
  def get_table(self) -> Table:
@@ -182,11 +211,11 @@ class PgVector(VectorDb):
182
211
  Returns:
183
212
  bool: True if the table exists, False otherwise.
184
213
  """
185
- logger.debug(f"Checking if table '{self.table.fullname}' exists.")
214
+ log_debug(f"Checking if table '{self.table.fullname}' exists.")
186
215
  try:
187
216
  return inspect(self.db_engine).has_table(self.table_name, schema=self.schema)
188
217
  except Exception as e:
189
- logger.error(f"Error checking if table exists: {e}")
218
+ log_error(f"Error checking if table exists: {e}")
190
219
  return False
191
220
 
192
221
  def create(self) -> None:
@@ -195,14 +224,18 @@ class PgVector(VectorDb):
195
224
  """
196
225
  if not self.table_exists():
197
226
  with self.Session() as sess, sess.begin():
198
- logger.debug("Creating extension: vector")
227
+ log_debug("Creating extension: vector")
199
228
  sess.execute(text("CREATE EXTENSION IF NOT EXISTS vector;"))
200
- if self.schema is not None:
201
- logger.debug(f"Creating schema: {self.schema}")
229
+ if self.create_schema and self.schema is not None:
230
+ log_debug(f"Creating schema: {self.schema}")
202
231
  sess.execute(text(f"CREATE SCHEMA IF NOT EXISTS {self.schema};"))
203
- logger.debug(f"Creating table: {self.table_name}")
232
+ log_debug(f"Creating table: {self.table_name}")
204
233
  self.table.create(self.db_engine)
205
234
 
235
+ async def async_create(self) -> None:
236
+ """Create the table asynchronously by running in a thread."""
237
+ await asyncio.to_thread(self.create)
238
+
206
239
  def _record_exists(self, column, value) -> bool:
207
240
  """
208
241
  Check if a record with the given column value exists in the table.
@@ -220,23 +253,9 @@ class PgVector(VectorDb):
220
253
  result = sess.execute(stmt).first()
221
254
  return result is not None
222
255
  except Exception as e:
223
- logger.error(f"Error checking if record exists: {e}")
256
+ log_error(f"Error checking if record exists: {e}")
224
257
  return False
225
258
 
226
- def doc_exists(self, document: Document) -> bool:
227
- """
228
- Check if a document with the same content hash exists in the table.
229
-
230
- Args:
231
- document (Document): The document to check.
232
-
233
- Returns:
234
- bool: True if the document exists, False otherwise.
235
- """
236
- cleaned_content = document.content.replace("\x00", "\ufffd")
237
- content_hash = md5(cleaned_content.encode()).hexdigest()
238
- return self._record_exists(self.table.c.content_hash, content_hash)
239
-
240
259
  def name_exists(self, name: str) -> bool:
241
260
  """
242
261
  Check if a document with the given name exists in the table.
@@ -249,6 +268,10 @@ class PgVector(VectorDb):
249
268
  """
250
269
  return self._record_exists(self.table.c.name, name)
251
270
 
271
+ async def async_name_exists(self, name: str) -> bool:
272
+ """Check if name exists asynchronously by running in a thread."""
273
+ return await asyncio.to_thread(self.name_exists, name)
274
+
252
275
  def id_exists(self, id: str) -> bool:
253
276
  """
254
277
  Check if a document with the given ID exists in the table.
@@ -261,6 +284,12 @@ class PgVector(VectorDb):
261
284
  """
262
285
  return self._record_exists(self.table.c.id, id)
263
286
 
287
+ def content_hash_exists(self, content_hash: str) -> bool:
288
+ """
289
+ Check if a document with the given content hash exists in the table.
290
+ """
291
+ return self._record_exists(self.table.c.content_hash, content_hash)
292
+
264
293
  def _clean_content(self, content: str) -> str:
265
294
  """
266
295
  Clean the content by replacing null characters.
@@ -275,6 +304,7 @@ class PgVector(VectorDb):
275
304
 
276
305
  def insert(
277
306
  self,
307
+ content_hash: str,
278
308
  documents: List[Document],
279
309
  filters: Optional[Dict[str, Any]] = None,
280
310
  batch_size: int = 100,
@@ -283,6 +313,7 @@ class PgVector(VectorDb):
283
313
  Insert documents into the database.
284
314
 
285
315
  Args:
316
+ content_hash (str): The content hash to insert.
286
317
  documents (List[Document]): List of documents to insert.
287
318
  filters (Optional[Dict[str, Any]]): Filters to apply to the documents.
288
319
  batch_size (int): Number of documents to insert in each batch.
@@ -291,18 +322,62 @@ class PgVector(VectorDb):
291
322
  with self.Session() as sess:
292
323
  for i in range(0, len(documents), batch_size):
293
324
  batch_docs = documents[i : i + batch_size]
294
- logger.debug(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
325
+ log_debug(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
295
326
  try:
296
327
  # Prepare documents for insertion
297
328
  batch_records = []
298
329
  for doc in batch_docs:
299
330
  try:
300
- doc.embed(embedder=self.embedder)
331
+ batch_records.append(self._get_document_record(doc, filters, content_hash))
332
+ except Exception as e:
333
+ log_error(f"Error processing document '{doc.name}': {e}")
334
+
335
+ # Insert the batch of records
336
+ insert_stmt = postgresql.insert(self.table)
337
+ sess.execute(insert_stmt, batch_records)
338
+ sess.commit() # Commit batch independently
339
+ log_info(f"Inserted batch of {len(batch_records)} documents.")
340
+ except Exception as e:
341
+ log_error(f"Error with batch starting at index {i}: {e}")
342
+ sess.rollback() # Rollback the current batch if there's an error
343
+ raise
344
+ except Exception as e:
345
+ log_error(f"Error inserting documents: {e}")
346
+ raise
347
+
348
+ async def async_insert(
349
+ self,
350
+ content_hash: str,
351
+ documents: List[Document],
352
+ filters: Optional[Dict[str, Any]] = None,
353
+ batch_size: int = 100,
354
+ ) -> None:
355
+ """Insert documents asynchronously with parallel embedding."""
356
+ try:
357
+ with self.Session() as sess:
358
+ for i in range(0, len(documents), batch_size):
359
+ batch_docs = documents[i : i + batch_size]
360
+ log_debug(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
361
+ try:
362
+ # Embed all documents in the batch
363
+ await self._async_embed_documents(batch_docs)
364
+
365
+ # Prepare documents for insertion
366
+ batch_records = []
367
+ for doc in batch_docs:
368
+ try:
301
369
  cleaned_content = self._clean_content(doc.content)
302
- content_hash = md5(cleaned_content.encode()).hexdigest()
303
- _id = doc.id or content_hash
370
+ # Include content_hash in ID to ensure uniqueness across different content hashes
371
+ # This allows the same URL/content to be inserted with different descriptions
372
+ base_id = doc.id or md5(cleaned_content.encode()).hexdigest()
373
+ record_id = md5(f"{base_id}_{content_hash}".encode()).hexdigest()
374
+
375
+ meta_data = doc.meta_data or {}
376
+ if filters:
377
+ meta_data.update(filters)
378
+
304
379
  record = {
305
- "id": _id,
380
+ "id": record_id,
306
381
  "name": doc.name,
307
382
  "meta_data": doc.meta_data,
308
383
  "filters": filters,
@@ -310,22 +385,24 @@ class PgVector(VectorDb):
310
385
  "embedding": doc.embedding,
311
386
  "usage": doc.usage,
312
387
  "content_hash": content_hash,
388
+ "content_id": doc.content_id,
313
389
  }
314
390
  batch_records.append(record)
315
391
  except Exception as e:
316
- logger.error(f"Error processing document '{doc.name}': {e}")
392
+ log_error(f"Error processing document '{doc.name}': {e}")
317
393
 
318
394
  # Insert the batch of records
319
- insert_stmt = postgresql.insert(self.table)
320
- sess.execute(insert_stmt, batch_records)
321
- sess.commit() # Commit batch independently
322
- logger.info(f"Inserted batch of {len(batch_records)} documents.")
395
+ if batch_records:
396
+ insert_stmt = postgresql.insert(self.table)
397
+ sess.execute(insert_stmt, batch_records)
398
+ sess.commit() # Commit batch independently
399
+ log_info(f"Inserted batch of {len(batch_records)} documents.")
323
400
  except Exception as e:
324
- logger.error(f"Error with batch starting at index {i}: {e}")
401
+ log_error(f"Error with batch starting at index {i}: {e}")
325
402
  sess.rollback() # Rollback the current batch if there's an error
326
403
  raise
327
404
  except Exception as e:
328
- logger.error(f"Error inserting documents: {e}")
405
+ log_error(f"Error inserting documents: {e}")
329
406
  raise
330
407
 
331
408
  def upsert_available(self) -> bool:
@@ -339,6 +416,27 @@ class PgVector(VectorDb):
339
416
 
340
417
  def upsert(
341
418
  self,
419
+ content_hash: str,
420
+ documents: List[Document],
421
+ filters: Optional[Dict[str, Any]] = None,
422
+ batch_size: int = 100,
423
+ ) -> None:
424
+ """
425
+ Upsert documents by content hash.
426
+ First delete all documents with the same content hash.
427
+ Then upsert the new documents.
428
+ """
429
+ try:
430
+ if self.content_hash_exists(content_hash):
431
+ self._delete_by_content_hash(content_hash)
432
+ self._upsert(content_hash, documents, filters, batch_size)
433
+ except Exception as e:
434
+ log_error(f"Error upserting documents by content hash: {e}")
435
+ raise
436
+
437
+ def _upsert(
438
+ self,
439
+ content_hash: str,
342
440
  documents: List[Document],
343
441
  filters: Optional[Dict[str, Any]] = None,
344
442
  batch_size: int = 100,
@@ -355,18 +453,209 @@ class PgVector(VectorDb):
355
453
  with self.Session() as sess:
356
454
  for i in range(0, len(documents), batch_size):
357
455
  batch_docs = documents[i : i + batch_size]
358
- logger.debug(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
456
+ log_info(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
359
457
  try:
360
458
  # Prepare documents for upserting
361
- batch_records = []
459
+ batch_records_dict: Dict[str, Dict[str, Any]] = {} # Use dict to deduplicate by ID
362
460
  for doc in batch_docs:
363
461
  try:
364
- doc.embed(embedder=self.embedder)
462
+ record = self._get_document_record(doc, filters, content_hash)
463
+ # Use the generated record ID (which includes content_hash) for deduplication
464
+ batch_records_dict[record["id"]] = record
465
+ except Exception as e:
466
+ log_error(f"Error processing document '{doc.name}': {e}")
467
+
468
+ # Convert dict to list for upsert
469
+ batch_records = list(batch_records_dict.values())
470
+ if not batch_records:
471
+ log_info("No valid records to upsert in this batch.")
472
+ continue
473
+
474
+ # Upsert the batch of records
475
+ insert_stmt = postgresql.insert(self.table).values(batch_records)
476
+ upsert_stmt = insert_stmt.on_conflict_do_update(
477
+ index_elements=["id"],
478
+ set_={
479
+ "name": insert_stmt.excluded.name,
480
+ "meta_data": insert_stmt.excluded.meta_data,
481
+ "filters": insert_stmt.excluded.filters,
482
+ "content": insert_stmt.excluded.content,
483
+ "embedding": insert_stmt.excluded.embedding,
484
+ "usage": insert_stmt.excluded.usage,
485
+ "content_hash": insert_stmt.excluded.content_hash,
486
+ "content_id": insert_stmt.excluded.content_id,
487
+ },
488
+ )
489
+ sess.execute(upsert_stmt)
490
+ sess.commit() # Commit batch independently
491
+ log_info(f"Upserted batch of {len(batch_records)} documents.")
492
+ except Exception as e:
493
+ log_error(f"Error with batch starting at index {i}: {e}")
494
+ sess.rollback() # Rollback the current batch if there's an error
495
+ raise
496
+ except Exception as e:
497
+ log_error(f"Error upserting documents: {e}")
498
+ raise
499
+
500
+ def _get_document_record(
501
+ self, doc: Document, filters: Optional[Dict[str, Any]] = None, content_hash: str = ""
502
+ ) -> Dict[str, Any]:
503
+ doc.embed(embedder=self.embedder)
504
+ cleaned_content = self._clean_content(doc.content)
505
+ # Include content_hash in ID to ensure uniqueness across different content hashes
506
+ # This allows the same URL/content to be inserted with different descriptions
507
+ base_id = doc.id or md5(cleaned_content.encode()).hexdigest()
508
+ record_id = md5(f"{base_id}_{content_hash}".encode()).hexdigest()
509
+
510
+ meta_data = doc.meta_data or {}
511
+ if filters:
512
+ meta_data.update(filters)
513
+
514
+ return {
515
+ "id": record_id,
516
+ "name": doc.name,
517
+ "meta_data": doc.meta_data,
518
+ "filters": filters,
519
+ "content": cleaned_content,
520
+ "embedding": doc.embedding,
521
+ "usage": doc.usage,
522
+ "content_hash": content_hash,
523
+ "content_id": doc.content_id,
524
+ }
525
+
526
+ async def _async_embed_documents(self, batch_docs: List[Document]) -> None:
527
+ """
528
+ Embed a batch of documents using either batch embedding or individual embedding.
529
+
530
+ Args:
531
+ batch_docs: List of documents to embed
532
+ """
533
+ if self.embedder.enable_batch and hasattr(self.embedder, "async_get_embeddings_batch_and_usage"):
534
+ # Use batch embedding when enabled and supported
535
+ try:
536
+ # Extract content from all documents
537
+ doc_contents = [doc.content for doc in batch_docs]
538
+
539
+ # Get batch embeddings and usage
540
+ embeddings, usages = await self.embedder.async_get_embeddings_batch_and_usage(doc_contents)
541
+
542
+ # Process documents with pre-computed embeddings
543
+ for j, doc in enumerate(batch_docs):
544
+ try:
545
+ if j < len(embeddings):
546
+ doc.embedding = embeddings[j]
547
+ doc.usage = usages[j] if j < len(usages) else None
548
+ except Exception as e:
549
+ log_error(f"Error assigning batch embedding to document '{doc.name}': {e}")
550
+
551
+ except Exception as e:
552
+ # Check if this is a rate limit error - don't fall back as it would make things worse
553
+ error_str = str(e).lower()
554
+ is_rate_limit = any(
555
+ phrase in error_str
556
+ for phrase in ["rate limit", "too many requests", "429", "trial key", "api calls / minute"]
557
+ )
558
+
559
+ if is_rate_limit:
560
+ log_error(f"Rate limit detected during batch embedding. {e}")
561
+ raise e
562
+ else:
563
+ log_warning(f"Async batch embedding failed, falling back to individual embeddings: {e}")
564
+ # Fall back to individual embedding
565
+ embed_tasks = [doc.async_embed(embedder=self.embedder) for doc in batch_docs]
566
+ results = await asyncio.gather(*embed_tasks, return_exceptions=True)
567
+
568
+ # Check for exceptions and handle them
569
+ for i, result in enumerate(results):
570
+ if isinstance(result, Exception):
571
+ error_msg = str(result)
572
+ # If it's an event loop closure error, log it but don't fail
573
+ if "Event loop is closed" in error_msg or "RuntimeError" in type(result).__name__:
574
+ log_warning(
575
+ f"Event loop closure during embedding for document {i}, but operation may have succeeded: {result}"
576
+ )
577
+ else:
578
+ log_error(f"Error embedding document {i}: {result}")
579
+ else:
580
+ # Use individual embedding
581
+ embed_tasks = [doc.async_embed(embedder=self.embedder) for doc in batch_docs]
582
+ results = await asyncio.gather(*embed_tasks, return_exceptions=True)
583
+
584
+ # Check for exceptions and handle them
585
+ for i, result in enumerate(results):
586
+ if isinstance(result, Exception):
587
+ error_msg = str(result)
588
+ # If it's an event loop closure error, log it but don't fail
589
+ if "Event loop is closed" in error_msg or "RuntimeError" in type(result).__name__:
590
+ log_warning(
591
+ f"Event loop closure during embedding for document {i}, but operation may have succeeded: {result}"
592
+ )
593
+ else:
594
+ log_error(f"Error embedding document {i}: {result}")
595
+
596
+ async def async_upsert(
597
+ self,
598
+ content_hash: str,
599
+ documents: List[Document],
600
+ filters: Optional[Dict[str, Any]] = None,
601
+ batch_size: int = 100,
602
+ ) -> None:
603
+ """Upsert documents asynchronously by running in a thread."""
604
+ try:
605
+ if self.content_hash_exists(content_hash):
606
+ self._delete_by_content_hash(content_hash)
607
+ await self._async_upsert(content_hash, documents, filters, batch_size)
608
+ except Exception as e:
609
+ log_error(f"Error upserting documents by content hash: {e}")
610
+ raise
611
+
612
+ async def _async_upsert(
613
+ self,
614
+ content_hash: str,
615
+ documents: List[Document],
616
+ filters: Optional[Dict[str, Any]] = None,
617
+ batch_size: int = 100,
618
+ ) -> None:
619
+ """
620
+ Upsert (insert or update) documents in the database.
621
+
622
+ Args:
623
+ documents (List[Document]): List of documents to upsert.
624
+ filters (Optional[Dict[str, Any]]): Filters to apply to the documents.
625
+ batch_size (int): Number of documents to upsert in each batch.
626
+ """
627
+ try:
628
+ with self.Session() as sess:
629
+ for i in range(0, len(documents), batch_size):
630
+ batch_docs = documents[i : i + batch_size]
631
+ log_info(f"Processing batch starting at index {i}, size: {len(batch_docs)}")
632
+ try:
633
+ # Embed all documents in the batch
634
+ await self._async_embed_documents(batch_docs)
635
+
636
+ # Prepare documents for upserting
637
+ batch_records_dict = {} # Use dict to deduplicate by ID
638
+ for idx, doc in enumerate(batch_docs):
639
+ try:
365
640
  cleaned_content = self._clean_content(doc.content)
366
- content_hash = md5(cleaned_content.encode()).hexdigest()
367
- _id = doc.id or content_hash
641
+ # Include content_hash in ID to ensure uniqueness across different content hashes
642
+ # This allows the same URL/content to be inserted with different descriptions
643
+ base_id = doc.id or md5(cleaned_content.encode()).hexdigest()
644
+ record_id = md5(f"{base_id}_{content_hash}".encode()).hexdigest()
645
+
646
+ if (
647
+ doc.embedding is not None
648
+ and isinstance(doc.embedding, list)
649
+ and len(doc.embedding) == 0
650
+ ):
651
+ log_warning(f"Document {idx} '{doc.name}' has empty embedding (length 0)")
652
+
653
+ meta_data = doc.meta_data or {}
654
+ if filters:
655
+ meta_data.update(filters)
656
+
368
657
  record = {
369
- "id": _id,
658
+ "id": record_id, # use record_id as a reproducible id to avoid duplicates while upsert
370
659
  "name": doc.name,
371
660
  "meta_data": doc.meta_data,
372
661
  "filters": filters,
@@ -374,44 +663,81 @@ class PgVector(VectorDb):
374
663
  "embedding": doc.embedding,
375
664
  "usage": doc.usage,
376
665
  "content_hash": content_hash,
666
+ "content_id": doc.content_id,
377
667
  }
378
- batch_records.append(record)
668
+ batch_records_dict[record_id] = record # This deduplicates by ID
379
669
  except Exception as e:
380
- logger.error(f"Error processing document '{doc.name}': {e}")
670
+ log_error(f"Error processing document '{doc.name}': {e}")
671
+
672
+ # Convert dict to list for upsert
673
+ batch_records = list(batch_records_dict.values())
674
+ if not batch_records:
675
+ log_info("No valid records to upsert in this batch.")
676
+ continue
381
677
 
382
678
  # Upsert the batch of records
383
679
  insert_stmt = postgresql.insert(self.table).values(batch_records)
384
680
  upsert_stmt = insert_stmt.on_conflict_do_update(
385
681
  index_elements=["id"],
386
- set_=dict(
387
- name=insert_stmt.excluded.name,
388
- meta_data=insert_stmt.excluded.meta_data,
389
- filters=insert_stmt.excluded.filters,
390
- content=insert_stmt.excluded.content,
391
- embedding=insert_stmt.excluded.embedding,
392
- usage=insert_stmt.excluded.usage,
393
- content_hash=insert_stmt.excluded.content_hash,
394
- ),
682
+ set_={
683
+ "name": insert_stmt.excluded.name,
684
+ "meta_data": insert_stmt.excluded.meta_data,
685
+ "filters": insert_stmt.excluded.filters,
686
+ "content": insert_stmt.excluded.content,
687
+ "embedding": insert_stmt.excluded.embedding,
688
+ "usage": insert_stmt.excluded.usage,
689
+ "content_hash": insert_stmt.excluded.content_hash,
690
+ "content_id": insert_stmt.excluded.content_id,
691
+ },
395
692
  )
396
693
  sess.execute(upsert_stmt)
397
694
  sess.commit() # Commit batch independently
398
- logger.info(f"Upserted batch of {len(batch_records)} documents.")
695
+ log_info(f"Upserted batch of {len(batch_records)} documents.")
399
696
  except Exception as e:
400
- logger.error(f"Error with batch starting at index {i}: {e}")
697
+ log_error(f"Error with batch starting at index {i}: {e}")
401
698
  sess.rollback() # Rollback the current batch if there's an error
402
699
  raise
403
700
  except Exception as e:
404
- logger.error(f"Error upserting documents: {e}")
701
+ log_error(f"Error upserting documents: {e}")
702
+ raise
703
+
704
+ def update_metadata(self, content_id: str, metadata: Dict[str, Any]) -> None:
705
+ """
706
+ Update the metadata for a document.
707
+
708
+ Args:
709
+ content_id (str): The ID of the document.
710
+ metadata (Dict[str, Any]): The metadata to update.
711
+ """
712
+ try:
713
+ with self.Session() as sess:
714
+ # Merge JSONB for metadata, but replace filters entirely (absolute value)
715
+ stmt = (
716
+ update(self.table)
717
+ .where(self.table.c.content_id == content_id)
718
+ .values(
719
+ meta_data=func.coalesce(self.table.c.meta_data, text("'{}'::jsonb")).op("||")(
720
+ bindparam("md", type_=postgresql.JSONB)
721
+ ),
722
+ filters=bindparam("ft", type_=postgresql.JSONB),
723
+ )
724
+ )
725
+ sess.execute(stmt, {"md": metadata, "ft": metadata})
726
+ sess.commit()
727
+ except Exception as e:
728
+ log_error(f"Error updating metadata for document {content_id}: {e}")
405
729
  raise
406
730
 
407
- def search(self, query: str, limit: int = 5, filters: Optional[Dict[str, Any]] = None) -> List[Document]:
731
+ def search(
732
+ self, query: str, limit: int = 5, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None
733
+ ) -> List[Document]:
408
734
  """
409
735
  Perform a search based on the configured search type.
410
736
 
411
737
  Args:
412
738
  query (str): The search query.
413
739
  limit (int): Maximum number of results to return.
414
- filters (Optional[Dict[str, Any]]): Filters to apply to the search.
740
+ filters (Optional[Union[Dict[str, Any], List[FilterExpr]]]): Filters to apply to the search.
415
741
 
416
742
  Returns:
417
743
  List[Document]: List of matching documents.
@@ -423,17 +749,46 @@ class PgVector(VectorDb):
423
749
  elif self.search_type == SearchType.hybrid:
424
750
  return self.hybrid_search(query=query, limit=limit, filters=filters)
425
751
  else:
426
- logger.error(f"Invalid search type '{self.search_type}'.")
752
+ log_error(f"Invalid search type '{self.search_type}'.")
427
753
  return []
428
754
 
429
- def vector_search(self, query: str, limit: int = 5, filters: Optional[Dict[str, Any]] = None) -> List[Document]:
755
+ async def async_search(
756
+ self, query: str, limit: int = 5, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None
757
+ ) -> List[Document]:
758
+ """Search asynchronously by running in a thread."""
759
+ return await asyncio.to_thread(self.search, query, limit, filters)
760
+
761
+ def _dsl_to_sqlalchemy(self, filter_expr, table) -> ColumnElement[bool]:
762
+ op = filter_expr["op"]
763
+
764
+ if op == "EQ":
765
+ return table.c.meta_data[filter_expr["key"]].astext == str(filter_expr["value"])
766
+ elif op == "IN":
767
+ # Postgres JSONB array containment
768
+ return table.c.meta_data[filter_expr["key"]].astext.in_([str(v) for v in filter_expr["values"]])
769
+ elif op == "GT":
770
+ return table.c.meta_data[filter_expr["key"]].astext.cast(Integer) > filter_expr["value"]
771
+ elif op == "LT":
772
+ return table.c.meta_data[filter_expr["key"]].astext.cast(Integer) < filter_expr["value"]
773
+ elif op == "NOT":
774
+ return not_(self._dsl_to_sqlalchemy(filter_expr["condition"], table))
775
+ elif op == "AND":
776
+ return and_(*[self._dsl_to_sqlalchemy(cond, table) for cond in filter_expr["conditions"]])
777
+ elif op == "OR":
778
+ return or_(*[self._dsl_to_sqlalchemy(cond, table) for cond in filter_expr["conditions"]])
779
+ else:
780
+ raise ValueError(f"Unknown filter operator: {op}")
781
+
782
+ def vector_search(
783
+ self, query: str, limit: int = 5, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None
784
+ ) -> List[Document]:
430
785
  """
431
786
  Perform a vector similarity search.
432
787
 
433
788
  Args:
434
789
  query (str): The search query.
435
790
  limit (int): Maximum number of results to return.
436
- filters (Optional[Dict[str, Any]]): Filters to apply to the search.
791
+ filters (Optional[Union[Dict[str, Any], List[FilterExpr]]]): Filters to apply to the search.
437
792
 
438
793
  Returns:
439
794
  List[Document]: List of matching documents.
@@ -442,7 +797,7 @@ class PgVector(VectorDb):
442
797
  # Get the embedding for the query string
443
798
  query_embedding = self.embedder.get_embedding(query)
444
799
  if query_embedding is None:
445
- logger.error(f"Error getting embedding for Query: {query}")
800
+ log_error(f"Error getting embedding for Query: {query}")
446
801
  return []
447
802
 
448
803
  # Define the columns to select
@@ -460,7 +815,17 @@ class PgVector(VectorDb):
460
815
 
461
816
  # Apply filters if provided
462
817
  if filters is not None:
463
- stmt = stmt.where(self.table.c.filters.contains(filters))
818
+ # Handle dict filters
819
+ if isinstance(filters, dict):
820
+ stmt = stmt.where(self.table.c.meta_data.contains(filters))
821
+ # Handle FilterExpr DSL
822
+ else:
823
+ # Convert each DSL expression to SQLAlchemy and AND them together
824
+ sqlalchemy_conditions = [
825
+ self._dsl_to_sqlalchemy(f.to_dict() if hasattr(f, "to_dict") else f, self.table)
826
+ for f in filters
827
+ ]
828
+ stmt = stmt.where(and_(*sqlalchemy_conditions))
464
829
 
465
830
  # Order the results based on the distance metric
466
831
  if self.distance == Distance.l2:
@@ -470,14 +835,14 @@ class PgVector(VectorDb):
470
835
  elif self.distance == Distance.max_inner_product:
471
836
  stmt = stmt.order_by(self.table.c.embedding.max_inner_product(query_embedding))
472
837
  else:
473
- logger.error(f"Unknown distance metric: {self.distance}")
838
+ log_error(f"Unknown distance metric: {self.distance}")
474
839
  return []
475
840
 
476
841
  # Limit the number of results
477
842
  stmt = stmt.limit(limit)
478
843
 
479
844
  # Log the query for debugging
480
- logger.debug(f"Vector search query: {stmt}")
845
+ log_debug(f"Vector search query: {stmt}")
481
846
 
482
847
  # Execute the query
483
848
  try:
@@ -489,8 +854,8 @@ class PgVector(VectorDb):
489
854
  sess.execute(text(f"SET LOCAL hnsw.ef_search = {self.vector_index.ef_search}"))
490
855
  results = sess.execute(stmt).fetchall()
491
856
  except Exception as e:
492
- logger.error(f"Error performing semantic search: {e}")
493
- logger.error("Table might not exist, creating for future use")
857
+ log_error(f"Error performing semantic search: {e}")
858
+ log_error("Table might not exist, creating for future use")
494
859
  self.create()
495
860
  return []
496
861
 
@@ -512,9 +877,10 @@ class PgVector(VectorDb):
512
877
  if self.reranker:
513
878
  search_results = self.reranker.rerank(query=query, documents=search_results)
514
879
 
880
+ log_info(f"Found {len(search_results)} documents")
515
881
  return search_results
516
882
  except Exception as e:
517
- logger.error(f"Error during vector search: {e}")
883
+ log_error(f"Error during vector search: {e}")
518
884
  return []
519
885
 
520
886
  def enable_prefix_matching(self, query: str) -> str:
@@ -532,14 +898,16 @@ class PgVector(VectorDb):
532
898
  processed_words = [word + "*" for word in words]
533
899
  return " ".join(processed_words)
534
900
 
535
- def keyword_search(self, query: str, limit: int = 5, filters: Optional[Dict[str, Any]] = None) -> List[Document]:
901
+ def keyword_search(
902
+ self, query: str, limit: int = 5, filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None
903
+ ) -> List[Document]:
536
904
  """
537
905
  Perform a keyword search on the 'content' column.
538
906
 
539
907
  Args:
540
908
  query (str): The search query.
541
909
  limit (int): Maximum number of results to return.
542
- filters (Optional[Dict[str, Any]]): Filters to apply to the search.
910
+ filters (Optional[Union[Dict[str, Any], List[FilterExpr]]]): Filters to apply to the search.
543
911
 
544
912
  Returns:
545
913
  List[Document]: List of matching documents.
@@ -568,8 +936,17 @@ class PgVector(VectorDb):
568
936
 
569
937
  # Apply filters if provided
570
938
  if filters is not None:
571
- # Use the contains() method for JSONB columns to check if the filters column contains the specified filters
572
- stmt = stmt.where(self.table.c.filters.contains(filters))
939
+ # Handle dict filters
940
+ if isinstance(filters, dict):
941
+ stmt = stmt.where(self.table.c.meta_data.contains(filters))
942
+ # Handle FilterExpr DSL
943
+ else:
944
+ # Convert each DSL expression to SQLAlchemy and AND them together
945
+ sqlalchemy_conditions = [
946
+ self._dsl_to_sqlalchemy(f.to_dict() if hasattr(f, "to_dict") else f, self.table)
947
+ for f in filters
948
+ ]
949
+ stmt = stmt.where(and_(*sqlalchemy_conditions))
573
950
 
574
951
  # Order by the relevance rank
575
952
  stmt = stmt.order_by(text_rank.desc())
@@ -578,15 +955,15 @@ class PgVector(VectorDb):
578
955
  stmt = stmt.limit(limit)
579
956
 
580
957
  # Log the query for debugging
581
- logger.debug(f"Keyword search query: {stmt}")
958
+ log_debug(f"Keyword search query: {stmt}")
582
959
 
583
960
  # Execute the query
584
961
  try:
585
962
  with self.Session() as sess, sess.begin():
586
963
  results = sess.execute(stmt).fetchall()
587
964
  except Exception as e:
588
- logger.error(f"Error performing keyword search: {e}")
589
- logger.error("Table might not exist, creating for future use")
965
+ log_error(f"Error performing keyword search: {e}")
966
+ log_error("Table might not exist, creating for future use")
590
967
  self.create()
591
968
  return []
592
969
 
@@ -605,16 +982,17 @@ class PgVector(VectorDb):
605
982
  )
606
983
  )
607
984
 
985
+ log_info(f"Found {len(search_results)} documents")
608
986
  return search_results
609
987
  except Exception as e:
610
- logger.error(f"Error during keyword search: {e}")
988
+ log_error(f"Error during keyword search: {e}")
611
989
  return []
612
990
 
613
991
  def hybrid_search(
614
992
  self,
615
993
  query: str,
616
994
  limit: int = 5,
617
- filters: Optional[Dict[str, Any]] = None,
995
+ filters: Optional[Union[Dict[str, Any], List[FilterExpr]]] = None,
618
996
  ) -> List[Document]:
619
997
  """
620
998
  Perform a hybrid search combining vector similarity and full-text search.
@@ -622,7 +1000,7 @@ class PgVector(VectorDb):
622
1000
  Args:
623
1001
  query (str): The search query.
624
1002
  limit (int): Maximum number of results to return.
625
- filters (Optional[Dict[str, Any]]): Filters to apply to the search.
1003
+ filters (Optional[Union[Dict[str, Any], List[FilterExpr]]]): Filters to apply to the search.
626
1004
 
627
1005
  Returns:
628
1006
  List[Document]: List of matching documents.
@@ -631,7 +1009,7 @@ class PgVector(VectorDb):
631
1009
  # Get the embedding for the query string
632
1010
  query_embedding = self.embedder.get_embedding(query)
633
1011
  if query_embedding is None:
634
- logger.error(f"Error getting embedding for Query: {query}")
1012
+ log_error(f"Error getting embedding for Query: {query}")
635
1013
  return []
636
1014
 
637
1015
  # Define the columns to select
@@ -669,7 +1047,7 @@ class PgVector(VectorDb):
669
1047
  # Normalize to range [0, 1]
670
1048
  vector_score = (raw_vector_score + 1) / 2
671
1049
  else:
672
- logger.error(f"Unknown distance metric: {self.distance}")
1050
+ log_error(f"Unknown distance metric: {self.distance}")
673
1051
  return []
674
1052
 
675
1053
  # Apply weights to control the influence of each score
@@ -689,7 +1067,17 @@ class PgVector(VectorDb):
689
1067
 
690
1068
  # Apply filters if provided
691
1069
  if filters is not None:
692
- stmt = stmt.where(self.table.c.filters.contains(filters))
1070
+ # Handle dict filters
1071
+ if isinstance(filters, dict):
1072
+ stmt = stmt.where(self.table.c.meta_data.contains(filters))
1073
+ # Handle FilterExpr DSL
1074
+ else:
1075
+ # Convert each DSL expression to SQLAlchemy and AND them together
1076
+ sqlalchemy_conditions = [
1077
+ self._dsl_to_sqlalchemy(f.to_dict() if hasattr(f, "to_dict") else f, self.table)
1078
+ for f in filters
1079
+ ]
1080
+ stmt = stmt.where(and_(*sqlalchemy_conditions))
693
1081
 
694
1082
  # Order the results by the hybrid score in descending order
695
1083
  stmt = stmt.order_by(desc("hybrid_score"))
@@ -698,7 +1086,7 @@ class PgVector(VectorDb):
698
1086
  stmt = stmt.limit(limit)
699
1087
 
700
1088
  # Log the query for debugging
701
- logger.debug(f"Hybrid search query: {stmt}")
1089
+ log_debug(f"Hybrid search query: {stmt}")
702
1090
 
703
1091
  # Execute the query
704
1092
  try:
@@ -710,7 +1098,7 @@ class PgVector(VectorDb):
710
1098
  sess.execute(text(f"SET LOCAL hnsw.ef_search = {self.vector_index.ef_search}"))
711
1099
  results = sess.execute(stmt).fetchall()
712
1100
  except Exception as e:
713
- logger.error(f"Error performing hybrid search: {e}")
1101
+ log_error(f"Error performing hybrid search: {e}")
714
1102
  return []
715
1103
 
716
1104
  # Process the results and convert to Document objects
@@ -728,9 +1116,14 @@ class PgVector(VectorDb):
728
1116
  )
729
1117
  )
730
1118
 
1119
+ if self.reranker:
1120
+ search_results = self.reranker.rerank(query=query, documents=search_results)
1121
+
1122
+ log_info(f"Found {len(search_results)} documents")
1123
+
731
1124
  return search_results
732
1125
  except Exception as e:
733
- logger.error(f"Error during hybrid search: {e}")
1126
+ log_error(f"Error during hybrid search: {e}")
734
1127
  return []
735
1128
 
736
1129
  def drop(self) -> None:
@@ -739,14 +1132,18 @@ class PgVector(VectorDb):
739
1132
  """
740
1133
  if self.table_exists():
741
1134
  try:
742
- logger.debug(f"Dropping table '{self.table.fullname}'.")
1135
+ log_debug(f"Dropping table '{self.table.fullname}'.")
743
1136
  self.table.drop(self.db_engine)
744
- logger.info(f"Table '{self.table.fullname}' dropped successfully.")
1137
+ log_info(f"Table '{self.table.fullname}' dropped successfully.")
745
1138
  except Exception as e:
746
- logger.error(f"Error dropping table '{self.table.fullname}': {e}")
1139
+ log_error(f"Error dropping table '{self.table.fullname}': {e}")
747
1140
  raise
748
1141
  else:
749
- logger.info(f"Table '{self.table.fullname}' does not exist.")
1142
+ log_info(f"Table '{self.table.fullname}' does not exist.")
1143
+
1144
+ async def async_drop(self) -> None:
1145
+ """Drop the table asynchronously by running in a thread."""
1146
+ await asyncio.to_thread(self.drop)
750
1147
 
751
1148
  def exists(self) -> bool:
752
1149
  """
@@ -757,6 +1154,10 @@ class PgVector(VectorDb):
757
1154
  """
758
1155
  return self.table_exists()
759
1156
 
1157
+ async def async_exists(self) -> bool:
1158
+ """Check if table exists asynchronously by running in a thread."""
1159
+ return await asyncio.to_thread(self.exists)
1160
+
760
1161
  def get_count(self) -> int:
761
1162
  """
762
1163
  Get the number of records in the table.
@@ -770,7 +1171,7 @@ class PgVector(VectorDb):
770
1171
  result = sess.execute(stmt).scalar()
771
1172
  return int(result) if result is not None else 0
772
1173
  except Exception as e:
773
- logger.error(f"Error getting count from table '{self.table.fullname}': {e}")
1174
+ log_error(f"Error getting count from table '{self.table.fullname}': {e}")
774
1175
  return 0
775
1176
 
776
1177
  def optimize(self, force_recreate: bool = False) -> None:
@@ -780,10 +1181,10 @@ class PgVector(VectorDb):
780
1181
  Args:
781
1182
  force_recreate (bool): If True, existing indexes will be dropped and recreated.
782
1183
  """
783
- logger.debug("==== Optimizing Vector DB ====")
1184
+ log_debug("==== Optimizing Vector DB ====")
784
1185
  self._create_vector_index(force_recreate=force_recreate)
785
1186
  self._create_gin_index(force_recreate=force_recreate)
786
- logger.debug("==== Optimized Vector DB ====")
1187
+ log_debug("==== Optimized Vector DB ====")
787
1188
 
788
1189
  def _index_exists(self, index_name: str) -> bool:
789
1190
  """
@@ -811,7 +1212,7 @@ class PgVector(VectorDb):
811
1212
  drop_index_sql = f'DROP INDEX IF EXISTS "{self.schema}"."{index_name}";'
812
1213
  sess.execute(text(drop_index_sql))
813
1214
  except Exception as e:
814
- logger.error(f"Error dropping index '{index_name}': {e}")
1215
+ log_error(f"Error dropping index '{index_name}': {e}")
815
1216
  raise
816
1217
 
817
1218
  def _create_vector_index(self, force_recreate: bool = False) -> None:
@@ -822,7 +1223,7 @@ class PgVector(VectorDb):
822
1223
  force_recreate (bool): If True, existing index will be dropped and recreated.
823
1224
  """
824
1225
  if self.vector_index is None:
825
- logger.debug("No vector index specified, skipping vector index optimization.")
1226
+ log_debug("No vector index specified, skipping vector index optimization.")
826
1227
  return
827
1228
 
828
1229
  # Generate index name if not provided
@@ -844,12 +1245,12 @@ class PgVector(VectorDb):
844
1245
  vector_index_exists = self._index_exists(self.vector_index.name)
845
1246
 
846
1247
  if vector_index_exists:
847
- logger.info(f"Vector index '{self.vector_index.name}' already exists.")
1248
+ log_info(f"Vector index '{self.vector_index.name}' already exists.")
848
1249
  if force_recreate:
849
- logger.info(f"Force recreating vector index '{self.vector_index.name}'. Dropping existing index.")
1250
+ log_info(f"Force recreating vector index '{self.vector_index.name}'. Dropping existing index.")
850
1251
  self._drop_index(self.vector_index.name)
851
1252
  else:
852
- logger.info(f"Skipping vector index creation as index '{self.vector_index.name}' already exists.")
1253
+ log_info(f"Skipping vector index creation as index '{self.vector_index.name}' already exists.")
853
1254
  return
854
1255
 
855
1256
  # Proceed to create the vector index
@@ -857,7 +1258,7 @@ class PgVector(VectorDb):
857
1258
  with self.Session() as sess, sess.begin():
858
1259
  # Set configuration parameters
859
1260
  if self.vector_index.configuration:
860
- logger.debug(f"Setting configuration: {self.vector_index.configuration}")
1261
+ log_debug(f"Setting configuration: {self.vector_index.configuration}")
861
1262
  for key, value in self.vector_index.configuration.items():
862
1263
  sess.execute(text(f"SET {key} = :value;"), {"value": value})
863
1264
 
@@ -866,10 +1267,10 @@ class PgVector(VectorDb):
866
1267
  elif isinstance(self.vector_index, HNSW):
867
1268
  self._create_hnsw_index(sess, table_fullname, index_distance)
868
1269
  else:
869
- logger.error(f"Unknown index type: {type(self.vector_index)}")
1270
+ log_error(f"Unknown index type: {type(self.vector_index)}")
870
1271
  return
871
1272
  except Exception as e:
872
- logger.error(f"Error creating vector index '{self.vector_index.name}': {e}")
1273
+ log_error(f"Error creating vector index '{self.vector_index.name}': {e}")
873
1274
  raise
874
1275
 
875
1276
  def _create_ivfflat_index(self, sess: Session, table_fullname: str, index_distance: str) -> None:
@@ -888,7 +1289,7 @@ class PgVector(VectorDb):
888
1289
  num_lists = self.vector_index.lists
889
1290
  if self.vector_index.dynamic_lists:
890
1291
  total_records = self.get_count()
891
- logger.debug(f"Number of records: {total_records}")
1292
+ log_debug(f"Number of records: {total_records}")
892
1293
  if total_records < 1000000:
893
1294
  num_lists = max(int(total_records / 1000), 1) # Ensure at least one list
894
1295
  else:
@@ -897,7 +1298,7 @@ class PgVector(VectorDb):
897
1298
  # Set ivfflat.probes
898
1299
  sess.execute(text("SET ivfflat.probes = :probes;"), {"probes": self.vector_index.probes})
899
1300
 
900
- logger.debug(
1301
+ log_debug(
901
1302
  f"Creating Ivfflat index '{self.vector_index.name}' on table '{table_fullname}' with "
902
1303
  f"lists: {num_lists}, probes: {self.vector_index.probes}, "
903
1304
  f"and distance metric: {index_distance}"
@@ -923,7 +1324,7 @@ class PgVector(VectorDb):
923
1324
  # Cast index to HNSW for type hinting
924
1325
  self.vector_index = cast(HNSW, self.vector_index)
925
1326
 
926
- logger.debug(
1327
+ log_debug(
927
1328
  f"Creating HNSW index '{self.vector_index.name}' on table '{table_fullname}' with "
928
1329
  f"m: {self.vector_index.m}, ef_construction: {self.vector_index.ef_construction}, "
929
1330
  f"and distance metric: {index_distance}"
@@ -949,18 +1350,18 @@ class PgVector(VectorDb):
949
1350
  gin_index_exists = self._index_exists(gin_index_name)
950
1351
 
951
1352
  if gin_index_exists:
952
- logger.info(f"GIN index '{gin_index_name}' already exists.")
1353
+ log_info(f"GIN index '{gin_index_name}' already exists.")
953
1354
  if force_recreate:
954
- logger.info(f"Force recreating GIN index '{gin_index_name}'. Dropping existing index.")
1355
+ log_info(f"Force recreating GIN index '{gin_index_name}'. Dropping existing index.")
955
1356
  self._drop_index(gin_index_name)
956
1357
  else:
957
- logger.info(f"Skipping GIN index creation as index '{gin_index_name}' already exists.")
1358
+ log_info(f"Skipping GIN index creation as index '{gin_index_name}' already exists.")
958
1359
  return
959
1360
 
960
1361
  # Proceed to create GIN index
961
1362
  try:
962
1363
  with self.Session() as sess, sess.begin():
963
- logger.debug(f"Creating GIN index '{gin_index_name}' on table '{self.table.fullname}'.")
1364
+ log_debug(f"Creating GIN index '{gin_index_name}' on table '{self.table.fullname}'.")
964
1365
  # Create index
965
1366
  create_gin_index_sql = text(
966
1367
  f'CREATE INDEX "{gin_index_name}" ON {self.table.fullname} '
@@ -968,7 +1369,7 @@ class PgVector(VectorDb):
968
1369
  )
969
1370
  sess.execute(create_gin_index_sql)
970
1371
  except Exception as e:
971
- logger.error(f"Error creating GIN index '{gin_index_name}': {e}")
1372
+ log_error(f"Error creating GIN index '{gin_index_name}': {e}")
972
1373
  raise
973
1374
 
974
1375
  def delete(self) -> bool:
@@ -984,10 +1385,90 @@ class PgVector(VectorDb):
984
1385
  with self.Session() as sess:
985
1386
  sess.execute(delete(self.table))
986
1387
  sess.commit()
987
- logger.info(f"Deleted all records from table '{self.table.fullname}'.")
1388
+ log_info(f"Deleted all records from table '{self.table.fullname}'.")
1389
+ return True
1390
+ except Exception as e:
1391
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1392
+ sess.rollback()
1393
+ return False
1394
+
1395
+ def delete_by_id(self, id: str) -> bool:
1396
+ """
1397
+ Delete content by ID.
1398
+ """
1399
+ try:
1400
+ with self.Session() as sess, sess.begin():
1401
+ stmt = self.table.delete().where(self.table.c.id == id)
1402
+ sess.execute(stmt)
1403
+ sess.commit()
1404
+ log_info(f"Deleted records with id '{id}' from table '{self.table.fullname}'.")
1405
+ return True
1406
+ except Exception as e:
1407
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1408
+ sess.rollback()
1409
+ return False
1410
+
1411
+ def delete_by_name(self, name: str) -> bool:
1412
+ """
1413
+ Delete content by name.
1414
+ """
1415
+ try:
1416
+ with self.Session() as sess, sess.begin():
1417
+ stmt = self.table.delete().where(self.table.c.name == name)
1418
+ sess.execute(stmt)
1419
+ sess.commit()
1420
+ log_info(f"Deleted records with name '{name}' from table '{self.table.fullname}'.")
1421
+ return True
1422
+ except Exception as e:
1423
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1424
+ sess.rollback()
1425
+ return False
1426
+
1427
+ def delete_by_metadata(self, metadata: Dict[str, Any]) -> bool:
1428
+ """
1429
+ Delete content by metadata.
1430
+ """
1431
+ try:
1432
+ with self.Session() as sess, sess.begin():
1433
+ stmt = self.table.delete().where(self.table.c.meta_data.contains(metadata))
1434
+ sess.execute(stmt)
1435
+ sess.commit()
1436
+ log_info(f"Deleted records with metadata '{metadata}' from table '{self.table.fullname}'.")
1437
+ return True
1438
+ except Exception as e:
1439
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1440
+ sess.rollback()
1441
+ return False
1442
+
1443
+ def delete_by_content_id(self, content_id: str) -> bool:
1444
+ """
1445
+ Delete content by content ID.
1446
+ """
1447
+ try:
1448
+ with self.Session() as sess, sess.begin():
1449
+ stmt = self.table.delete().where(self.table.c.content_id == content_id)
1450
+ sess.execute(stmt)
1451
+ sess.commit()
1452
+ log_info(f"Deleted records with content ID '{content_id}' from table '{self.table.fullname}'.")
988
1453
  return True
989
1454
  except Exception as e:
990
- logger.error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1455
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
1456
+ sess.rollback()
1457
+ return False
1458
+
1459
+ def _delete_by_content_hash(self, content_hash: str) -> bool:
1460
+ """
1461
+ Delete content by content hash.
1462
+ """
1463
+ try:
1464
+ with self.Session() as sess, sess.begin():
1465
+ stmt = self.table.delete().where(self.table.c.content_hash == content_hash)
1466
+ sess.execute(stmt)
1467
+ sess.commit()
1468
+ log_info(f"Deleted records with content hash '{content_hash}' from table '{self.table.fullname}'.")
1469
+ return True
1470
+ except Exception as e:
1471
+ log_error(f"Error deleting rows from table '{self.table.fullname}': {e}")
991
1472
  sess.rollback()
992
1473
  return False
993
1474
 
@@ -1023,3 +1504,6 @@ class PgVector(VectorDb):
1023
1504
  copied_obj.table = copied_obj.get_table()
1024
1505
 
1025
1506
  return copied_obj
1507
+
1508
+ def get_supported_search_types(self) -> List[str]:
1509
+ return [SearchType.vector, SearchType.keyword, SearchType.hybrid]