PyPI - vanna - Versions diffs - 0.7.9__py3-none-any.whl → 2.0.0rc1__py3-none-any.whl - Mend

vanna-0.7.9-py3-none-any.whl → vanna-2.0.0rc1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (302)

vanna/__init__.py +167 -395
vanna/agents/__init__.py +7 -0
vanna/capabilities/__init__.py +17 -0
vanna/capabilities/agent_memory/__init__.py +21 -0
vanna/capabilities/agent_memory/base.py +103 -0
vanna/capabilities/agent_memory/models.py +53 -0
vanna/capabilities/file_system/__init__.py +14 -0
vanna/capabilities/file_system/base.py +71 -0
vanna/capabilities/file_system/models.py +25 -0
vanna/capabilities/sql_runner/__init__.py +13 -0
vanna/capabilities/sql_runner/base.py +37 -0
vanna/capabilities/sql_runner/models.py +13 -0
vanna/components/__init__.py +92 -0
vanna/components/base.py +11 -0
vanna/components/rich/__init__.py +83 -0
vanna/components/rich/containers/__init__.py +7 -0
vanna/components/rich/containers/card.py +20 -0
vanna/components/rich/data/__init__.py +9 -0
vanna/components/rich/data/chart.py +17 -0
vanna/components/rich/data/dataframe.py +93 -0
vanna/components/rich/feedback/__init__.py +21 -0
vanna/components/rich/feedback/badge.py +16 -0
vanna/components/rich/feedback/icon_text.py +14 -0
vanna/components/rich/feedback/log_viewer.py +41 -0
vanna/components/rich/feedback/notification.py +19 -0
vanna/components/rich/feedback/progress.py +37 -0
vanna/components/rich/feedback/status_card.py +28 -0
vanna/components/rich/feedback/status_indicator.py +14 -0
vanna/components/rich/interactive/__init__.py +21 -0
vanna/components/rich/interactive/button.py +95 -0
vanna/components/rich/interactive/task_list.py +58 -0
vanna/components/rich/interactive/ui_state.py +93 -0
vanna/components/rich/specialized/__init__.py +7 -0
vanna/components/rich/specialized/artifact.py +20 -0
vanna/components/rich/text.py +16 -0
vanna/components/simple/__init__.py +15 -0
vanna/components/simple/image.py +15 -0
vanna/components/simple/link.py +15 -0
vanna/components/simple/text.py +11 -0
vanna/core/__init__.py +193 -0
vanna/core/_compat.py +19 -0
vanna/core/agent/__init__.py +10 -0
vanna/core/agent/agent.py +1407 -0
vanna/core/agent/config.py +123 -0
vanna/core/audit/__init__.py +28 -0
vanna/core/audit/base.py +299 -0
vanna/core/audit/models.py +131 -0
vanna/core/component_manager.py +329 -0
vanna/core/components.py +53 -0
vanna/core/enhancer/__init__.py +11 -0
vanna/core/enhancer/base.py +94 -0
vanna/core/enhancer/default.py +118 -0
vanna/core/enricher/__init__.py +10 -0
vanna/core/enricher/base.py +59 -0
vanna/core/errors.py +47 -0
vanna/core/evaluation/__init__.py +81 -0
vanna/core/evaluation/base.py +186 -0
vanna/core/evaluation/dataset.py +254 -0
vanna/core/evaluation/evaluators.py +376 -0
vanna/core/evaluation/report.py +289 -0
vanna/core/evaluation/runner.py +313 -0
vanna/core/filter/__init__.py +10 -0
vanna/core/filter/base.py +67 -0
vanna/core/lifecycle/__init__.py +10 -0
vanna/core/lifecycle/base.py +83 -0
vanna/core/llm/__init__.py +16 -0
vanna/core/llm/base.py +40 -0
vanna/core/llm/models.py +61 -0
vanna/core/middleware/__init__.py +10 -0
vanna/core/middleware/base.py +69 -0
vanna/core/observability/__init__.py +11 -0
vanna/core/observability/base.py +88 -0
vanna/core/observability/models.py +47 -0
vanna/core/recovery/__init__.py +11 -0
vanna/core/recovery/base.py +84 -0
vanna/core/recovery/models.py +32 -0
vanna/core/registry.py +278 -0
vanna/core/rich_component.py +156 -0
vanna/core/simple_component.py +27 -0
vanna/core/storage/__init__.py +14 -0
vanna/core/storage/base.py +46 -0
vanna/core/storage/models.py +46 -0
vanna/core/system_prompt/__init__.py +13 -0
vanna/core/system_prompt/base.py +36 -0
vanna/core/system_prompt/default.py +157 -0
vanna/core/tool/__init__.py +18 -0
vanna/core/tool/base.py +70 -0
vanna/core/tool/models.py +84 -0
vanna/core/user/__init__.py +17 -0
vanna/core/user/base.py +29 -0
vanna/core/user/models.py +25 -0
vanna/core/user/request_context.py +70 -0
vanna/core/user/resolver.py +42 -0
vanna/core/validation.py +164 -0
vanna/core/workflow/__init__.py +12 -0
vanna/core/workflow/base.py +254 -0
vanna/core/workflow/default.py +789 -0
vanna/examples/__init__.py +1 -0
vanna/examples/__main__.py +44 -0
vanna/examples/anthropic_quickstart.py +80 -0
vanna/examples/artifact_example.py +293 -0
vanna/examples/claude_sqlite_example.py +236 -0
vanna/examples/coding_agent_example.py +300 -0
vanna/examples/custom_system_prompt_example.py +174 -0
vanna/examples/default_workflow_handler_example.py +208 -0
vanna/examples/email_auth_example.py +340 -0
vanna/examples/evaluation_example.py +269 -0
vanna/examples/extensibility_example.py +262 -0
vanna/examples/minimal_example.py +67 -0
vanna/examples/mock_auth_example.py +227 -0
vanna/examples/mock_custom_tool.py +311 -0
vanna/examples/mock_quickstart.py +79 -0
vanna/examples/mock_quota_example.py +145 -0
vanna/examples/mock_rich_components_demo.py +396 -0
vanna/examples/mock_sqlite_example.py +223 -0
vanna/examples/openai_quickstart.py +83 -0
vanna/examples/primitive_components_demo.py +305 -0
vanna/examples/quota_lifecycle_example.py +139 -0
vanna/examples/visualization_example.py +251 -0
vanna/integrations/__init__.py +17 -0
vanna/integrations/anthropic/__init__.py +9 -0
vanna/integrations/anthropic/llm.py +270 -0
vanna/integrations/azureopenai/__init__.py +9 -0
vanna/integrations/azureopenai/llm.py +329 -0
vanna/integrations/azuresearch/__init__.py +7 -0
vanna/integrations/azuresearch/agent_memory.py +413 -0
vanna/integrations/bigquery/__init__.py +5 -0
vanna/integrations/bigquery/sql_runner.py +81 -0
vanna/integrations/chromadb/__init__.py +104 -0
vanna/integrations/chromadb/agent_memory.py +416 -0
vanna/integrations/clickhouse/__init__.py +5 -0
vanna/integrations/clickhouse/sql_runner.py +82 -0
vanna/integrations/duckdb/__init__.py +5 -0
vanna/integrations/duckdb/sql_runner.py +65 -0
vanna/integrations/faiss/__init__.py +7 -0
vanna/integrations/faiss/agent_memory.py +431 -0
vanna/integrations/google/__init__.py +9 -0
vanna/integrations/google/gemini.py +370 -0
vanna/integrations/hive/__init__.py +5 -0
vanna/integrations/hive/sql_runner.py +87 -0
vanna/integrations/local/__init__.py +17 -0
vanna/integrations/local/agent_memory/__init__.py +7 -0
vanna/integrations/local/agent_memory/in_memory.py +285 -0
vanna/integrations/local/audit.py +59 -0
vanna/integrations/local/file_system.py +242 -0
vanna/integrations/local/file_system_conversation_store.py +255 -0
vanna/integrations/local/storage.py +62 -0
vanna/integrations/marqo/__init__.py +7 -0
vanna/integrations/marqo/agent_memory.py +354 -0
vanna/integrations/milvus/__init__.py +7 -0
vanna/integrations/milvus/agent_memory.py +458 -0
vanna/integrations/mock/__init__.py +9 -0
vanna/integrations/mock/llm.py +65 -0
vanna/integrations/mssql/__init__.py +5 -0
vanna/integrations/mssql/sql_runner.py +66 -0
vanna/integrations/mysql/__init__.py +5 -0
vanna/integrations/mysql/sql_runner.py +92 -0
vanna/integrations/ollama/__init__.py +7 -0
vanna/integrations/ollama/llm.py +252 -0
vanna/integrations/openai/__init__.py +10 -0
vanna/integrations/openai/llm.py +267 -0
vanna/integrations/openai/responses.py +163 -0
vanna/integrations/opensearch/__init__.py +7 -0
vanna/integrations/opensearch/agent_memory.py +411 -0
vanna/integrations/oracle/__init__.py +5 -0
vanna/integrations/oracle/sql_runner.py +75 -0
vanna/integrations/pinecone/__init__.py +7 -0
vanna/integrations/pinecone/agent_memory.py +329 -0
vanna/integrations/plotly/__init__.py +5 -0
vanna/integrations/plotly/chart_generator.py +313 -0
vanna/integrations/postgres/__init__.py +9 -0
vanna/integrations/postgres/sql_runner.py +112 -0
vanna/integrations/premium/agent_memory/__init__.py +7 -0
vanna/integrations/premium/agent_memory/premium.py +186 -0
vanna/integrations/presto/__init__.py +5 -0
vanna/integrations/presto/sql_runner.py +107 -0
vanna/integrations/qdrant/__init__.py +7 -0
vanna/integrations/qdrant/agent_memory.py +439 -0
vanna/integrations/snowflake/__init__.py +5 -0
vanna/integrations/snowflake/sql_runner.py +147 -0
vanna/integrations/sqlite/__init__.py +9 -0
vanna/integrations/sqlite/sql_runner.py +65 -0
vanna/integrations/weaviate/__init__.py +7 -0
vanna/integrations/weaviate/agent_memory.py +428 -0
vanna/{ZhipuAI → legacy/ZhipuAI}/ZhipuAI_embeddings.py +11 -11
vanna/legacy/__init__.py +403 -0
vanna/legacy/adapter.py +463 -0
vanna/{advanced → legacy/advanced}/__init__.py +3 -1
vanna/{anthropic → legacy/anthropic}/anthropic_chat.py +9 -7
vanna/{azuresearch → legacy/azuresearch}/azuresearch_vector.py +79 -41
vanna/{base → legacy/base}/base.py +224 -217
vanna/legacy/bedrock/__init__.py +1 -0
vanna/{bedrock → legacy/bedrock}/bedrock_converse.py +13 -12
vanna/{chromadb → legacy/chromadb}/chromadb_vector.py +3 -1
vanna/legacy/cohere/__init__.py +2 -0
vanna/{cohere → legacy/cohere}/cohere_chat.py +19 -14
vanna/{cohere → legacy/cohere}/cohere_embeddings.py +25 -19
vanna/{deepseek → legacy/deepseek}/deepseek_chat.py +5 -6
vanna/legacy/faiss/__init__.py +1 -0
vanna/{faiss → legacy/faiss}/faiss.py +113 -59
vanna/{flask → legacy/flask}/__init__.py +84 -43
vanna/{flask → legacy/flask}/assets.py +5 -5
vanna/{flask → legacy/flask}/auth.py +5 -4
vanna/{google → legacy/google}/bigquery_vector.py +75 -42
vanna/{google → legacy/google}/gemini_chat.py +7 -3
vanna/{hf → legacy/hf}/hf.py +0 -1
vanna/{milvus → legacy/milvus}/milvus_vector.py +58 -35
vanna/{mock → legacy/mock}/llm.py +0 -1
vanna/legacy/mock/vectordb.py +67 -0
vanna/legacy/ollama/ollama.py +110 -0
vanna/{openai → legacy/openai}/openai_chat.py +2 -6
vanna/legacy/opensearch/opensearch_vector.py +369 -0
vanna/legacy/opensearch/opensearch_vector_semantic.py +200 -0
vanna/legacy/oracle/oracle_vector.py +584 -0
vanna/{pgvector → legacy/pgvector}/pgvector.py +42 -13
vanna/{qdrant → legacy/qdrant}/qdrant.py +2 -6
vanna/legacy/qianfan/Qianfan_Chat.py +170 -0
vanna/legacy/qianfan/Qianfan_embeddings.py +36 -0
vanna/legacy/qianwen/QianwenAI_chat.py +132 -0
vanna/{remote.py → legacy/remote.py} +28 -26
vanna/{utils.py → legacy/utils.py} +6 -11
vanna/{vannadb → legacy/vannadb}/vannadb_vector.py +115 -46
vanna/{vllm → legacy/vllm}/vllm.py +5 -6
vanna/{weaviate → legacy/weaviate}/weaviate_vector.py +59 -40
vanna/{xinference → legacy/xinference}/xinference.py +6 -6
vanna/py.typed +0 -0
vanna/servers/__init__.py +16 -0
vanna/servers/__main__.py +8 -0
vanna/servers/base/__init__.py +18 -0
vanna/servers/base/chat_handler.py +65 -0
vanna/servers/base/models.py +111 -0
vanna/servers/base/rich_chat_handler.py +141 -0
vanna/servers/base/templates.py +331 -0
vanna/servers/cli/__init__.py +7 -0
vanna/servers/cli/server_runner.py +204 -0
vanna/servers/fastapi/__init__.py +7 -0
vanna/servers/fastapi/app.py +163 -0
vanna/servers/fastapi/routes.py +183 -0
vanna/servers/flask/__init__.py +7 -0
vanna/servers/flask/app.py +132 -0
vanna/servers/flask/routes.py +137 -0
vanna/tools/__init__.py +41 -0
vanna/tools/agent_memory.py +322 -0
vanna/tools/file_system.py +879 -0
vanna/tools/python.py +222 -0
vanna/tools/run_sql.py +165 -0
vanna/tools/visualize_data.py +195 -0
vanna/utils/__init__.py +0 -0
vanna/web_components/__init__.py +44 -0
vanna-2.0.0rc1.dist-info/METADATA +868 -0
vanna-2.0.0rc1.dist-info/RECORD +289 -0
vanna-2.0.0rc1.dist-info/entry_points.txt +3 -0
vanna/bedrock/__init__.py +0 -1
vanna/cohere/__init__.py +0 -2
vanna/faiss/__init__.py +0 -1
vanna/mock/vectordb.py +0 -55
vanna/ollama/ollama.py +0 -103
vanna/opensearch/opensearch_vector.py +0 -392
vanna/opensearch/opensearch_vector_semantic.py +0 -175
vanna/oracle/oracle_vector.py +0 -585
vanna/qianfan/Qianfan_Chat.py +0 -165
vanna/qianfan/Qianfan_embeddings.py +0 -36
vanna/qianwen/QianwenAI_chat.py +0 -133
vanna-0.7.9.dist-info/METADATA +0 -408
vanna-0.7.9.dist-info/RECORD +0 -79
/vanna/{ZhipuAI → legacy/ZhipuAI}/ZhipuAI_Chat.py +0 -0
/vanna/{ZhipuAI → legacy/ZhipuAI}/__init__.py +0 -0
/vanna/{anthropic → legacy/anthropic}/__init__.py +0 -0
/vanna/{azuresearch → legacy/azuresearch}/__init__.py +0 -0
/vanna/{base → legacy/base}/__init__.py +0 -0
/vanna/{chromadb → legacy/chromadb}/__init__.py +0 -0
/vanna/{deepseek → legacy/deepseek}/__init__.py +0 -0
/vanna/{exceptions → legacy/exceptions}/__init__.py +0 -0
/vanna/{google → legacy/google}/__init__.py +0 -0
/vanna/{hf → legacy/hf}/__init__.py +0 -0
/vanna/{local.py → legacy/local.py} +0 -0
/vanna/{marqo → legacy/marqo}/__init__.py +0 -0
/vanna/{marqo → legacy/marqo}/marqo.py +0 -0
/vanna/{milvus → legacy/milvus}/__init__.py +0 -0
/vanna/{mistral → legacy/mistral}/__init__.py +0 -0
/vanna/{mistral → legacy/mistral}/mistral.py +0 -0
/vanna/{mock → legacy/mock}/__init__.py +0 -0
/vanna/{mock → legacy/mock}/embedding.py +0 -0
/vanna/{ollama → legacy/ollama}/__init__.py +0 -0
/vanna/{openai → legacy/openai}/__init__.py +0 -0
/vanna/{openai → legacy/openai}/openai_embeddings.py +0 -0
/vanna/{opensearch → legacy/opensearch}/__init__.py +0 -0
/vanna/{oracle → legacy/oracle}/__init__.py +0 -0
/vanna/{pgvector → legacy/pgvector}/__init__.py +0 -0
/vanna/{pinecone → legacy/pinecone}/__init__.py +0 -0
/vanna/{pinecone → legacy/pinecone}/pinecone_vector.py +0 -0
/vanna/{qdrant → legacy/qdrant}/__init__.py +0 -0
/vanna/{qianfan → legacy/qianfan}/__init__.py +0 -0
/vanna/{qianwen → legacy/qianwen}/QianwenAI_embeddings.py +0 -0
/vanna/{qianwen → legacy/qianwen}/__init__.py +0 -0
/vanna/{types → legacy/types}/__init__.py +0 -0
/vanna/{vannadb → legacy/vannadb}/__init__.py +0 -0
/vanna/{vllm → legacy/vllm}/__init__.py +0 -0
/vanna/{weaviate → legacy/weaviate}/__init__.py +0 -0
/vanna/{xinference → legacy/xinference}/__init__.py +0 -0
{vanna-0.7.9.dist-info → vanna-2.0.0rc1.dist-info}/WHEEL +0 -0
{vanna-0.7.9.dist-info → vanna-2.0.0rc1.dist-info}/licenses/LICENSE +0 -0

vanna/core/evaluation/runner.py ADDED Viewed

@@ -0,0 +1,313 @@
+"""
+Evaluation runner with parallel execution support.
+This module provides the EvaluationRunner class that executes test cases
+against agents with configurable parallelism for efficient evaluation,
+especially when comparing multiple LLMs or model versions.
+"""
+import asyncio
+from typing import Any, List, Dict, Optional, AsyncGenerator, TYPE_CHECKING
+from datetime import datetime
+from .base import (
+    TestCase,
+    AgentResult,
+    TestCaseResult,
+    AgentVariant,
+    Evaluator,
+)
+from vanna.core import UiComponent
+from vanna.core.user.request_context import RequestContext
+from vanna.core.observability import ObservabilityProvider
+if TYPE_CHECKING:
+    from vanna import Agent
+    from .report import EvaluationReport, ComparisonReport
+class EvaluationRunner:
+    """Run evaluations with parallel execution support.
+    The primary use case is comparing multiple agent variants (e.g., different LLMs)
+    on the same set of test cases. The runner executes test cases in parallel with
+    configurable concurrency to handle I/O-bound LLM operations efficiently.
+    Example:
+        >>> runner = EvaluationRunner(
+        ...     evaluators=[TrajectoryEvaluator(), OutputEvaluator()],
+        ...     max_concurrency=20
+        ... )
+        >>> comparison = await runner.compare_agents(
+        ...     agent_variants=[claude_variant, gpt_variant],
+        ...     test_cases=dataset.test_cases
+        ... )
+    """
+    def __init__(
+        self,
+        evaluators: List[Evaluator],
+        max_concurrency: int = 10,
+        observability_provider: Optional[ObservabilityProvider] = None,
+    ):
+        """Initialize the evaluation runner.
+        Args:
+            evaluators: Evaluators applied, in order, to every agent result.
+            max_concurrency: Upper bound on test cases executing at once
+                through this runner instance. Must be at least 1.
+            observability_provider: Optional provider used to open and close
+                spans around comparison and variant runs.
+        Raises:
+            ValueError: If ``max_concurrency`` is less than 1.
+        """
+        # A zero-permit semaphore would make every test case wait forever,
+        # so reject it up front instead of hanging at run time.
+        if max_concurrency < 1:
+            raise ValueError(
+                f"max_concurrency must be at least 1, got {max_concurrency}"
+            )
+        self.evaluators = evaluators
+        self.max_concurrency = max_concurrency
+        self.observability = observability_provider
+        # One semaphore per runner: it is shared by every test case the
+        # runner executes, regardless of which agent the case belongs to.
+        self._semaphore = asyncio.Semaphore(max_concurrency)
+    async def run_evaluation(
+        self,
+        agent: "Agent",
+        test_cases: List[TestCase],
+    ) -> "EvaluationReport":
+        """Evaluate one agent against a list of test cases.
+        Args:
+            agent: Agent under evaluation.
+            test_cases: Test cases to execute against the agent.
+        Returns:
+            An EvaluationReport holding the result of every test case,
+            labelled with the fixed agent name ``"agent"``.
+        """
+        # Imported at call time; at module level the report classes are only
+        # imported under TYPE_CHECKING.
+        from .report import EvaluationReport
+        case_results = await self._run_test_cases_parallel(agent, test_cases)
+        report = EvaluationReport(
+            agent_name="agent",
+            results=case_results,
+            evaluators=self.evaluators,
+            timestamp=datetime.now(),
+        )
+        return report
+    async def compare_agents(
+        self,
+        agent_variants: List[AgentVariant],
+        test_cases: List[TestCase],
+    ) -> "ComparisonReport":
+        """Compare multiple agent variants on the same test cases.
+        All variants are started together with ``asyncio.gather``; the number
+        of test cases executing at once is still bounded by the runner's
+        semaphore.
+        Args:
+            agent_variants: Agent variants to compare.
+            test_cases: Test cases to run on every variant.
+        Returns:
+            ComparisonReport whose ``reports`` mapping is keyed by variant
+            name. Variants that share a name overwrite one another there.
+        Raises:
+            Exception: Anything raised by a variant run is propagated; the
+                comparison span, if one was opened, is still closed first.
+        """
+        from .report import ComparisonReport
+        observability = self.observability
+        span = None
+        # Open a span covering the whole comparison.
+        if observability:
+            span = await observability.create_span(
+                "agent_comparison",
+                attributes={
+                    "num_variants": len(agent_variants),
+                    "num_test_cases": len(test_cases),
+                },
+            )
+        try:
+            # Run all variants concurrently; gather keeps input order, so the
+            # reports line up with agent_variants.
+            variant_reports = await asyncio.gather(
+                *(
+                    self._run_agent_variant(variant, test_cases)
+                    for variant in agent_variants
+                )
+            )
+        finally:
+            # Close the span even when a variant run fails, so a failed
+            # comparison does not leave a span open.
+            if observability:
+                await observability.end_span(span)
+        return ComparisonReport(
+            variants=agent_variants,
+            reports={
+                variant.name: report
+                for variant, report in zip(agent_variants, variant_reports)
+            },
+            test_cases=test_cases,
+            timestamp=datetime.now(),
+        )
+    async def compare_agents_streaming(
+        self,
+        agent_variants: List[AgentVariant],
+        test_cases: List[TestCase],
+    ) -> AsyncGenerator[tuple[str, TestCaseResult, int, int], None]:
+        """Stream comparison results as individual test cases complete.
+        One task is started per (variant, test case) pair and each result is
+        yielded as soon as its task finishes, so consumers see progress
+        during the run rather than one batch per variant at the end.
+        Concurrency is still bounded by the runner's semaphore.
+        Args:
+            agent_variants: Agent variants to compare.
+            test_cases: Test cases to run on every variant.
+        Yields:
+            Tuples of (variant_name, result, completed_count, total_count),
+            in completion order.
+        Raises:
+            Exception: Anything raised while running a test case is
+                propagated to the consumer; remaining tasks are cancelled.
+        """
+        async def run_case(
+            variant: AgentVariant, test_case: TestCase
+        ) -> tuple[str, TestCaseResult]:
+            """Run one test case and tag the result with its variant name."""
+            result = await self._run_single_test_case(variant.agent, test_case)
+            return variant.name, result
+        tasks = [
+            asyncio.create_task(run_case(variant, test_case))
+            for variant in agent_variants
+            for test_case in test_cases
+        ]
+        total = len(tasks)
+        completed = 0
+        try:
+            for finished in asyncio.as_completed(tasks):
+                # Awaiting re-raises a task's exception here instead of
+                # leaving the consumer waiting on a result that never comes.
+                variant_name, result = await finished
+                completed += 1
+                yield variant_name, result, completed, total
+        finally:
+            # Reached on normal exhaustion, on error, and when the consumer
+            # closes the generator early: stop whatever is still running and
+            # collect every task so no exception goes unretrieved.
+            for task in tasks:
+                if not task.done():
+                    task.cancel()
+            if tasks:
+                await asyncio.gather(*tasks, return_exceptions=True)
+    async def _run_agent_variant(
+        self,
+        variant: AgentVariant,
+        test_cases: List[TestCase],
+    ) -> "EvaluationReport":
+        """Run a single agent variant on all test cases.
+        Args:
+            variant: The agent variant to evaluate.
+            test_cases: Test cases to run against ``variant.agent``.
+        Returns:
+            EvaluationReport named after the variant and carrying its
+            metadata.
+        Raises:
+            Exception: Anything raised while running the test cases is
+                propagated; the variant span, if one was opened, is still
+                closed first.
+        """
+        from .report import EvaluationReport
+        observability = self.observability
+        span = None
+        if observability:
+            span = await observability.create_span(
+                f"variant_{variant.name}",
+                attributes={
+                    "variant": variant.name,
+                    "num_test_cases": len(test_cases),
+                    # Variant metadata is merged last, so its keys win over
+                    # the two attributes above on a name clash.
+                    **variant.metadata,
+                },
+            )
+        try:
+            results = await self._run_test_cases_parallel(variant.agent, test_cases)
+        finally:
+            # Close the span even if the run fails.
+            if observability:
+                await observability.end_span(span)
+        return EvaluationReport(
+            agent_name=variant.name,
+            results=results,
+            evaluators=self.evaluators,
+            metadata=variant.metadata,
+            timestamp=datetime.now(),
+        )
+    async def _run_test_cases_parallel(
+        self,
+        agent: "Agent",
+        test_cases: List[TestCase],
+    ) -> List[TestCaseResult]:
+        """Execute every test case concurrently against one agent.
+        The concurrency limit is not applied here; each scheduled coroutine
+        acquires the runner's semaphore itself.
+        Args:
+            agent: Agent that receives each test case.
+            test_cases: Test cases to execute.
+        Returns:
+            One TestCaseResult per test case, in the order of ``test_cases``.
+        """
+        pending = (
+            self._run_single_test_case(agent, case) for case in test_cases
+        )
+        return await asyncio.gather(*pending)
+    async def _run_single_test_case(
+        self,
+        agent: "Agent",
+        test_case: TestCase,
+    ) -> TestCaseResult:
+        """Run one test case while holding a slot of the runner's semaphore.
+        Args:
+            agent: The agent to execute.
+            test_case: The test case to run.
+        Returns:
+            TestCaseResult with the agent result, one evaluation per
+            configured evaluator, and the agent execution time in
+            milliseconds.
+        """
+        async with self._semaphore:
+            # Timing starts after the semaphore is acquired, so time spent
+            # queueing for a slot is not counted; evaluator time is excluded
+            # as well.
+            loop = asyncio.get_running_loop()
+            started = loop.time()
+            agent_result = await self._execute_agent(agent, test_case)
+            elapsed_ms = (loop.time() - started) * 1000
+            # Evaluators run one after another, in the configured order.
+            evaluations = [
+                await evaluator.evaluate(test_case, agent_result)
+                for evaluator in self.evaluators
+            ]
+            return TestCaseResult(
+                test_case=test_case,
+                agent_result=agent_result,
+                evaluations=evaluations,
+                execution_time_ms=elapsed_ms,
+            )
+    async def _execute_agent(
+        self,
+        agent: "Agent",
+        test_case: TestCase,
+    ) -> AgentResult:
+        """Send the test case's message to the agent and collect its output.
+        Exceptions raised by the agent are not propagated; they are recorded
+        on the returned result so one failing case does not abort the run.
+        Args:
+            agent: The agent to execute.
+            test_case: The test case to run.
+        Returns:
+            AgentResult with the components emitted before completion or
+            failure and, on failure, a non-empty ``error`` string.
+            ``tool_calls`` and ``llm_requests`` are currently always empty.
+        """
+        components: List[UiComponent] = []
+        tool_calls: List[Dict[str, Any]] = []
+        error: Optional[str] = None
+        try:
+            # Create request context with user info from the test case so the
+            # agent's UserResolver can resolve the intended user.
+            request_context = RequestContext(
+                cookies={"user_id": test_case.user.id},
+                headers={},
+                metadata={"test_case_user": test_case.user},
+            )
+            async for component in agent.send_message(
+                request_context=request_context,
+                message=test_case.message,
+                conversation_id=test_case.conversation_id,
+            ):
+                components.append(component)
+        except Exception as e:
+            # Some exceptions carry no message, so str(e) is "". Fall back to
+            # repr(e) so a failure is never recorded as an empty (falsy)
+            # error string.
+            error = str(e) or repr(e)
+        # TODO: Extract tool calls and LLM requests from observability
+        # For now, these will be empty unless we hook into observability
+        return AgentResult(
+            test_case_id=test_case.id,
+            components=components,
+            tool_calls=tool_calls,
+            llm_requests=[],
+            error=error,
+        )

vanna/core/filter/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+"""
+Conversation filtering system for managing conversation history.
+This module provides interfaces for filtering and transforming conversation
+history before it's sent to the LLM.
+"""
+from .base import ConversationFilter
+__all__ = ["ConversationFilter"]

vanna/core/filter/base.py ADDED Viewed

@@ -0,0 +1,67 @@
+"""
+Base conversation filter interface.
+Conversation filters allow you to transform conversation history before
+it's sent to the LLM for processing.
+"""
+from abc import ABC
+from typing import TYPE_CHECKING, List
+if TYPE_CHECKING:
+    from ..storage import Message
+class ConversationFilter(ABC):
+    """Base class for transforming conversation history.
+    The default implementation is a pass-through. Override
+    ``filter_messages`` in a subclass to, for example:
+    - Remove sensitive information
+    - Summarize long conversations
+    - Manage context window limits
+    - Deduplicate similar messages
+    - Prioritize recent or relevant messages
+    Example:
+        class ContextWindowFilter(ConversationFilter):
+            def __init__(self, max_tokens: int = 8000):
+                self.max_tokens = max_tokens
+            async def filter_messages(self, messages: List[Message]) -> List[Message]:
+                # Estimate tokens (rough approximation: 4 characters each)
+                total_tokens = 0
+                filtered = []
+                # Walk newest-to-oldest, keeping messages until the budget
+                # would be exceeded
+                for msg in reversed(messages):
+                    msg_tokens = len(msg.content or "") // 4
+                    if total_tokens + msg_tokens > self.max_tokens:
+                        break
+                    filtered.insert(0, msg)
+                    total_tokens += msg_tokens
+                return filtered
+        agent = AgentRunner(
+            llm_service=...,
+            conversation_filters=[
+                SensitiveDataFilter(),
+                ContextWindowFilter(max_tokens=8000)
+            ]
+        )
+    """
+    async def filter_messages(self, messages: List["Message"]) -> List["Message"]:
+        """Return the messages that should be kept, possibly transformed.
+        Args:
+            messages: Conversation messages to filter.
+        Returns:
+            The filtered list. This base implementation returns ``messages``
+            unchanged (the same list object).
+        Note:
+            Filters are applied in order, so a later filter may receive
+            messages that an earlier filter has already modified.
+        """
+        return messages

vanna/core/lifecycle/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+"""
+Lifecycle hook system for agent execution.
+This module provides hooks for intercepting and modifying agent behavior
+at various points in the execution lifecycle.
+"""
+from .base import LifecycleHook
+__all__ = ["LifecycleHook"]

vanna/core/lifecycle/base.py ADDED Viewed

@@ -0,0 +1,83 @@
+"""
+Base lifecycle hook interface.
+Lifecycle hooks allow you to intercept and customize agent behavior
+at key points in the execution flow.
+"""
+from abc import ABC
+from typing import TYPE_CHECKING, Any, Optional
+if TYPE_CHECKING:
+    from ..user.models import User
+    from ..tool import Tool
+    from ..tool.models import ToolContext, ToolResult
+class LifecycleHook(ABC):
+    """Base class for hooks into the agent execution lifecycle.
+    Every method has a no-op default, so a subclass overrides only the
+    points it needs. Typical uses:
+    - Modify messages before processing
+    - Add logging or telemetry
+    - Enforce quotas or rate limits
+    - Transform tool results
+    - Add custom validation
+    Example:
+        class LoggingHook(LifecycleHook):
+            async def before_message(self, user: User, message: str) -> Optional[str]:
+                print(f"User {user.username} sent: {message}")
+                return None  # Don't modify
+        agent = AgentRunner(
+            llm_service=...,
+            lifecycle_hooks=[LoggingHook(), QuotaCheckHook()]
+        )
+    """
+    async def before_message(self, user: "User", message: str) -> Optional[str]:
+        """Run before a user message is processed.
+        Args:
+            user: User sending the message.
+            message: Original message content.
+        Returns:
+            A replacement message string, or None to keep the original.
+            The default returns None.
+        Raises:
+            AgentError: To halt message processing (e.g., quota exceeded).
+        """
+        return None
+    async def after_message(self, result: Any) -> None:
+        """Run after a message has been fully processed.
+        Args:
+            result: Final result from message processing.
+        """
+        return None
+    async def before_tool(self, tool: "Tool[Any]", context: "ToolContext") -> None:
+        """Run before a tool is executed.
+        Args:
+            tool: Tool about to be executed.
+            context: Tool execution context.
+        Raises:
+            AgentError: To prevent tool execution.
+        """
+        return None
+    async def after_tool(self, result: "ToolResult") -> Optional["ToolResult"]:
+        """Run after a tool has been executed.
+        Args:
+            result: Result from tool execution.
+        Returns:
+            A replacement ToolResult, or None to keep the original.
+            The default returns None.
+        """
+        return None

vanna/core/llm/__init__.py ADDED Viewed

@@ -0,0 +1,16 @@
+"""
+LLM domain.
+This module provides the core abstractions for LLM services in the Vanna Agents framework.
+"""
+from .base import LlmService
+from .models import LlmMessage, LlmRequest, LlmResponse, LlmStreamChunk
+__all__ = [
+    "LlmService",
+    "LlmMessage",
+    "LlmRequest",
+    "LlmResponse",
+    "LlmStreamChunk",
+]

vanna/core/llm/base.py ADDED Viewed

@@ -0,0 +1,40 @@
+"""
+LLM domain interface.
+This module contains the abstract base class for LLM services.
+"""
+from abc import ABC, abstractmethod
+from typing import Any, AsyncGenerator, List
+from .models import LlmRequest, LlmResponse, LlmStreamChunk
+class LlmService(ABC):
+    """Abstract base class for LLM communication services.
+    All three methods are abstract; a concrete service must implement each.
+    """
+    @abstractmethod
+    async def send_request(self, request: LlmRequest) -> LlmResponse:
+        """Send a request to the LLM and return its response."""
+        ...
+    @abstractmethod
+    async def stream_request(
+        self, request: LlmRequest
+    ) -> AsyncGenerator[LlmStreamChunk, None]:
+        """Stream a request to the LLM.
+        Args:
+            request: The LLM request to stream.
+        Yields:
+            LlmStreamChunk instances as they arrive.
+        """
+        # The unreachable ``yield`` below is what makes this function an
+        # async generator, matching the shape implementations must have.
+        raise NotImplementedError
+        yield  # pragma: no cover - makes this an async generator
+    @abstractmethod
+    async def validate_tools(self, tools: List[Any]) -> List[str]:
+        """Validate tool schemas and return any errors found."""
+        ...

vanna/core/llm/models.py ADDED Viewed

@@ -0,0 +1,61 @@
+"""
+LLM domain models.
+This module contains data models for LLM communication.
+"""
+from typing import Any, Dict, List, Optional
+from pydantic import BaseModel, Field
+from ..tool.models import ToolCall
+from ..user.models import User
+class LlmMessage(BaseModel):
+    """Message format for LLM communication."""
+    # Role and text of the message; neither has a default, so both must be
+    # supplied.
+    role: str = Field(description="Message role")
+    content: str = Field(description="Message content")
+    # Optional tool-call data; both default to None.
+    tool_calls: Optional[List[ToolCall]] = Field(default=None)
+    # NOTE(review): presumably the id of the tool call this message answers
+    # - confirm against callers.
+    tool_call_id: Optional[str] = Field(default=None)
+class LlmRequest(BaseModel):
+    """Request to LLM service."""
+    # Required: the messages that make up the request.
+    messages: List[LlmMessage] = Field(description="Messages to send")
+    # Typed as Any rather than the tool schema type to avoid a circular
+    # import (see the trailing comment below).
+    tools: Optional[List[Any]] = Field(
+        default=None, description="Available tools"
+    )  # Will be ToolSchema but avoiding circular import
+    # Required: the user on whose behalf the request is made.
+    user: User = Field(description="User making the request")
+    stream: bool = Field(default=False, description="Whether to stream response")
+    # Validated to lie in [0.0, 2.0]; defaults to 0.7.
+    temperature: float = Field(default=0.7, ge=0.0, le=2.0)
+    # When given, must be strictly positive; None leaves it unset.
+    max_tokens: Optional[int] = Field(default=None, gt=0)
+    system_prompt: Optional[str] = Field(
+        default=None, description="System prompt for the LLM"
+    )
+    # Free-form extra data; default_factory gives each request its own dict.
+    metadata: Dict[str, Any] = Field(default_factory=dict)
+class LlmResponse(BaseModel):
+    """Response returned by an LLM service."""
+    # Every field is optional; metadata defaults to a fresh empty dict.
+    content: Optional[str] = None
+    tool_calls: Optional[List[ToolCall]] = None
+    finish_reason: Optional[str] = None
+    usage: Optional[Dict[str, int]] = None
+    metadata: Dict[str, Any] = Field(default_factory=dict)
+    def is_tool_call(self) -> bool:
+        """Return True when the response carries at least one tool call."""
+        # None and an empty list are both falsy, so one truthiness check
+        # covers "missing" and "present but empty".
+        return bool(self.tool_calls)
+class LlmStreamChunk(BaseModel):
+    """Streaming chunk from LLM."""
+    # Every field is optional, so a chunk may carry any subset of them.
+    content: Optional[str] = None
+    tool_calls: Optional[List[ToolCall]] = None
+    finish_reason: Optional[str] = None
+    # Free-form extra data; default_factory gives each chunk its own dict.
+    metadata: Dict[str, Any] = Field(default_factory=dict)

vanna/core/middleware/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+"""
+Middleware system for LLM request/response interception.
+This module provides middleware interfaces for intercepting and transforming
+LLM requests and responses.
+"""
+from .base import LlmMiddleware
+__all__ = ["LlmMiddleware"]

vanna/core/middleware/base.py ADDED Viewed

@@ -0,0 +1,69 @@
+"""
+Base LLM middleware interface.
+Middleware allows you to intercept and transform LLM requests and responses
+for caching, monitoring, content filtering, and more.
+"""
+from abc import ABC
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from ..llm import LlmRequest, LlmResponse
+class LlmMiddleware(ABC):
+    """Base class for intercepting LLM requests and responses.
+    Both hooks default to returning their input unchanged, so a subclass
+    overrides only what it needs. Typical uses:
+    - Cache LLM responses
+    - Log requests/responses
+    - Filter or modify content
+    - Track costs and usage
+    - Implement fallback strategies
+    Example:
+        class CachingMiddleware(LlmMiddleware):
+            def __init__(self):
+                self.cache = {}
+            async def before_llm_request(self, request: LlmRequest) -> LlmRequest:
+                # Could check cache here
+                return request
+            async def after_llm_response(self, request: LlmRequest, response: LlmResponse) -> LlmResponse:
+                # Cache the response
+                cache_key = self._compute_key(request)
+                self.cache[cache_key] = response
+                return response
+        agent = AgentRunner(
+            llm_service=...,
+            llm_middlewares=[CachingMiddleware(), LoggingMiddleware()]
+        )
+    """
+    async def before_llm_request(self, request: "LlmRequest") -> "LlmRequest":
+        """Run before a request is sent to the LLM.
+        Args:
+            request: The LLM request about to be sent.
+        Returns:
+            The request to send. The default returns ``request`` unchanged.
+        """
+        return request
+    async def after_llm_response(
+        self, request: "LlmRequest", response: "LlmResponse"
+    ) -> "LlmResponse":
+        """Run after a response is received from the LLM.
+        Args:
+            request: The original request.
+            response: The LLM response.
+        Returns:
+            The response to hand back. The default returns ``response``
+            unchanged.
+        """
+        return response

vanna/core/observability/__init__.py ADDED Viewed

@@ -0,0 +1,11 @@
+"""
+Observability system for telemetry and monitoring.
+This module provides interfaces for collecting metrics, traces, and
+monitoring agent behavior.
+"""
+from .base import ObservabilityProvider
+from .models import Span, Metric
+__all__ = ["ObservabilityProvider", "Span", "Metric"]

vanna 0.7.9__py3-none-any.whl → 2.0.0rc1__py3-none-any.whl

vanna-0.7.9-py3-none-any.whl → vanna-2.0.0rc1-py3-none-any.whl