dao-ai 0.0.28__py3-none-any.whl → 0.1.2__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to their public registry. It is provided for informational purposes only.
Files changed (63)
  1. dao_ai/__init__.py +29 -0
  2. dao_ai/agent_as_code.py +2 -5
  3. dao_ai/cli.py +245 -40
  4. dao_ai/config.py +1491 -370
  5. dao_ai/genie/__init__.py +38 -0
  6. dao_ai/genie/cache/__init__.py +43 -0
  7. dao_ai/genie/cache/base.py +72 -0
  8. dao_ai/genie/cache/core.py +79 -0
  9. dao_ai/genie/cache/lru.py +347 -0
  10. dao_ai/genie/cache/semantic.py +970 -0
  11. dao_ai/genie/core.py +35 -0
  12. dao_ai/graph.py +27 -253
  13. dao_ai/hooks/__init__.py +9 -6
  14. dao_ai/hooks/core.py +27 -195
  15. dao_ai/logging.py +56 -0
  16. dao_ai/memory/__init__.py +10 -0
  17. dao_ai/memory/core.py +65 -30
  18. dao_ai/memory/databricks.py +402 -0
  19. dao_ai/memory/postgres.py +79 -38
  20. dao_ai/messages.py +6 -4
  21. dao_ai/middleware/__init__.py +125 -0
  22. dao_ai/middleware/assertions.py +806 -0
  23. dao_ai/middleware/base.py +50 -0
  24. dao_ai/middleware/core.py +67 -0
  25. dao_ai/middleware/guardrails.py +420 -0
  26. dao_ai/middleware/human_in_the_loop.py +232 -0
  27. dao_ai/middleware/message_validation.py +586 -0
  28. dao_ai/middleware/summarization.py +197 -0
  29. dao_ai/models.py +1306 -114
  30. dao_ai/nodes.py +245 -159
  31. dao_ai/optimization.py +674 -0
  32. dao_ai/orchestration/__init__.py +52 -0
  33. dao_ai/orchestration/core.py +294 -0
  34. dao_ai/orchestration/supervisor.py +278 -0
  35. dao_ai/orchestration/swarm.py +271 -0
  36. dao_ai/prompts.py +128 -31
  37. dao_ai/providers/databricks.py +573 -601
  38. dao_ai/state.py +157 -21
  39. dao_ai/tools/__init__.py +13 -5
  40. dao_ai/tools/agent.py +1 -3
  41. dao_ai/tools/core.py +64 -11
  42. dao_ai/tools/email.py +232 -0
  43. dao_ai/tools/genie.py +144 -294
  44. dao_ai/tools/mcp.py +223 -155
  45. dao_ai/tools/memory.py +50 -0
  46. dao_ai/tools/python.py +9 -14
  47. dao_ai/tools/search.py +14 -0
  48. dao_ai/tools/slack.py +22 -10
  49. dao_ai/tools/sql.py +202 -0
  50. dao_ai/tools/time.py +30 -7
  51. dao_ai/tools/unity_catalog.py +165 -88
  52. dao_ai/tools/vector_search.py +331 -221
  53. dao_ai/utils.py +166 -20
  54. dao_ai-0.1.2.dist-info/METADATA +455 -0
  55. dao_ai-0.1.2.dist-info/RECORD +64 -0
  56. dao_ai/chat_models.py +0 -204
  57. dao_ai/guardrails.py +0 -112
  58. dao_ai/tools/human_in_the_loop.py +0 -100
  59. dao_ai-0.0.28.dist-info/METADATA +0 -1168
  60. dao_ai-0.0.28.dist-info/RECORD +0 -41
  61. {dao_ai-0.0.28.dist-info → dao_ai-0.1.2.dist-info}/WHEEL +0 -0
  62. {dao_ai-0.0.28.dist-info → dao_ai-0.1.2.dist-info}/entry_points.txt +0 -0
  63. {dao_ai-0.0.28.dist-info → dao_ai-0.1.2.dist-info}/licenses/LICENSE +0 -0
dao_ai/tools/genie.py CHANGED
@@ -1,284 +1,73 @@
- import bisect
+ """
+ Genie tool for natural language queries to databases.
+
+ This module provides the tool factory for creating LangGraph tools that
+ interact with Databricks Genie.
+
+ For the core Genie service and cache implementations, see:
+ - dao_ai.genie: GenieService, GenieServiceBase
+ - dao_ai.genie.cache: LRUCacheService, SemanticCacheService
+ """
+
  import json
  import os
- import time
- from dataclasses import asdict, dataclass
- from datetime import datetime
  from textwrap import dedent
- from typing import Annotated, Any, Callable, Optional, Union
+ from typing import Annotated, Any, Callable

- import mlflow
  import pandas as pd
- from databricks.sdk import WorkspaceClient
+ from databricks_ai_bridge.genie import Genie, GenieResponse
+ from langchain.tools import ToolRuntime, tool
  from langchain_core.messages import ToolMessage
- from langchain_core.tools import InjectedToolCallId, tool
- from langgraph.prebuilt import InjectedState
  from langgraph.types import Command
  from loguru import logger
- from pydantic import BaseModel, Field
-
- from dao_ai.config import AnyVariable, CompositeVariableModel, GenieRoomModel, value_of
-
- MAX_TOKENS_OF_DATA: int = 20000
- MAX_ITERATIONS: int = 50
- DEFAULT_POLLING_INTERVAL_SECS: int = 2
-
+ from pydantic import BaseModel

- def _count_tokens(text):
-     import tiktoken
-
-     encoding = tiktoken.encoding_for_model("gpt-4o")
-     return len(encoding.encode(text))
-
-
- @dataclass
- class GenieResponse:
-     conversation_id: str
-     result: Union[str, pd.DataFrame]
-     query: Optional[str] = ""
-     description: Optional[str] = ""
-
-     def to_json(self):
-         return json.dumps(asdict(self))
+ from dao_ai.config import (
+     AnyVariable,
+     CompositeVariableModel,
+     GenieLRUCacheParametersModel,
+     GenieRoomModel,
+     GenieSemanticCacheParametersModel,
+     value_of,
+ )
+ from dao_ai.genie import GenieService, GenieServiceBase
+ from dao_ai.genie.cache import CacheResult, LRUCacheService, SemanticCacheService
+ from dao_ai.state import AgentState, Context, SessionState


  class GenieToolInput(BaseModel):
-     """Input schema for the Genie tool."""
-
-     question: str = Field(
-         description="The question to ask Genie about your data. Ask simple, clear questions about your tabular data. For complex analysis, ask multiple simple questions rather than one complex question."
-     )
+     """Input schema for Genie tool - only includes user-facing parameters."""

+     question: str

- def _truncate_result(dataframe: pd.DataFrame) -> str:
-     query_result = dataframe.to_markdown()
-     tokens_used = _count_tokens(query_result)
-
-     # If the full result fits, return it
-     if tokens_used <= MAX_TOKENS_OF_DATA:
-         return query_result.strip()
-
-     def is_too_big(n):
-         return _count_tokens(dataframe.iloc[:n].to_markdown()) > MAX_TOKENS_OF_DATA
-
-     # Use bisect_left to find the cutoff point of rows within the max token data limit in a O(log n) complexity
-     # Passing True, as this is the target value we are looking for when _is_too_big returns
-     cutoff = bisect.bisect_left(range(len(dataframe) + 1), True, key=is_too_big)
-
-     # Slice to the found limit
-     truncated_df = dataframe.iloc[:cutoff]
-
-     # Edge case: Cannot return any rows because of tokens so return an empty string
-     if len(truncated_df) == 0:
-         return ""
-
-     truncated_result = truncated_df.to_markdown()
-
-     # Double-check edge case if we overshot by one
-     if _count_tokens(truncated_result) > MAX_TOKENS_OF_DATA:
-         truncated_result = truncated_df.iloc[:-1].to_markdown()
-     return truncated_result
-
-
- @mlflow.trace(span_type="PARSER")
- def _parse_query_result(resp, truncate_results) -> Union[str, pd.DataFrame]:
-     output = resp["result"]
-     if not output:
-         return "EMPTY"
-
-     columns = resp["manifest"]["schema"]["columns"]
-     header = [str(col["name"]) for col in columns]
-     rows = []
-
-     for item in output["data_array"]:
-         row = []
-         for column, value in zip(columns, item):
-             type_name = column["type_name"]
-             if value is None:
-                 row.append(None)
-                 continue
-
-             if type_name in ["INT", "LONG", "SHORT", "BYTE"]:
-                 row.append(int(value))
-             elif type_name in ["FLOAT", "DOUBLE", "DECIMAL"]:
-                 row.append(float(value))
-             elif type_name == "BOOLEAN":
-                 row.append(value.lower() == "true")
-             elif type_name == "DATE" or type_name == "TIMESTAMP":
-                 row.append(datetime.strptime(value[:10], "%Y-%m-%d").date())
-             elif type_name == "BINARY":
-                 row.append(bytes(value, "utf-8"))
-             else:
-                 row.append(value)
-
-         rows.append(row)
-
-     dataframe = pd.DataFrame(rows, columns=header)
-
-     if truncate_results:
-         query_result = _truncate_result(dataframe)
-     else:
-         query_result = dataframe.to_markdown()
-
-     return query_result.strip()
-
-
- class Genie:
-     def __init__(
-         self,
-         space_id,
-         client: WorkspaceClient | None = None,
-         truncate_results: bool = False,
-         polling_interval: int = DEFAULT_POLLING_INTERVAL_SECS,
-     ):
-         self.space_id = space_id
-         workspace_client = client or WorkspaceClient()
-         self.genie = workspace_client.genie
-         self.description = self.genie.get_space(space_id).description
-         self.headers = {
-             "Accept": "application/json",
-             "Content-Type": "application/json",
-         }
-         self.truncate_results = truncate_results
-         if polling_interval < 1 or polling_interval > 30:
-             raise ValueError("poll_interval must be between 1 and 30 seconds")
-         self.poll_interval = polling_interval
-
-     @mlflow.trace()
-     def start_conversation(self, content):
-         resp = self.genie._api.do(
-             "POST",
-             f"/api/2.0/genie/spaces/{self.space_id}/start-conversation",
-             body={"content": content},
-             headers=self.headers,
-         )
-         return resp
-
-     @mlflow.trace()
-     def create_message(self, conversation_id, content):
-         resp = self.genie._api.do(
-             "POST",
-             f"/api/2.0/genie/spaces/{self.space_id}/conversations/{conversation_id}/messages",
-             body={"content": content},
-             headers=self.headers,
-         )
-         return resp
-
-     @mlflow.trace()
-     def poll_for_result(self, conversation_id, message_id):
-         @mlflow.trace()
-         def poll_query_results(attachment_id, query_str, description):
-             iteration_count = 0
-             while iteration_count < MAX_ITERATIONS:
-                 iteration_count += 1
-                 resp = self.genie._api.do(
-                     "GET",
-                     f"/api/2.0/genie/spaces/{self.space_id}/conversations/{conversation_id}/messages/{message_id}/attachments/{attachment_id}/query-result",
-                     headers=self.headers,
-                 )["statement_response"]
-                 state = resp["status"]["state"]
-                 if state == "SUCCEEDED":
-                     result = _parse_query_result(resp, self.truncate_results)
-                     return GenieResponse(
-                         conversation_id, result, query_str, description
-                     )
-                 elif state in ["RUNNING", "PENDING"]:
-                     logger.debug("Waiting for query result...")
-                     time.sleep(self.poll_interval)
-                 else:
-                     return GenieResponse(
-                         conversation_id,
-                         f"No query result: {resp['state']}",
-                         query_str,
-                         description,
-                     )
-             return GenieResponse(
-                 conversation_id,
-                 f"Genie query for result timed out after {MAX_ITERATIONS} iterations of {self.poll_interval} seconds",
-                 query_str,
-                 description,
-             )

-         @mlflow.trace()
-         def poll_result():
-             iteration_count = 0
-             while iteration_count < MAX_ITERATIONS:
-                 iteration_count += 1
-                 resp = self.genie._api.do(
-                     "GET",
-                     f"/api/2.0/genie/spaces/{self.space_id}/conversations/{conversation_id}/messages/{message_id}",
-                     headers=self.headers,
-                 )
-                 if resp["status"] == "COMPLETED":
-                     # Check if attachments key exists in response
-                     attachments = resp.get("attachments", [])
-                     if not attachments:
-                         # Handle case where response has no attachments
-                         return GenieResponse(
-                             conversation_id,
-                             result=f"Genie query completed but no attachments found. Response: {resp}",
-                         )
-
-                     attachment = next((r for r in attachments if "query" in r), None)
-                     if attachment:
-                         query_obj = attachment["query"]
-                         description = query_obj.get("description", "")
-                         query_str = query_obj.get("query", "")
-                         attachment_id = attachment["attachment_id"]
-                         return poll_query_results(attachment_id, query_str, description)
-                     if resp["status"] == "COMPLETED":
-                         text_content = next(
-                             (r for r in attachments if "text" in r), None
-                         )
-                         if text_content:
-                             return GenieResponse(
-                                 conversation_id, result=text_content["text"]["content"]
-                             )
-                         return GenieResponse(
-                             conversation_id,
-                             result="Genie query completed but no text content found in attachments.",
-                         )
-                 elif resp["status"] in {"CANCELLED", "QUERY_RESULT_EXPIRED"}:
-                     return GenieResponse(
-                         conversation_id, result=f"Genie query {resp['status'].lower()}."
-                     )
-                 elif resp["status"] == "FAILED":
-                     return GenieResponse(
-                         conversation_id,
-                         result=f"Genie query failed with error: {resp.get('error', 'Unknown error')}",
-                     )
-                 # includes EXECUTING_QUERY, Genie can retry after this status
-                 else:
-                     logger.debug(f"Waiting...: {resp['status']}")
-                     time.sleep(self.poll_interval)
-             return GenieResponse(
-                 conversation_id,
-                 f"Genie query timed out after {MAX_ITERATIONS} iterations of {self.poll_interval} seconds",
-             )
+ def _response_to_json(response: GenieResponse) -> str:
+     """Convert GenieResponse to JSON string, handling DataFrame results."""
+     # Convert result to string if it's a DataFrame
+     result: str | pd.DataFrame = response.result
+     if isinstance(result, pd.DataFrame):
+         result = result.to_markdown()

-         return poll_result()
-
-     @mlflow.trace()
-     def ask_question(self, question: str, conversation_id: str | None = None):
-         logger.debug(
-             f"ask_question called with question: {question}, conversation_id: {conversation_id}"
-         )
-         if conversation_id:
-             resp = self.create_message(conversation_id, question)
-         else:
-             resp = self.start_conversation(question)
-         logger.debug(f"ask_question response: {resp}")
-         return self.poll_for_result(resp["conversation_id"], resp["message_id"])
+     data: dict[str, Any] = {
+         "result": result,
+         "query": response.query,
+         "description": response.description,
+         "conversation_id": response.conversation_id,
+     }
+     return json.dumps(data)


  def create_genie_tool(
      genie_room: GenieRoomModel | dict[str, Any],
-     name: Optional[str] = None,
-     description: Optional[str] = None,
-     persist_conversation: bool = False,
+     name: str | None = None,
+     description: str | None = None,
+     persist_conversation: bool = True,
      truncate_results: bool = False,
-     poll_interval: int = DEFAULT_POLLING_INTERVAL_SECS,
- ) -> Callable[[str], GenieResponse]:
+     lru_cache_parameters: GenieLRUCacheParametersModel | dict[str, Any] | None = None,
+     semantic_cache_parameters: GenieSemanticCacheParametersModel
+     | dict[str, Any]
+     | None = None,
+ ) -> Callable[..., Command]:
      """
      Create a tool for interacting with Databricks Genie for natural language queries to databases.

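The `_response_to_json` helper above replaces the removed `GenieResponse.to_json()` method now that `GenieResponse` comes from `databricks_ai_bridge` rather than a local dataclass. A minimal sketch of its behavior, assuming the four fields this diff references (`result`, `query`, `description`, `conversation_id`) and keyword construction; the private-helper import is for illustration only:

    import pandas as pd
    from databricks_ai_bridge.genie import GenieResponse

    from dao_ai.tools.genie import _response_to_json  # private helper, imported only to illustrate

    response = GenieResponse(
        result=pd.DataFrame({"region": ["EMEA"], "revenue": [1200.5]}),
        query="SELECT region, SUM(revenue) FROM sales GROUP BY region",
        description="Revenue by region",
        conversation_id="conv-123",
    )

    # DataFrame results are rendered to markdown before JSON encoding, so the
    # ToolMessage payload is always a plain string. (to_markdown() requires the
    # optional tabulate dependency, as usual for pandas.)
    payload: str = _response_to_json(response)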
@@ -290,17 +79,37 @@ def create_genie_tool(
          genie_room: GenieRoomModel or dict containing Genie configuration
          name: Optional custom name for the tool. If None, uses default "genie_tool"
          description: Optional custom description for the tool. If None, uses default description
+         persist_conversation: Whether to persist conversation IDs across tool calls for
+             multi-turn conversations within the same Genie space
+         truncate_results: Whether to truncate large query results to fit token limits
+         lru_cache_parameters: Optional LRU cache configuration for SQL query caching
+         semantic_cache_parameters: Optional semantic cache configuration using pg_vector
+             for similarity-based query matching

      Returns:
          A LangGraph tool that processes natural language queries through Genie
      """
+     logger.debug(
+         "Creating Genie tool",
+         genie_room_type=type(genie_room).__name__,
+         persist_conversation=persist_conversation,
+         truncate_results=truncate_results,
+         name=name,
+         has_lru_cache=lru_cache_parameters is not None,
+         has_semantic_cache=semantic_cache_parameters is not None,
+     )

      if isinstance(genie_room, dict):
          genie_room = GenieRoomModel(**genie_room)

-     space_id: AnyVariable = genie_room.space_id or os.environ.get(
-         "DATABRICKS_GENIE_SPACE_ID"
-     )
+     if isinstance(lru_cache_parameters, dict):
+         lru_cache_parameters = GenieLRUCacheParametersModel(**lru_cache_parameters)
+
+     if isinstance(semantic_cache_parameters, dict):
+         semantic_cache_parameters = GenieSemanticCacheParametersModel(
+             **semantic_cache_parameters
+         )
+
      space_id: AnyVariable = genie_room.space_id or os.environ.get(
          "DATABRICKS_GENIE_SPACE_ID"
      )
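Both cache-parameter arguments accept either a typed model or a plain dict, mirroring the existing `genie_room` handling, so YAML- or dict-driven configs can pass raw mappings. The coercion idiom in isolation, sketched with a hypothetical stand-in model rather than the real parameter models in `dao_ai.config`:

    from typing import Any

    from pydantic import BaseModel

    class CacheParams(BaseModel):  # hypothetical stand-in, not the library's model
        capacity: int = 128

    def normalize(params: CacheParams | dict[str, Any] | None) -> CacheParams | None:
        # Coerce dicts into the typed model; pass models (or None) through unchanged.
        if isinstance(params, dict):
            params = CacheParams(**params)
        return params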
@@ -308,13 +117,6 @@ def create_genie_tool(
          space_id = CompositeVariableModel(**space_id)
      space_id = value_of(space_id)

-     # genie: Genie = Genie(
-     #     space_id=space_id,
-     #     client=genie_room.workspace_client,
-     #     truncate_results=truncate_results,
-     #     polling_interval=poll_interval,
-     # )
-
      default_description: str = dedent("""
          This tool lets you have a conversation and chat with tabular data about <topic>. You should ask
          questions about the data and the tool will try to answer them.
@@ -337,51 +139,99 @@ Returns:
          GenieResponse: A response object containing the conversation ID and result from Genie."""
      tool_description = tool_description + function_docs

+     genie: Genie = Genie(
+         space_id=space_id,
+         client=genie_room.workspace_client,
+         truncate_results=truncate_results,
+     )
+
+     genie_service: GenieServiceBase = GenieService(genie)
+
+     # Wrap with semantic cache first (checked second due to decorator pattern)
+     if semantic_cache_parameters is not None:
+         genie_service = SemanticCacheService(
+             impl=genie_service,
+             parameters=semantic_cache_parameters,
+             workspace_client=genie_room.workspace_client,  # Pass workspace client for conversation history
+         ).initialize()  # Eagerly initialize to fail fast and create table
+
+     # Wrap with LRU cache last (checked first - fast O(1) exact match)
+     if lru_cache_parameters is not None:
+         genie_service = LRUCacheService(
+             impl=genie_service,
+             parameters=lru_cache_parameters,
+         )
+
      @tool(
          name_or_callable=tool_name,
          description=tool_description,
      )
      def genie_tool(
          question: Annotated[str, "The question to ask Genie about your data"],
-         state: Annotated[dict, InjectedState],
-         tool_call_id: Annotated[str, InjectedToolCallId],
+         runtime: ToolRuntime[Context, AgentState],
      ) -> Command:
-         genie: Genie = Genie(
-             space_id=space_id,
-             client=genie_room.workspace_client,
-             truncate_results=truncate_results,
-             polling_interval=poll_interval,
-         )
+         """Process a natural language question through Databricks Genie.

-         """Process a natural language question through Databricks Genie."""
-         # Get existing conversation mapping and retrieve conversation ID for this space
-         conversation_ids: dict[str, str] = state.get("genie_conversation_ids", {})
-         existing_conversation_id: str | None = conversation_ids.get(space_id)
-         logger.debug(
-             f"Existing conversation ID for space {space_id}: {existing_conversation_id}"
+         Uses ToolRuntime to access state and context in a type-safe way.
+         """
+         # Access state through runtime
+         state: AgentState = runtime.state
+         tool_call_id: str = runtime.tool_call_id
+
+         # Ensure space_id is a string for state keys
+         space_id_str: str = str(space_id)
+
+         # Get session state (or create new one)
+         session: SessionState = state.get("session", SessionState())
+
+         # Get existing conversation ID from session
+         existing_conversation_id: str | None = session.genie.get_conversation_id(
+             space_id_str
+         )
+         logger.trace(
+             "Using existing conversation ID",
+             space_id=space_id_str,
+             conversation_id=existing_conversation_id,
          )

-         response: GenieResponse = genie.ask_question(
+         # Call ask_question which always returns CacheResult with cache metadata
+         cache_result: CacheResult = genie_service.ask_question(
              question, conversation_id=existing_conversation_id
          )
+         genie_response: GenieResponse = cache_result.response
+         cache_hit: bool = cache_result.cache_hit
+         cache_key: str | None = cache_result.served_by

-         current_conversation_id: str = response.conversation_id
+         current_conversation_id: str = genie_response.conversation_id
          logger.debug(
-             f"Current conversation ID for space {space_id}: {current_conversation_id}"
+             "Genie question answered",
+             space_id=space_id_str,
+             conversation_id=current_conversation_id,
+             cache_hit=cache_hit,
+             cache_key=cache_key,
          )

-         # Update the conversation mapping with the new conversation ID for this space
+         # Update session state with cache information
+         if persist_conversation:
+             session.genie.update_space(
+                 space_id=space_id_str,
+                 conversation_id=current_conversation_id,
+                 cache_hit=cache_hit,
+                 cache_key=cache_key,
+                 last_query=question,
+             )

+         # Build update dict with response and session
          update: dict[str, Any] = {
-             "messages": [ToolMessage(response.to_json(), tool_call_id=tool_call_id)],
+             "messages": [
+                 ToolMessage(
+                     _response_to_json(genie_response), tool_call_id=tool_call_id
+                 )
+             ],
          }

          if persist_conversation:
-             updated_conversation_ids: dict[str, str] = conversation_ids.copy()
-             updated_conversation_ids[space_id] = current_conversation_id
-             update["genie_conversation_ids"] = updated_conversation_ids
-
-         logger.debug(f"State update: {update}")
+             update["session"] = session

          return Command(update=update)
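Taken together, the new factory wires Genie behind a layered service: `LRUCacheService` is applied outermost, so an exact-match question is answered in O(1) without touching the semantic cache or Genie, a miss delegates to `SemanticCacheService`, and only then does the real `GenieService` run. A hedged usage sketch of the 0.1.2 signature, using only arguments visible in this diff (the cache-parameter field names live in `dao_ai.config` and are not shown here, so both caches are left disabled):

    from dao_ai.tools.genie import create_genie_tool

    genie_tool = create_genie_tool(
        genie_room={"space_id": "your-genie-space-id"},  # dict is coerced to GenieRoomModel
        persist_conversation=True,  # note: the default changed from False to True
        truncate_results=False,
        lru_cache_parameters=None,       # optional exact-match SQL query cache
        semantic_cache_parameters=None,  # optional pg_vector similarity cache
    )

The returned tool reads state through LangChain's `ToolRuntime` instead of the removed `InjectedState`/`InjectedToolCallId` annotations, and conversation IDs plus cache metadata now travel in `SessionState` under the `session` key rather than in a bare `genie_conversation_ids` dict.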