dao-ai 0.0.25__py3-none-any.whl → 0.1.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dao_ai/__init__.py +29 -0
- dao_ai/agent_as_code.py +5 -5
- dao_ai/cli.py +245 -40
- dao_ai/config.py +1863 -338
- dao_ai/genie/__init__.py +38 -0
- dao_ai/genie/cache/__init__.py +43 -0
- dao_ai/genie/cache/base.py +72 -0
- dao_ai/genie/cache/core.py +79 -0
- dao_ai/genie/cache/lru.py +347 -0
- dao_ai/genie/cache/semantic.py +970 -0
- dao_ai/genie/core.py +35 -0
- dao_ai/graph.py +27 -228
- dao_ai/hooks/__init__.py +9 -6
- dao_ai/hooks/core.py +27 -195
- dao_ai/logging.py +56 -0
- dao_ai/memory/__init__.py +10 -0
- dao_ai/memory/core.py +65 -30
- dao_ai/memory/databricks.py +402 -0
- dao_ai/memory/postgres.py +79 -38
- dao_ai/messages.py +6 -4
- dao_ai/middleware/__init__.py +125 -0
- dao_ai/middleware/assertions.py +806 -0
- dao_ai/middleware/base.py +50 -0
- dao_ai/middleware/core.py +67 -0
- dao_ai/middleware/guardrails.py +420 -0
- dao_ai/middleware/human_in_the_loop.py +232 -0
- dao_ai/middleware/message_validation.py +586 -0
- dao_ai/middleware/summarization.py +197 -0
- dao_ai/models.py +1306 -114
- dao_ai/nodes.py +261 -166
- dao_ai/optimization.py +674 -0
- dao_ai/orchestration/__init__.py +52 -0
- dao_ai/orchestration/core.py +294 -0
- dao_ai/orchestration/supervisor.py +278 -0
- dao_ai/orchestration/swarm.py +271 -0
- dao_ai/prompts.py +128 -31
- dao_ai/providers/databricks.py +645 -172
- dao_ai/state.py +157 -21
- dao_ai/tools/__init__.py +13 -5
- dao_ai/tools/agent.py +1 -3
- dao_ai/tools/core.py +64 -11
- dao_ai/tools/email.py +232 -0
- dao_ai/tools/genie.py +144 -295
- dao_ai/tools/mcp.py +220 -133
- dao_ai/tools/memory.py +50 -0
- dao_ai/tools/python.py +9 -14
- dao_ai/tools/search.py +14 -0
- dao_ai/tools/slack.py +22 -10
- dao_ai/tools/sql.py +202 -0
- dao_ai/tools/time.py +30 -7
- dao_ai/tools/unity_catalog.py +165 -88
- dao_ai/tools/vector_search.py +360 -40
- dao_ai/utils.py +218 -16
- dao_ai-0.1.2.dist-info/METADATA +455 -0
- dao_ai-0.1.2.dist-info/RECORD +64 -0
- {dao_ai-0.0.25.dist-info → dao_ai-0.1.2.dist-info}/WHEEL +1 -1
- dao_ai/chat_models.py +0 -204
- dao_ai/guardrails.py +0 -112
- dao_ai/tools/human_in_the_loop.py +0 -100
- dao_ai-0.0.25.dist-info/METADATA +0 -1165
- dao_ai-0.0.25.dist-info/RECORD +0 -41
- {dao_ai-0.0.25.dist-info → dao_ai-0.1.2.dist-info}/entry_points.txt +0 -0
- {dao_ai-0.0.25.dist-info → dao_ai-0.1.2.dist-info}/licenses/LICENSE +0 -0
dao_ai/utils.py
CHANGED
|
@@ -3,9 +3,11 @@ import importlib.metadata
|
|
|
3
3
|
import os
|
|
4
4
|
import re
|
|
5
5
|
import site
|
|
6
|
-
from importlib.metadata import version
|
|
6
|
+
from importlib.metadata import PackageNotFoundError, version
|
|
7
|
+
from pathlib import Path
|
|
7
8
|
from typing import Any, Callable, Sequence
|
|
8
9
|
|
|
10
|
+
from langchain_core.tools import BaseTool
|
|
9
11
|
from loguru import logger
|
|
10
12
|
|
|
11
13
|
import dao_ai
|
|
@@ -18,15 +20,15 @@ def is_lib_provided(lib_name: str, pip_requirements: Sequence[str]) -> bool:
|
|
|
18
20
|
)
|
|
19
21
|
|
|
20
22
|
|
|
21
|
-
def is_installed():
|
|
23
|
+
def is_installed() -> bool:
    """Return True when the dao_ai package lives under a site-packages directory.

    Compares the absolute path of the imported ``dao_ai`` module against every
    known site-packages location (system-wide and per-user). Running from a
    source checkout yields False.
    """
    package_file: str = os.path.abspath(dao_ai.__file__)

    # Collect every candidate installation root, including the user site dir.
    search_paths: list[str] = [os.path.abspath(p) for p in site.getsitepackages()]
    if site.getusersitepackages():
        search_paths.append(os.path.abspath(site.getusersitepackages()))

    installed: bool = any(package_file.startswith(root) for root in search_paths)
    logger.trace(
        "Checking if dao_ai is installed",
        is_installed=installed,
        current_file=package_file,
    )
    return installed
|
|
32
34
|
|
|
@@ -37,6 +39,114 @@ def normalize_name(name: str) -> str:
|
|
|
37
39
|
return normalized.strip("_")
|
|
38
40
|
|
|
39
41
|
|
|
42
|
+
def normalize_host(host: str | None) -> str | None:
|
|
43
|
+
"""Ensure host URL has https:// scheme.
|
|
44
|
+
|
|
45
|
+
The DATABRICKS_HOST environment variable should always include the https://
|
|
46
|
+
scheme, but some environments (e.g., Databricks Apps infrastructure) may
|
|
47
|
+
provide the host without it. This function normalizes the host to ensure
|
|
48
|
+
it has the proper scheme.
|
|
49
|
+
|
|
50
|
+
Args:
|
|
51
|
+
host: The host URL, with or without scheme
|
|
52
|
+
|
|
53
|
+
Returns:
|
|
54
|
+
The host URL with https:// scheme, or None if host is None/empty
|
|
55
|
+
"""
|
|
56
|
+
if not host:
|
|
57
|
+
return None
|
|
58
|
+
host = host.strip()
|
|
59
|
+
if not host:
|
|
60
|
+
return None
|
|
61
|
+
if not host.startswith("http://") and not host.startswith("https://"):
|
|
62
|
+
return f"https://{host}"
|
|
63
|
+
return host
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
def get_default_databricks_host() -> str | None:
    """Resolve the default Databricks workspace host.

    Resolution order:
    1. DATABRICKS_HOST environment variable
    2. WorkspaceClient ambient authentication (e.g., from ~/.databrickscfg)

    Returns:
        The Databricks workspace host URL (with https:// scheme), or None if not available.
    """
    env_host: str | None = os.environ.get("DATABRICKS_HOST")
    if env_host:
        return normalize_host(env_host)

    # No env var: let the SDK resolve whatever ambient credentials provide.
    try:
        from databricks.sdk import WorkspaceClient

        client: WorkspaceClient = WorkspaceClient()
        return normalize_host(client.config.host)
    except Exception:
        # Best-effort: missing SDK or no ambient auth simply yields None.
        logger.trace("Could not get default Databricks host from WorkspaceClient")
        return None
|
|
90
|
+
|
|
91
|
+
|
|
92
|
+
def dao_ai_version() -> str:
    """
    Get the dao-ai package version, with fallback for source installations.

    Resolution order:
    1. Installed package metadata for "dao-ai".
    2. The ``[project].version`` field of the repository's pyproject.toml.
    3. The literal string "dev" when neither source is available.

    Returns:
        str: The version string, or "dev" if version cannot be determined
    """
    try:
        # Installed wheel: package metadata is authoritative.
        return version("dao-ai")
    except PackageNotFoundError:
        logger.trace(
            "dao-ai package not installed, attempting to read version from pyproject.toml"
        )

    # Pick a TOML parser: stdlib tomllib on 3.11+, tomli backport otherwise.
    try:
        import tomllib  # Python 3.11+
    except ImportError:
        try:
            import tomli as tomllib  # Fallback for Python < 3.11
        except ImportError:
            logger.warning(
                "Cannot determine dao-ai version: package not installed and tomllib/tomli not available"
            )
            return "dev"

    try:
        # pyproject.toml sits two directories above this module in a checkout.
        pyproject_path = Path(__file__).parents[2] / "pyproject.toml"

        if not pyproject_path.exists():
            logger.warning(
                "Cannot determine dao-ai version: pyproject.toml not found",
                path=str(pyproject_path),
            )
            return "dev"

        with open(pyproject_path, "rb") as f:
            pyproject_data = tomllib.load(f)
        pkg_version = pyproject_data.get("project", {}).get("version", "dev")
        logger.trace(
            "Read version from pyproject.toml",
            version=pkg_version,
            path=str(pyproject_path),
        )
        return pkg_version
    except Exception as e:
        logger.warning(
            "Cannot determine dao-ai version from pyproject.toml", error=str(e)
        )
        return "dev"
|
|
148
|
+
|
|
149
|
+
|
|
40
150
|
def get_installed_packages() -> dict[str, str]:
|
|
41
151
|
"""Get all installed packages with versions"""
|
|
42
152
|
|
|
@@ -45,16 +155,14 @@ def get_installed_packages() -> dict[str, str]:
|
|
|
45
155
|
f"databricks-langchain=={version('databricks-langchain')}",
|
|
46
156
|
f"databricks-mcp=={version('databricks-mcp')}",
|
|
47
157
|
f"databricks-sdk[openai]=={version('databricks-sdk')}",
|
|
48
|
-
f"
|
|
158
|
+
f"ddgs=={version('ddgs')}",
|
|
159
|
+
f"flashrank=={version('flashrank')}",
|
|
49
160
|
f"langchain=={version('langchain')}",
|
|
50
161
|
f"langchain-mcp-adapters=={version('langchain-mcp-adapters')}",
|
|
51
162
|
f"langchain-openai=={version('langchain-openai')}",
|
|
52
163
|
f"langchain-tavily=={version('langchain-tavily')}",
|
|
53
164
|
f"langgraph=={version('langgraph')}",
|
|
54
165
|
f"langgraph-checkpoint-postgres=={version('langgraph-checkpoint-postgres')}",
|
|
55
|
-
f"langgraph-prebuilt=={version('langgraph-prebuilt')}",
|
|
56
|
-
f"langgraph-supervisor=={version('langgraph-supervisor')}",
|
|
57
|
-
f"langgraph-swarm=={version('langgraph-swarm')}",
|
|
58
166
|
f"langmem=={version('langmem')}",
|
|
59
167
|
f"loguru=={version('loguru')}",
|
|
60
168
|
f"mcp=={version('mcp')}",
|
|
@@ -65,6 +173,7 @@ def get_installed_packages() -> dict[str, str]:
|
|
|
65
173
|
f"psycopg[binary,pool]=={version('psycopg')}",
|
|
66
174
|
f"pydantic=={version('pydantic')}",
|
|
67
175
|
f"pyyaml=={version('pyyaml')}",
|
|
176
|
+
f"tomli=={version('tomli')}",
|
|
68
177
|
f"unitycatalog-ai[databricks]=={version('unitycatalog-ai')}",
|
|
69
178
|
f"unitycatalog-langchain[databricks]=={version('unitycatalog-langchain')}",
|
|
70
179
|
]
|
|
@@ -85,18 +194,18 @@ def load_function(function_name: str) -> Callable[..., Any]:
|
|
|
85
194
|
"module.submodule.function_name"
|
|
86
195
|
|
|
87
196
|
Returns:
|
|
88
|
-
The imported callable function
|
|
197
|
+
The imported callable function or langchain tool
|
|
89
198
|
|
|
90
199
|
Raises:
|
|
91
200
|
ImportError: If the module cannot be imported
|
|
92
201
|
AttributeError: If the function doesn't exist in the module
|
|
93
|
-
TypeError: If the resolved object is not callable
|
|
202
|
+
TypeError: If the resolved object is not callable or invocable
|
|
94
203
|
|
|
95
204
|
Example:
|
|
96
205
|
>>> func = callable_from_fqn("dao_ai.models.get_latest_model_version")
|
|
97
206
|
>>> version = func("my_model")
|
|
98
207
|
"""
|
|
99
|
-
logger.
|
|
208
|
+
logger.trace("Loading function", function_name=function_name)
|
|
100
209
|
|
|
101
210
|
try:
|
|
102
211
|
# Split the FQN into module path and function name
|
|
@@ -106,11 +215,16 @@ def load_function(function_name: str) -> Callable[..., Any]:
|
|
|
106
215
|
module = importlib.import_module(module_path)
|
|
107
216
|
|
|
108
217
|
# Get the function from the module
|
|
109
|
-
func = getattr(module, func_name)
|
|
218
|
+
func: Any = getattr(module, func_name)
|
|
219
|
+
|
|
220
|
+
# Verify that the resolved object is callable or is a LangChain tool
|
|
221
|
+
# In langchain 1.x, StructuredTool objects are not directly callable
|
|
222
|
+
# but have an invoke() method
|
|
223
|
+
is_callable: bool = callable(func)
|
|
224
|
+
is_langchain_tool: bool = isinstance(func, BaseTool)
|
|
110
225
|
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
raise TypeError(f"Function {func_name} is not callable.")
|
|
226
|
+
if not is_callable and not is_langchain_tool:
|
|
227
|
+
raise TypeError(f"Function {func_name} is not callable or invocable.")
|
|
114
228
|
|
|
115
229
|
return func
|
|
116
230
|
except (ImportError, AttributeError, TypeError) as e:
|
|
@@ -118,5 +232,93 @@ def load_function(function_name: str) -> Callable[..., Any]:
|
|
|
118
232
|
raise ImportError(f"Failed to import {function_name}: {e}")
|
|
119
233
|
|
|
120
234
|
|
|
235
|
+
def type_from_fqn(type_name: str) -> type:
    """
    Load a type from a fully qualified name (FQN).

    Dynamically imports the module portion of the FQN and returns the named
    attribute, verifying it is an actual type. Useful for loading Pydantic
    models, dataclasses, or any Python type specified as a string in
    configuration files.

    Args:
        type_name: Fully qualified type name in format "module.path.ClassName"

    Returns:
        The imported type/class

    Raises:
        ValueError: If the FQN format is invalid
        ImportError: If the module cannot be imported
        AttributeError: If the type doesn't exist in the module
        TypeError: If the resolved object is not a type

    Example:
        >>> ProductModel = type_from_fqn("my_models.ProductInfo")
        >>> instance = ProductModel(name="Widget", price=9.99)
    """
    logger.trace("Loading type", type_name=type_name)

    try:
        # "pkg.mod.Class" must split into a module path and a class name.
        pieces = type_name.rsplit(".", 1)
        if len(pieces) != 2:
            raise ValueError(
                f"Invalid type name '{type_name}'. "
                "Expected format: 'module.path.ClassName'"
            )
        module_path, class_name = pieces

        try:
            module = importlib.import_module(module_path)
        except ModuleNotFoundError as e:
            raise ImportError(
                f"Could not import module '{module_path}' for type '{type_name}': {e}"
            ) from e

        if not hasattr(module, class_name):
            raise AttributeError(
                f"Module '{module_path}' does not have attribute '{class_name}'"
            )

        candidate = getattr(module, class_name)

        # Reject functions, instances, and other non-type attributes.
        if not isinstance(candidate, type):
            raise TypeError(
                f"'{type_name}' resolved to {candidate}, which is not a type"
            )

        return candidate

    except (ValueError, ImportError, AttributeError, TypeError) as e:
        # Re-raise as the same exception class with the FQN as added context.
        raise type(e)(f"Failed to load type '{type_name}': {e}") from e
|
|
299
|
+
|
|
300
|
+
|
|
121
301
|
def is_in_model_serving() -> bool:
    """Check if running in Databricks Model Serving environment.

    Detects Model Serving by checking for environment variables that are
    typically set in that environment, plus a filesystem marker.
    """
    env = os.environ
    # Primary check - explicit Databricks Model Serving env var.
    explicit_flag = env.get("IS_IN_DB_MODEL_SERVING_ENV", "false").lower() == "true"
    # Secondary check - Model Serving sets this environment variable.
    serving_env = bool(env.get("DATABRICKS_MODEL_SERVING_ENV"))
    # Cluster type indicator.
    serving_cluster = "model-serving" in env.get("DATABRICKS_CLUSTER_TYPE", "").lower()
    # Model-serving-specific conda environment path.
    serving_path = os.path.exists("/opt/conda/envs/mlflow-env")
    return explicit_flag or serving_env or serving_cluster or serving_path
|