spice-mcp 0.1.1__py3-none-any.whl → 0.1.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -9,4 +9,11 @@ def resolve_raw_sql_template_id() -> int:
9
9
  Tests stub HTTP boundaries and only require a consistent integer. This
10
10
  placeholder can be adjusted if upstream semantics change.
11
11
  """
12
- return int(os.getenv("SPICE_RAW_SQL_QUERY_ID", "4060379"))
12
+ env_value = os.getenv("SPICE_RAW_SQL_QUERY_ID")
13
+ if env_value:
14
+ try:
15
+ return int(env_value.strip())
16
+ except (ValueError, AttributeError):
17
+ # Invalid environment variable, fallback to default
18
+ pass
19
+ return 4060379
@@ -0,0 +1,6 @@
1
+ """Spellbook adapter for discovering dbt models from GitHub repository."""
2
+
3
+ from .explorer import SpellbookExplorer
4
+
5
+ __all__ = ["SpellbookExplorer"]
6
+
@@ -0,0 +1,313 @@
1
+ """
2
+ Spellbook Explorer - Parses dbt models from Spellbook GitHub repository.
3
+
4
+ This adapter clones or accesses the Spellbook GitHub repo and parses dbt models
5
+ to discover available tables, schemas, and column information.
6
+ """
7
+ from __future__ import annotations
8
+
9
+ import os
10
+ import re
11
+ import subprocess
12
+ import tempfile
13
+ from collections.abc import Sequence
14
+ from pathlib import Path
15
+ from typing import Any
16
+
17
+ from ...core.models import SchemaMatch, TableColumn, TableDescription, TableSummary
18
+ from ...core.ports import CatalogExplorer
19
+
20
+
21
class SpellbookExplorer(CatalogExplorer):
    """
    Explorer that parses Spellbook dbt models from GitHub repository.

    Spellbook repo: https://github.com/duneanalytics/spellbook
    """

    SPELLBOOK_REPO_URL = "https://github.com/duneanalytics/spellbook.git"
    DEFAULT_BRANCH = "main"

    def __init__(
        self,
        repo_path: Path | str | None = None,
        repo_url: str | None = None,
        branch: str | None = None,
    ):
        """
        Initialize Spellbook explorer.

        Args:
            repo_path: Local path to spellbook repo (if None, will clone to temp dir)
            repo_url: GitHub repo URL (defaults to official spellbook repo)
            branch: Git branch to use (defaults to 'main')
        """
        self.repo_url = repo_url or self.SPELLBOOK_REPO_URL
        self.branch = branch or self.DEFAULT_BRANCH
        self._repo_path: Path | None = None
        # Cache of parsed models, keyed by schema/subproject name.
        self._models_cache: dict[str, list[dict[str, Any]]] | None = None

        if repo_path:
            self._repo_path = Path(repo_path)
        else:
            # Use cache directory if available, otherwise temp
            cache_base = os.getenv("SPICE_SPELLBOOK_CACHE", tempfile.gettempdir())
            self._repo_path = Path(cache_base) / "spellbook_repo"

    def _ensure_repo(self) -> Path:
        """Ensure spellbook repo is cloned locally and return its path.

        Clones (shallow, single branch) when the directory is missing or is not
        a git checkout; otherwise attempts a best-effort `git pull`.

        Raises:
            RuntimeError: If no repository path was configured.
            subprocess.CalledProcessError: If the initial clone fails.
        """
        if self._repo_path is None:
            raise RuntimeError("Repository path not set")

        repo_path = self._repo_path

        # Clone if doesn't exist
        if not repo_path.exists() or not (repo_path / ".git").exists():
            repo_path.parent.mkdir(parents=True, exist_ok=True)
            subprocess.run(
                ["git", "clone", "--depth", "1", "--branch", self.branch, self.repo_url, str(repo_path)],
                check=True,
                capture_output=True,
            )
        else:
            # Update if exists; failures (offline, detached HEAD, timeout)
            # are ignored so a stale checkout still works.
            try:
                subprocess.run(
                    ["git", "-C", str(repo_path), "pull", "origin", self.branch],
                    check=False,
                    capture_output=True,
                    timeout=30,
                )
            except Exception:
                pass  # Ignore update failures

        return repo_path

    def _load_models(self) -> dict[str, list[dict[str, Any]]]:
        """Load all dbt models from spellbook repo, organized by schema/subproject.

        Returns a mapping of subproject name -> list of model records, where
        each record holds: name, file (Path to .sql), schema_yml (Path or
        None), and schema (subproject name). Results are memoized per
        instance.
        """
        if self._models_cache is not None:
            return self._models_cache

        repo_path = self._ensure_repo()
        models: dict[str, list[dict[str, Any]]] = {}

        # Spellbook uses subprojects - look in dbt_subprojects/ and models/ directories
        for base_dir in (repo_path / "dbt_subprojects", repo_path / "models"):
            if not base_dir.exists():
                continue

            # Each immediate subdirectory is treated as a schema/subproject.
            for subproject_dir in base_dir.iterdir():
                if not subproject_dir.is_dir() or subproject_dir.name.startswith("."):
                    continue  # skip files and hidden directories

                schema_name = subproject_dir.name
                models.setdefault(schema_name, [])

                # Model SQL normally lives under <subproject>/models/;
                # fall back to the subproject root when absent.
                models_dir = subproject_dir / "models"
                if not models_dir.exists():
                    models_dir = subproject_dir

                for sql_file in models_dir.rglob("*.sql"):
                    # Skip compiled artifacts and vendored packages.
                    if "target" in sql_file.parts or "node_modules" in sql_file.parts:
                        continue

                    # Model name is the file stem: models/schema/table.sql -> table
                    model_name = sql_file.stem

                    # Prefer a sibling schema.yml; fall back one level up.
                    schema_yml = sql_file.parent / "schema.yml"
                    if not schema_yml.exists():
                        schema_yml = sql_file.parent.parent / "schema.yml"

                    models[schema_name].append({
                        "name": model_name,
                        "file": sql_file,
                        "schema_yml": schema_yml if schema_yml.exists() else None,
                        "schema": schema_name,
                    })

        self._models_cache = models
        return models

    def find_schemas(self, keyword: str) -> Sequence[SchemaMatch]:
        """
        Find schemas (subprojects) matching keyword in Spellbook repo.

        This searches through dbt subproject names and model descriptions.
        A schema matches when the keyword (case-insensitive) appears either
        in the schema name or in any of its model names; each schema is
        reported at most once.
        """
        models = self._load_models()
        matches: list[SchemaMatch] = []
        keyword_lower = keyword.lower()

        for schema_name, model_list in models.items():
            # Direct match on the schema/subproject name.
            if keyword_lower in schema_name.lower():
                matches.append(SchemaMatch(schema=schema_name))
                continue

            # Otherwise match against model names within the schema.
            for model in model_list:
                if keyword_lower in model["name"].lower():
                    if not any(m.schema == schema_name for m in matches):
                        matches.append(SchemaMatch(schema=schema_name))
                    break

        return matches

    def list_tables(self, schema: str, limit: int | None = None) -> Sequence[TableSummary]:
        """
        List tables (dbt models) in a given schema/subproject.

        Returns model names from the spellbook repository; an unknown schema
        yields an empty sequence. `limit`, when given, truncates the result.
        """
        models = self._load_models()
        summaries = [
            TableSummary(schema=schema, table=model["name"])
            for model in models.get(schema, [])
        ]
        return summaries if limit is None else summaries[:limit]

    def describe_table(self, schema: str, table: str) -> TableDescription:
        """
        Describe table columns by parsing dbt model SQL and schema.yml.

        Attempts to extract column information from:
        1. schema.yml file (if exists)
        2. SQL SELECT statement columns
        3. Fallback to basic inference

        Raises:
            ValueError: If the model is not found in the loaded repo.
        """
        models = self._load_models()

        # Find matching model record for this table.
        model_info = next(
            (m for m in models.get(schema, []) if m["name"] == table),
            None,
        )
        if model_info is None:
            raise ValueError(f"Table {schema}.{table} not found in Spellbook")

        columns: list[TableColumn] = []

        # Try to parse schema.yml first (authoritative dbt metadata).
        if model_info["schema_yml"]:
            columns = self._parse_schema_yml(model_info["schema_yml"], table)

        # Fallback: parse SQL file for column hints
        if not columns:
            columns = self._parse_sql_columns(model_info["file"])

        # If still no columns, create a basic placeholder
        if not columns:
            columns = [
                TableColumn(name="column_1", dune_type="VARCHAR", polars_dtype="Utf8")
            ]

        return TableDescription(
            fully_qualified_name=f"{schema}.{table}",
            columns=columns,
        )

    def _parse_schema_yml(self, schema_yml_path: Path, table_name: str) -> list[TableColumn]:
        """Parse dbt schema.yml to extract column definitions.

        Best-effort: returns [] when PyYAML is unavailable, the file is
        malformed, or the model is not listed.
        """
        try:
            try:
                import yaml
            except ImportError:
                # PyYAML not available, skip schema.yml parsing
                return []

            with open(schema_yml_path, encoding="utf-8") as f:
                content = yaml.safe_load(f)

            if not isinstance(content, dict):
                return []

            # Find model in schema.yml
            for model in content.get("models", []):
                if model.get("name") == table_name:
                    return [
                        TableColumn(
                            name=col.get("name", ""),
                            dune_type=col.get("data_type", "VARCHAR"),
                            polars_dtype=col.get("data_type"),
                            comment=col.get("description"),
                        )
                        for col in model.get("columns", [])
                    ]
        except Exception:
            pass  # best-effort parser: any failure falls through to []

        return []

    def _parse_sql_columns(self, sql_file: Path) -> list[TableColumn]:
        """Parse SQL file to extract column names from SELECT statements.

        Best-effort heuristic: grabs the first SELECT ... FROM span, splits on
        commas, strips aliases and single-argument function wrappers. Types
        cannot be inferred from SQL, so VARCHAR/Utf8 defaults are used.
        Returns at most 20 columns; [] on any parse failure.
        """
        try:
            with open(sql_file, encoding="utf-8") as f:
                sql = f.read()

            # Look for SELECT ... FROM patterns
            # Match: SELECT col1, col2, col3 FROM ...
            select_match = re.search(
                r"SELECT\s+(.+?)\s+FROM",
                sql,
                re.IGNORECASE | re.DOTALL,
            )
            if not select_match:
                return []

            cols: list[TableColumn] = []
            for col in select_match.group(1).split(","):
                col = col.strip()
                # Strip aliases. NOTE: the previous implementation detected
                # "AS" case-insensitively but split case-sensitively, so
                # lowercase aliases ("foo as bar") were never stripped; a
                # case-insensitive regex split fixes that.
                alias = re.search(r"\s+AS\s+", col, flags=re.IGNORECASE)
                if alias:
                    col = col[: alias.start()].strip()
                elif " " in col and not col.startswith("("):
                    # Might be alias without AS ("foo bar") - keep the expr part.
                    col = col.split()[0].strip()

                # Clean up function calls: function(col) -> col
                col = re.sub(r"^\w+\((.+)\)", r"\1", col)
                col = col.strip().strip('"').strip("'")

                # Skip wildcards and the DISTINCT keyword (any case).
                if col and col.upper() not in ("*", "DISTINCT"):
                    cols.append(
                        TableColumn(
                            name=col,
                            dune_type="VARCHAR",  # Default, can't infer from SQL
                            polars_dtype="Utf8",
                        )
                    )

            return cols[:20]  # Limit to reasonable number
        except Exception:
            pass  # best-effort parser: any failure falls through to []

        return []
spice_mcp/config.py CHANGED
@@ -41,7 +41,7 @@ class Config:
41
41
  cache: CacheConfig = field(default_factory=CacheConfig)
42
42
  logging: LoggingConfig = field(default_factory=LoggingConfig)
43
43
  http: HttpClientConfig = field(default_factory=HttpClientConfig)
44
- max_concurrent_queries: int = 5
44
+ max_concurrent_queries: int = 5 # Note: Not currently enforced (kept for future use)
45
45
  default_timeout_seconds: int = 30
46
46
 
47
47
  @classmethod
spice_mcp/core/models.py CHANGED
@@ -78,11 +78,3 @@ class TableDescription:
78
78
  columns: list[TableColumn] = field(default_factory=list)
79
79
 
80
80
 
81
- @dataclass(slots=True)
82
- class SuiPackageOverview:
83
- package_ids: list[str]
84
- window_hours: int
85
- events_preview: list[dict[str, Any]] | None = None
86
- transactions_preview: list[dict[str, Any]] | None = None
87
- objects_preview: list[dict[str, Any]] | None = None
88
- stats: dict[str, Any] = field(default_factory=dict)
spice_mcp/core/ports.py CHANGED
@@ -8,7 +8,6 @@ from .models import (
8
8
  QueryResult,
9
9
  ResultMetadata,
10
10
  SchemaMatch,
11
- SuiPackageOverview,
12
11
  TableDescription,
13
12
  TableSummary,
14
13
  )
@@ -39,15 +38,6 @@ class CatalogExplorer(Protocol):
39
38
  ...
40
39
 
41
40
 
42
- class SuiInspector(Protocol):
43
- """Port for Sui package exploration helpers."""
44
-
45
- def package_overview(
46
- self, packages: Sequence[str], *, hours: int, timeout_seconds: float | None = None
47
- ) -> SuiPackageOverview:
48
- ...
49
-
50
-
51
41
  class QueryAdmin(Protocol):
52
42
  """Port for managing Dune saved queries."""
53
43
 
@@ -62,8 +52,3 @@ class QueryAdmin(Protocol):
62
52
 
63
53
  def fork(self, source_query_id: int, *, name: str | None = None) -> Mapping[str, Any]:
64
54
  ...
65
-
66
- def events_preview(
67
- self, packages: Sequence[str], *, hours: int, limit: int
68
- ) -> Sequence[Mapping[str, object]]:
69
- ...