PyPI - sqlsaber - Versions diffs - 0.14.0__py3-none-any.whl → 0.16.0__py3-none-any.whl - Mend

sqlsaber 0.14.0py3-none-any.whl → 0.16.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sqlsaber might be problematic. Click here for more details.

Files changed (38) hide show

sqlsaber/agents/__init__.py +2 -4
sqlsaber/agents/base.py +18 -221
sqlsaber/agents/mcp.py +2 -2
sqlsaber/agents/pydantic_ai_agent.py +170 -0
sqlsaber/cli/auth.py +146 -79
sqlsaber/cli/commands.py +22 -7
sqlsaber/cli/database.py +1 -1
sqlsaber/cli/interactive.py +65 -30
sqlsaber/cli/models.py +58 -29
sqlsaber/cli/streaming.py +114 -77
sqlsaber/config/api_keys.py +9 -11
sqlsaber/config/providers.py +116 -0
sqlsaber/config/settings.py +50 -30
sqlsaber/database/connection.py +3 -3
sqlsaber/mcp/mcp.py +43 -51
sqlsaber/models/__init__.py +0 -3
sqlsaber/tools/__init__.py +25 -0
sqlsaber/tools/base.py +85 -0
sqlsaber/tools/enums.py +21 -0
sqlsaber/tools/instructions.py +251 -0
sqlsaber/tools/registry.py +130 -0
sqlsaber/tools/sql_tools.py +275 -0
sqlsaber/tools/visualization_tools.py +144 -0
{sqlsaber-0.14.0.dist-info → sqlsaber-0.16.0.dist-info}/METADATA +20 -39
sqlsaber-0.16.0.dist-info/RECORD +51 -0
sqlsaber/agents/anthropic.py +0 -579
sqlsaber/agents/streaming.py +0 -16
sqlsaber/clients/__init__.py +0 -6
sqlsaber/clients/anthropic.py +0 -285
sqlsaber/clients/base.py +0 -31
sqlsaber/clients/exceptions.py +0 -117
sqlsaber/clients/models.py +0 -282
sqlsaber/clients/streaming.py +0 -257
sqlsaber/models/events.py +0 -28
sqlsaber-0.14.0.dist-info/RECORD +0 -51
{sqlsaber-0.14.0.dist-info → sqlsaber-0.16.0.dist-info}/WHEEL +0 -0
{sqlsaber-0.14.0.dist-info → sqlsaber-0.16.0.dist-info}/entry_points.txt +0 -0
{sqlsaber-0.14.0.dist-info → sqlsaber-0.16.0.dist-info}/licenses/LICENSE +0 -0

sqlsaber/agents/anthropic.py DELETED Viewed

@@ -1,579 +0,0 @@
-"""Anthropic-specific SQL agent implementation using the custom client."""
-import asyncio
-import json
-from typing import Any, AsyncIterator
-from sqlsaber.agents.base import BaseSQLAgent
-from sqlsaber.agents.streaming import (
-    build_tool_result_block,
-)
-from sqlsaber.clients import AnthropicClient
-from sqlsaber.clients.models import (
-    ContentBlock,
-    ContentType,
-    CreateMessageRequest,
-    Message,
-    MessageRole,
-    ToolDefinition,
-)
-from sqlsaber.config.settings import Config
-from sqlsaber.database.connection import BaseDatabaseConnection
-from sqlsaber.memory.manager import MemoryManager
-from sqlsaber.models.events import StreamEvent
-class AnthropicSQLAgent(BaseSQLAgent):
-    """SQL Agent using the custom Anthropic client."""
-    # Constants
-    MAX_TOKENS = 4096
-    DEFAULT_SQL_LIMIT = 100
-    def __init__(
-        self, db_connection: BaseDatabaseConnection, database_name: str | None = None
-    ):
-        super().__init__(db_connection)
-        config = Config()
-        config.validate()  # This will raise ValueError if credentials are missing
-        if config.oauth_token:
-            self.client = AnthropicClient(oauth_token=config.oauth_token)
-        else:
-            self.client = AnthropicClient(api_key=config.api_key)
-        self.model = config.model_name.replace("anthropic:", "")
-        self.database_name = database_name
-        self.memory_manager = MemoryManager()
-        # Track last query results for streaming
-        self._last_results = None
-        self._last_query = None
-        # Define tools in the new format
-        self.tools: list[ToolDefinition] = [
-            ToolDefinition(
-                name="list_tables",
-                description="Get a list of all tables in the database with row counts. Use this first to discover available tables.",
-                input_schema={
-                    "type": "object",
-                    "properties": {},
-                    "required": [],
-                },
-            ),
-            ToolDefinition(
-                name="introspect_schema",
-                description="Introspect database schema to understand table structures.",
-                input_schema={
-                    "type": "object",
-                    "properties": {
-                        "table_pattern": {
-                            "type": "string",
-                            "description": "Optional pattern to filter tables (e.g., 'public.users', 'user%', '%order%')",
-                        }
-                    },
-                    "required": [],
-                },
-            ),
-            ToolDefinition(
-                name="execute_sql",
-                description="Execute a SQL query against the database.",
-                input_schema={
-                    "type": "object",
-                    "properties": {
-                        "query": {
-                            "type": "string",
-                            "description": "SQL query to execute",
-                        },
-                        "limit": {
-                            "type": "integer",
-                            "description": f"Maximum number of rows to return (default: {AnthropicSQLAgent.DEFAULT_SQL_LIMIT})",
-                            "default": AnthropicSQLAgent.DEFAULT_SQL_LIMIT,
-                        },
-                    },
-                    "required": ["query"],
-                },
-            ),
-            ToolDefinition(
-                name="plot_data",
-                description="Create a plot of query results.",
-                input_schema={
-                    "type": "object",
-                    "properties": {
-                        "y_values": {
-                            "type": "array",
-                            "items": {"type": ["number", "null"]},
-                            "description": "Y-axis data points (required)",
-                        },
-                        "x_values": {
-                            "type": "array",
-                            "items": {"type": ["number", "null"]},
-                            "description": "X-axis data points (optional, will use indices if not provided)",
-                        },
-                        "plot_type": {
-                            "type": "string",
-                            "enum": ["line", "scatter", "histogram"],
-                            "description": "Type of plot to create (default: line)",
-                            "default": "line",
-                        },
-                        "title": {
-                            "type": "string",
-                            "description": "Title for the plot",
-                        },
-                        "x_label": {
-                            "type": "string",
-                            "description": "Label for X-axis",
-                        },
-                        "y_label": {
-                            "type": "string",
-                            "description": "Label for Y-axis",
-                        },
-                    },
-                    "required": ["y_values"],
-                },
-            ),
-        ]
-        # Build system prompt with memories if available
-        self.system_prompt = self._build_system_prompt()
-    def _build_system_prompt(self) -> str:
-        """Build system prompt with optional memory context."""
-        # For OAuth authentication, start with Claude Code identity
-        # Check if we're using OAuth by looking at the client
-        is_oauth = (
-            hasattr(self, "client")
-            and hasattr(self.client, "use_oauth")
-            and self.client.use_oauth
-        )
-        if is_oauth:
-            # For OAuth, keep system prompt minimal - just Claude Code identity
-            return "You are Claude Code, Anthropic's official CLI for Claude."
-        else:
-            return self._get_sql_assistant_instructions()
-    def _get_sql_assistant_instructions(self) -> str:
-        """Get the detailed SQL assistant instructions."""
-        db_type = self._get_database_type_name()
-        instructions = f"""You are also a helpful SQL assistant that helps users query their {db_type} database.
-Your responsibilities:
-1. Understand user's natural language requests, think and convert them to SQL
-2. Use the provided tools efficiently to explore database schema
-3. Generate appropriate SQL queries
-4. Execute queries safely - queries that modify the database are not allowed
-5. Format and explain results clearly
-6. Create visualizations when requested or when they would be helpful
-IMPORTANT - Schema Discovery Strategy:
-1. ALWAYS start with 'list_tables' to see available tables and row counts
-2. Based on the user's query, identify which specific tables are relevant
-3. Use 'introspect_schema' with a table_pattern to get details ONLY for relevant tables
-4. Timestamp columns must be converted to text when you write queries
-Guidelines:
-- Use list_tables first, then introspect_schema for specific tables only
-- Use table patterns like 'sample%' or '%experiment%' to filter related tables
-- Use proper JOIN syntax and avoid cartesian products
-- Include appropriate WHERE clauses to limit results
-- Explain what the query does in simple terms
-- Handle errors gracefully and suggest fixes
-- Be security conscious - use parameterized queries when needed
-"""
-        # Add memory context if database name is available
-        if self.database_name:
-            memory_context = self.memory_manager.format_memories_for_prompt(
-                self.database_name
-            )
-            if memory_context.strip():
-                instructions += memory_context
-        return instructions
-    def add_memory(self, content: str) -> str | None:
-        """Add a memory for the current database."""
-        if not self.database_name:
-            return None
-        memory = self.memory_manager.add_memory(self.database_name, content)
-        # Rebuild system prompt with new memory
-        self.system_prompt = self._build_system_prompt()
-        return memory.id
-    async def execute_sql(self, query: str, limit: int | None = None) -> str:
-        """Execute a SQL query against the database with streaming support."""
-        # Call parent implementation for core functionality
-        result = await super().execute_sql(query, limit)
-        # Parse result to extract data for streaming (AnthropicSQLAgent specific)
-        try:
-            result_data = json.loads(result)
-            if result_data.get("success") and "results" in result_data:
-                # Store results for streaming
-                actual_limit = (
-                    limit if limit is not None else len(result_data["results"])
-                )
-                self._last_results = result_data["results"][:actual_limit]
-                self._last_query = query
-        except (json.JSONDecodeError, KeyError):
-            # If we can't parse the result, just continue without storing
-            pass
-        return result
-    async def process_tool_call(
-        self, tool_name: str, tool_input: dict[str, Any]
-    ) -> str:
-        """Process a tool call and return the result."""
-        # Use parent implementation for core tools
-        return await super().process_tool_call(tool_name, tool_input)
-    def _convert_user_message_to_message(
-        self, msg_content: str | list[dict[str, Any]]
-    ) -> Message:
-        """Convert user message content to Message object."""
-        if isinstance(msg_content, str):
-            return Message(MessageRole.USER, msg_content)
-        # Handle tool results format
-        tool_result_blocks = []
-        if isinstance(msg_content, list):
-            for item in msg_content:
-                if isinstance(item, dict) and item.get("type") == "tool_result":
-                    tool_result_blocks.append(
-                        ContentBlock(ContentType.TOOL_RESULT, item)
-                    )
-        if tool_result_blocks:
-            return Message(MessageRole.USER, tool_result_blocks)
-        # Fallback to string representation
-        return Message(MessageRole.USER, str(msg_content))
-    def _convert_assistant_message_to_message(
-        self, msg_content: str | list[dict[str, Any]]
-    ) -> Message:
-        """Convert assistant message content to Message object."""
-        if isinstance(msg_content, str):
-            return Message(MessageRole.ASSISTANT, msg_content)
-        if isinstance(msg_content, list):
-            content_blocks = []
-            for block in msg_content:
-                if isinstance(block, dict):
-                    if block.get("type") == "text":
-                        text_content = block.get("text", "")
-                        if text_content:  # Only add non-empty text blocks
-                            content_blocks.append(
-                                ContentBlock(ContentType.TEXT, text_content)
-                            )
-                    elif block.get("type") == "tool_use":
-                        content_blocks.append(
-                            ContentBlock(
-                                ContentType.TOOL_USE,
-                                {
-                                    "id": block["id"],
-                                    "name": block["name"],
-                                    "input": block["input"],
-                                },
-                            )
-                        )
-            if content_blocks:
-                return Message(MessageRole.ASSISTANT, content_blocks)
-        # Fallback to string representation
-        return Message(MessageRole.ASSISTANT, str(msg_content))
-    def _convert_history_to_messages(self) -> list[Message]:
-        """Convert conversation history to Message objects."""
-        messages = []
-        for msg in self.conversation_history:
-            if msg["role"] == "user":
-                messages.append(self._convert_user_message_to_message(msg["content"]))
-            elif msg["role"] == "assistant":
-                messages.append(
-                    self._convert_assistant_message_to_message(msg["content"])
-                )
-        return messages
-    def _convert_tool_results_to_message(
-        self, tool_results: list[dict[str, Any]]
-    ) -> Message:
-        """Convert tool results to a user Message object."""
-        tool_result_blocks = []
-        for tool_result in tool_results:
-            tool_result_blocks.append(
-                ContentBlock(ContentType.TOOL_RESULT, tool_result)
-            )
-        return Message(MessageRole.USER, tool_result_blocks)
-    def _convert_response_content_to_message(
-        self, content: list[dict[str, Any]]
-    ) -> Message:
-        """Convert response content to assistant Message object."""
-        content_blocks = []
-        for block in content:
-            if block.get("type") == "text":
-                text_content = block["text"]
-                if text_content:  # Only add non-empty text blocks
-                    content_blocks.append(ContentBlock(ContentType.TEXT, text_content))
-            elif block.get("type") == "tool_use":
-                content_blocks.append(
-                    ContentBlock(
-                        ContentType.TOOL_USE,
-                        {
-                            "id": block["id"],
-                            "name": block["name"],
-                            "input": block["input"],
-                        },
-                    )
-                )
-        return Message(MessageRole.ASSISTANT, content_blocks)
-    async def _execute_and_yield_tool_results(
-        self,
-        response_content: list[dict[str, Any]],
-        cancellation_token: asyncio.Event | None = None,
-    ) -> AsyncIterator[StreamEvent | list[dict[str, Any]]]:
-        """Execute tool calls and yield appropriate stream events."""
-        tool_results = []
-        for block in response_content:
-            if block.get("type") == "tool_use":
-                # Check for cancellation before tool execution
-                if cancellation_token is not None and cancellation_token.is_set():
-                    yield tool_results
-                    return
-                yield StreamEvent(
-                    "tool_use",
-                    {
-                        "name": block["name"],
-                        "input": block["input"],
-                        "status": "executing",
-                    },
-                )
-                tool_result = await self.process_tool_call(
-                    block["name"], block["input"]
-                )
-                # Yield specific events based on tool type
-                if block["name"] == "execute_sql" and self._last_results:
-                    yield StreamEvent(
-                        "query_result",
-                        {
-                            "query": self._last_query,
-                            "results": self._last_results,
-                        },
-                    )
-                elif block["name"] in ["list_tables", "introspect_schema"]:
-                    yield StreamEvent(
-                        "tool_result",
-                        {
-                            "tool_name": block["name"],
-                            "result": tool_result,
-                        },
-                    )
-                elif block["name"] == "plot_data":
-                    yield StreamEvent(
-                        "plot_result",
-                        {
-                            "tool_name": block["name"],
-                            "input": block["input"],
-                            "result": tool_result,
-                        },
-                    )
-                tool_results.append(build_tool_result_block(block["id"], tool_result))
-        yield tool_results
-    async def _handle_stream_events(
-        self,
-        stream_iterator: AsyncIterator[Any],
-        cancellation_token: asyncio.Event | None = None,
-    ) -> AsyncIterator[StreamEvent | Any]:
-        """Handle streaming events and yield stream events, return final response."""
-        response = None
-        async for event in stream_iterator:
-            if cancellation_token is not None and cancellation_token.is_set():
-                yield None
-                return
-            # Handle different event types
-            if hasattr(event, "type"):
-                if event.type == "content_block_start":
-                    if hasattr(event.content_block, "type"):
-                        if event.content_block.type == "tool_use":
-                            yield StreamEvent(
-                                "tool_use",
-                                {
-                                    "name": event.content_block.name,
-                                    "status": "started",
-                                },
-                            )
-                elif event.type == "content_block_delta":
-                    if hasattr(event.delta, "text"):
-                        text = event.delta.text
-                        if text is not None and text:  # Only yield non-empty text
-                            yield StreamEvent("text", text)
-            elif isinstance(event, dict) and event.get("type") == "response_ready":
-                response = event["data"]
-        yield response
-    def _create_message_request(self, messages: list[Message]) -> CreateMessageRequest:
-        """Create a CreateMessageRequest with standard parameters."""
-        return CreateMessageRequest(
-            model=self.model,
-            messages=messages,
-            max_tokens=self.MAX_TOKENS,
-            system=self.system_prompt,
-            tools=self.tools,
-            stream=True,
-        )
-    async def query_stream(
-        self,
-        user_query: str,
-        use_history: bool = True,
-        cancellation_token: asyncio.Event | None = None,
-    ) -> AsyncIterator[StreamEvent]:
-        """Process a user query and stream responses."""
-        # Initialize for tracking state
-        self._last_results = None
-        self._last_query = None
-        try:
-            # Ensure conversation is active for persistence
-            await self._ensure_conversation()
-            # Store user message in conversation history and persistence
-            if use_history:
-                self.conversation_history.append(
-                    {"role": "user", "content": user_query}
-                )
-                await self._store_user_message(user_query)
-            # Build messages with history if requested
-            messages = []
-            if use_history:
-                messages = self._convert_history_to_messages()
-            # For OAuth with no history, inject SQL assistant instructions as first user message
-            is_oauth = hasattr(self.client, "use_oauth") and self.client.use_oauth
-            if is_oauth and not messages:
-                instructions = self._get_sql_assistant_instructions()
-                messages.append(Message(MessageRole.USER, instructions))
-            # Add current user message if not already in messages from history
-            if not use_history:
-                messages.append(Message(MessageRole.USER, user_query))
-            # Create initial request and get response
-            request = self._create_message_request(messages)
-            response = None
-            async for event in self._handle_stream_events(
-                self.client.create_message_with_tools(request, cancellation_token),
-                cancellation_token,
-            ):
-                if isinstance(event, StreamEvent):
-                    yield event
-                else:
-                    response = event
-            # Handle tool use cycles
-            collected_content = []
-            while response is not None and response.stop_reason == "tool_use":
-                if cancellation_token is not None and cancellation_token.is_set():
-                    return
-                # Add assistant's response to conversation
-                assistant_content = {"role": "assistant", "content": response.content}
-                collected_content.append(assistant_content)
-                # Store the assistant message immediately (not from collected_content)
-                if use_history:
-                    await self._store_assistant_message(response.content)
-                # Execute tools and get results
-                tool_results = []
-                async for event in self._execute_and_yield_tool_results(
-                    response.content, cancellation_token
-                ):
-                    if isinstance(event, StreamEvent):
-                        yield event
-                    elif isinstance(event, list):
-                        tool_results = event
-                # Continue conversation with tool results
-                tool_content = {"role": "user", "content": tool_results}
-                collected_content.append(tool_content)
-                # Store the tool message immediately and update history
-                if use_history:
-                    # Only add the NEW messages to history (not the accumulated ones)
-                    # collected_content has [assistant1, tool1, assistant2, tool2, ...]
-                    # We only want to add the last 2 items that were just added
-                    new_messages_for_history = collected_content[
-                        -2:
-                    ]  # Last assistant + tool pair
-                    self.conversation_history.extend(new_messages_for_history)
-                    await self._store_tool_message(tool_results)
-                if cancellation_token is not None and cancellation_token.is_set():
-                    return
-                yield StreamEvent("processing", "Analyzing results...")
-                # Build new messages with collected content
-                new_messages = messages.copy()
-                for content in collected_content:
-                    if content["role"] == "user":
-                        new_messages.append(
-                            self._convert_tool_results_to_message(content["content"])
-                        )
-                    elif content["role"] == "assistant":
-                        new_messages.append(
-                            self._convert_response_content_to_message(
-                                content["content"]
-                            )
-                        )
-                # Get next response
-                request = self._create_message_request(new_messages)
-                response = None
-                async for event in self._handle_stream_events(
-                    self.client.create_message_with_tools(request, cancellation_token),
-                    cancellation_token,
-                ):
-                    if isinstance(event, StreamEvent):
-                        yield event
-                    else:
-                        response = event
-            # Update conversation history with final response
-            if use_history and response is not None:
-                self.conversation_history.append(
-                    {"role": "assistant", "content": response.content}
-                )
-                # Store final assistant message in persistence (only if not tool_use)
-                if response.stop_reason != "tool_use":
-                    await self._store_assistant_message(response.content)
-        except asyncio.CancelledError:
-            return
-        except Exception as e:
-            yield StreamEvent("error", str(e))
-    async def close(self):
-        """Close the client."""
-        await self.client.close()

sqlsaber/agents/streaming.py DELETED Viewed

@@ -1,16 +0,0 @@
-"""Streaming utilities for agents."""
-from typing import Any
-class StreamingResponse:
-    """Helper class to manage streaming response construction."""
-    def __init__(self, content: list[dict[str, Any]], stop_reason: str):
-        self.content = content
-        self.stop_reason = stop_reason
-def build_tool_result_block(tool_use_id: str, content: str) -> dict[str, Any]:
-    """Build a tool result block for the conversation."""
-    return {"type": "tool_result", "tool_use_id": tool_use_id, "content": content}

sqlsaber/clients/__init__.py DELETED Viewed

@@ -1,6 +0,0 @@
-"""Client implementations for various LLM APIs."""
-from .base import BaseLLMClient
-from .anthropic import AnthropicClient
-__all__ = ["BaseLLMClient", "AnthropicClient"]

sqlsaber 0.14.0__py3-none-any.whl → 0.16.0__py3-none-any.whl

Potentially problematic release.

sqlsaber 0.14.0py3-none-any.whl → 0.16.0py3-none-any.whl