voxagent-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (53)
  1. voxagent/__init__.py +143 -0
  2. voxagent/_version.py +5 -0
  3. voxagent/agent/__init__.py +32 -0
  4. voxagent/agent/abort.py +178 -0
  5. voxagent/agent/core.py +902 -0
  6. voxagent/code/__init__.py +9 -0
  7. voxagent/mcp/__init__.py +16 -0
  8. voxagent/mcp/manager.py +188 -0
  9. voxagent/mcp/tool.py +152 -0
  10. voxagent/providers/__init__.py +110 -0
  11. voxagent/providers/anthropic.py +498 -0
  12. voxagent/providers/augment.py +293 -0
  13. voxagent/providers/auth.py +116 -0
  14. voxagent/providers/base.py +268 -0
  15. voxagent/providers/chatgpt.py +415 -0
  16. voxagent/providers/claudecode.py +162 -0
  17. voxagent/providers/cli_base.py +265 -0
  18. voxagent/providers/codex.py +183 -0
  19. voxagent/providers/failover.py +90 -0
  20. voxagent/providers/google.py +532 -0
  21. voxagent/providers/groq.py +96 -0
  22. voxagent/providers/ollama.py +425 -0
  23. voxagent/providers/openai.py +435 -0
  24. voxagent/providers/registry.py +175 -0
  25. voxagent/py.typed +1 -0
  26. voxagent/security/__init__.py +14 -0
  27. voxagent/security/events.py +75 -0
  28. voxagent/security/filter.py +169 -0
  29. voxagent/security/registry.py +87 -0
  30. voxagent/session/__init__.py +39 -0
  31. voxagent/session/compaction.py +237 -0
  32. voxagent/session/lock.py +103 -0
  33. voxagent/session/model.py +109 -0
  34. voxagent/session/storage.py +184 -0
  35. voxagent/streaming/__init__.py +52 -0
  36. voxagent/streaming/emitter.py +286 -0
  37. voxagent/streaming/events.py +255 -0
  38. voxagent/subagent/__init__.py +20 -0
  39. voxagent/subagent/context.py +124 -0
  40. voxagent/subagent/definition.py +172 -0
  41. voxagent/tools/__init__.py +32 -0
  42. voxagent/tools/context.py +50 -0
  43. voxagent/tools/decorator.py +175 -0
  44. voxagent/tools/definition.py +131 -0
  45. voxagent/tools/executor.py +109 -0
  46. voxagent/tools/policy.py +89 -0
  47. voxagent/tools/registry.py +89 -0
  48. voxagent/types/__init__.py +46 -0
  49. voxagent/types/messages.py +134 -0
  50. voxagent/types/run.py +176 -0
  51. voxagent-0.1.0.dist-info/METADATA +186 -0
  52. voxagent-0.1.0.dist-info/RECORD +53 -0
  53. voxagent-0.1.0.dist-info/WHEEL +4 -0
@@ -0,0 +1,415 @@
1
+ """ChatGPT Backend API provider.
2
+
3
+ This provider uses ChatGPT's private backend API (used by Codex CLI) to access
4
+ models like gpt-5 and gpt-5-codex-mini using a ChatGPT Plus subscription.
5
+
6
+ API Endpoint: https://chatgpt.com/backend-api/codex/responses
7
+ Auth: OAuth Bearer token (from Codex CLI or voxdomus vault)
8
+
9
+ Note: This is an unofficial/undocumented API.
10
+
11
+ Tool Format:
12
+ The ChatGPT backend API uses a flat tool format different from the standard
13
+ OpenAI nested format. This provider automatically converts between formats:
14
+
15
+ Standard OpenAI format (what voxagent uses):
16
+ {"type": "function", "function": {"name": "...", "description": "...", "parameters": {...}}}
17
+
18
+ ChatGPT backend format (flat):
19
+ {"type": "function", "name": "...", "description": "...", "parameters": {...}}
20
+
21
+ The conversion is handled transparently in _convert_tools().
22
+ """
23
+
24
+ from __future__ import annotations
25
+
26
+ import json
27
+ import logging
28
+ import os
29
+ import ssl
30
+ from collections.abc import AsyncIterator
31
+ from typing import Any
32
+
33
+ import certifi
34
+
35
+ import httpx
36
+
37
+ from voxagent.providers.base import (
38
+ AbortSignal,
39
+ BaseProvider,
40
+ ErrorChunk,
41
+ MessageEndChunk,
42
+ StreamChunk,
43
+ TextDeltaChunk,
44
+ ToolUseChunk,
45
+ )
46
+ from voxagent.types import Message, ToolCall
47
+
48
# Module-level logger, namespaced to this module.
logger = logging.getLogger(__name__)

# ChatGPT's private backend endpoint (the same one the Codex CLI talks to).
# Can be overridden per-instance via the `base_url` constructor argument.
CHATGPT_API_ENDPOINT = "https://chatgpt.com/backend-api/codex/responses"

# Fallback system instructions used when the caller supplies neither a
# custom `instructions` value nor a system prompt.
DEFAULT_INSTRUCTIONS = "You are a helpful AI assistant."
55
+
56
+
57
class ChatGPTProvider(BaseProvider):
    """Provider for ChatGPT's private backend API.

    Uses OAuth tokens to access ChatGPT Plus models with full tool support.

    The provider automatically converts voxagent's OpenAI-standard tool format
    to the flat format expected by the ChatGPT backend API.
    """

    ENV_KEY = "CHATGPT_ACCESS_TOKEN"

    SUPPORTED_MODELS = [
        "gpt-5",
        "gpt-5-codex",
        "gpt-5-codex-mini",
        "codex-mini-latest",
    ]

    def __init__(
        self,
        model: str = "gpt-5-codex-mini",
        api_key: str | None = None,
        base_url: str | None = None,
        instructions: str | None = None,
        **kwargs: Any,
    ) -> None:
        """Initialize ChatGPT provider.

        Args:
            model: Model name (gpt-5, gpt-5-codex-mini, etc.).
            api_key: OAuth access token. Falls back to CHATGPT_ACCESS_TOKEN env var.
            base_url: Optional override for the API endpoint.
            instructions: Custom system instructions for the Codex API.
            **kwargs: Additional arguments forwarded to BaseProvider.
        """
        super().__init__(api_key=api_key, base_url=base_url, **kwargs)
        self._model = model
        self._instructions = instructions or DEFAULT_INSTRUCTIONS

    @property
    def name(self) -> str:
        """Get the provider name."""
        return "chatgpt"

    @property
    def models(self) -> list[str]:
        """Get supported models."""
        return self.SUPPORTED_MODELS

    @property
    def supports_tools(self) -> bool:
        """Check if the provider supports tool/function calling.

        Returns:
            True. The ChatGPT backend API supports tools with a flat format;
            tools are automatically converted from OpenAI's nested format.
        """
        return True

    @property
    def supports_streaming(self) -> bool:
        """ChatGPT backend requires streaming."""
        return True

    @property
    def context_limit(self) -> int:
        """Approximate context limit, in tokens."""
        return 128000  # GPT-5 models have large context

    def _convert_tools(self, tools: list[Any] | None) -> list[dict[str, Any]]:
        """Convert OpenAI nested tool format to ChatGPT flat format.

        OpenAI standard format (voxagent uses this):
            {"type": "function", "function": {"name": "...", "description": "...", "parameters": {...}}}

        ChatGPT backend format (flat):
            {"type": "function", "name": "...", "description": "...", "parameters": {...}}

        Args:
            tools: List of tools in OpenAI standard format.

        Returns:
            List of tools in ChatGPT flat format. Unrecognized entries are
            logged and skipped rather than raising.
        """
        if not tools:
            return []

        converted: list[dict[str, Any]] = []
        for tool in tools:
            if isinstance(tool, dict):
                # Nested OpenAI format: unwrap the inner "function" dict.
                if "function" in tool and isinstance(tool["function"], dict):
                    func = tool["function"]
                    converted.append({
                        "type": "function",
                        "name": func.get("name", ""),
                        "description": func.get("description", ""),
                        "parameters": func.get("parameters", {"type": "object", "properties": {}}),
                    })
                # Already flat format (has a top-level name) - pass through.
                elif "name" in tool:
                    converted.append(tool)
                else:
                    logger.warning("Unknown tool format, skipping: %s", tool)
            else:
                logger.warning("Tool is not a dict, skipping: %s", type(tool))

        return converted

    def _get_headers(self) -> dict[str, str]:
        """Build request headers with the OAuth bearer token.

        Raises:
            ValueError: If no access token is configured.
        """
        token = self.api_key
        if not token:
            raise ValueError("No access token. Set CHATGPT_ACCESS_TOKEN or pass api_key.")
        return {
            "Authorization": f"Bearer {token}",
            "Content-Type": "application/json",
        }

    def _build_input(
        self,
        messages: list[Message],
        system: str | None = None,
    ) -> list[dict[str, Any]]:
        """Build the `input` array for an API request.

        Note: System messages in the messages list are skipped because the
        ChatGPT backend uses a separate 'instructions' field for system prompts.
        The voxagent Agent may pass both a system prompt and system messages
        in the list - we handle this by using the system param only.

        Tool results in voxagent come as user messages with content being a list
        of ToolResultBlock objects. These are converted to the ChatGPT
        function_call_output format.

        Assistant messages with tool_calls are converted to function_call
        items so that the backend can match tool results to tool calls.

        Args:
            messages: Conversation messages.
            system: Unused here; system text goes into the request body's
                'instructions' field instead (see _build_request_body).

        Returns:
            List of input items in the ChatGPT backend's format.
        """
        input_msgs: list[dict[str, Any]] = []

        for msg in messages:
            # Skip system messages - ChatGPT API doesn't support them in input.
            if msg.role == "system":
                continue

            # Assistant turns that issued tool calls become function_call items.
            if msg.role == "assistant" and msg.tool_calls:
                # Emit any text content first if present.
                # NOTE(review): assistant text is sent as "input_text"; the
                # Responses API also defines "output_text" for assistant turns -
                # confirm the backend accepts this.
                if isinstance(msg.content, str) and msg.content:
                    input_msgs.append({
                        "type": "message",
                        "role": "assistant",
                        "content": [{"type": "input_text", "text": msg.content}],
                    })
                for tc in msg.tool_calls:
                    # The backend expects arguments as a JSON string, not a dict.
                    args = tc.params
                    if isinstance(args, dict):
                        args = json.dumps(args)
                    input_msgs.append({
                        "type": "function_call",
                        "call_id": tc.id,
                        "name": tc.name,
                        "arguments": args,
                    })
                continue

            # Content may be a list of blocks (tool results or text blocks).
            if isinstance(msg.content, list):
                for block in msg.content:
                    if hasattr(block, "type") and getattr(block, "type", None) == "tool_result":
                        # Pydantic-style ToolResultBlock.
                        input_msgs.append({
                            "type": "function_call_output",
                            "call_id": getattr(block, "tool_use_id", ""),
                            "output": getattr(block, "content", ""),
                        })
                    elif isinstance(block, dict) and block.get("type") == "tool_result":
                        # Dict-style tool result.
                        input_msgs.append({
                            "type": "function_call_output",
                            "call_id": block.get("tool_use_id", ""),
                            "output": block.get("content", ""),
                        })
                    elif hasattr(block, "text"):
                        # Object-style text block.
                        input_msgs.append({
                            "type": "message",
                            "role": "user" if msg.role == "user" else "assistant",
                            "content": [{"type": "input_text", "text": block.text}],
                        })
                    elif isinstance(block, dict) and "text" in block:
                        # Dict-style text block.
                        input_msgs.append({
                            "type": "message",
                            "role": "user" if msg.role == "user" else "assistant",
                            "content": [{"type": "input_text", "text": block["text"]}],
                        })
            elif isinstance(msg.content, str):
                # Simple string content.
                role = "user" if msg.role == "user" else "assistant"
                input_msgs.append({
                    "type": "message",
                    "role": role,
                    "content": [{"type": "input_text", "text": msg.content}],
                })

        return input_msgs

    def _build_request_body(
        self,
        messages: list[Message],
        system: str | None = None,
        tools: list[Any] | None = None,
    ) -> dict[str, Any]:
        """Build the request body for the backend API.

        Args:
            messages: Conversation messages (system messages are filtered out).
            system: System prompt to use as instructions.
            tools: Optional tool definitions in OpenAI standard format.
                These will be converted to ChatGPT's flat format.

        Returns:
            Request body dict ready to send to the ChatGPT backend API.
        """
        # Use the system prompt if provided, otherwise the configured default.
        instructions = system if system else self._instructions

        # Convert tools from OpenAI nested format to ChatGPT flat format.
        converted_tools = self._convert_tools(tools)
        has_tools = len(converted_tools) > 0

        body: dict[str, Any] = {
            "model": self._model,
            "instructions": instructions,
            "input": self._build_input(messages, system),
            "tools": converted_tools,
            "tool_choice": "auto" if has_tools else "none",
            "parallel_tool_calls": False,
            "reasoning": {"summary": "auto"},
            "store": False,
            "stream": True,
        }
        return body

    async def stream(
        self,
        messages: list[Message],
        system: str | None = None,
        tools: list[Any] | None = None,
        abort_signal: AbortSignal | None = None,
    ) -> AsyncIterator[StreamChunk]:
        """Stream a response from the ChatGPT backend.

        Args:
            messages: Conversation messages.
            system: Optional system prompt.
            tools: Optional tool definitions.
            abort_signal: Optional abort signal checked between SSE lines.

        Yields:
            StreamChunk objects; always ends with a MessageEndChunk, even
            after an ErrorChunk.
        """
        body = self._build_request_body(messages, system, tools)
        endpoint = self._base_url or CHATGPT_API_ENDPOINT

        try:
            async with httpx.AsyncClient() as client:
                async with client.stream(
                    "POST",
                    endpoint,
                    headers=self._get_headers(),
                    json=body,
                    timeout=120.0,
                ) as response:
                    if response.status_code == 401:
                        yield ErrorChunk(error="Authentication failed - token may be expired")
                        return
                    response.raise_for_status()

                    # Parse the SSE stream line by line.
                    async for line in response.aiter_lines():
                        if abort_signal and abort_signal.aborted:
                            break
                        if not line or not line.startswith("data:"):
                            continue
                        data_str = line[5:].strip()
                        if data_str == "[DONE]":
                            break
                        try:
                            data = json.loads(data_str)
                            event_type = data.get("type", "")
                            # Text delta events.
                            if event_type == "response.output_text.delta":
                                text = data.get("delta", "")
                                if text:
                                    yield TextDeltaChunk(delta=text)
                            # Tool calls - use output_item.done which has all data.
                            elif event_type == "response.output_item.done":
                                item = data.get("item", {})
                                if item.get("type") == "function_call":
                                    yield ToolUseChunk(
                                        tool_call=ToolCall(
                                            id=item.get("call_id", ""),
                                            name=item.get("name", ""),
                                            params=json.loads(item.get("arguments", "{}")),
                                        )
                                    )
                        except json.JSONDecodeError:
                            # Skip malformed SSE payloads rather than aborting.
                            continue
        except httpx.HTTPStatusError as e:
            # Can't access response.text on a streaming response without read().
            yield ErrorChunk(error=f"HTTP {e.response.status_code}")
        except Exception as e:
            yield ErrorChunk(error=str(e))

        yield MessageEndChunk()

    async def complete(
        self,
        messages: list[Message],
        system: str | None = None,
        tools: list[Any] | None = None,
    ) -> Message:
        """Get a complete response by collecting streamed chunks.

        Raises:
            Exception: If the stream yields an ErrorChunk.
        """
        text_parts: list[str] = []
        tool_calls: list[ToolCall] = []

        async for chunk in self.stream(messages, system, tools):
            if isinstance(chunk, TextDeltaChunk):
                text_parts.append(chunk.delta)
            elif isinstance(chunk, ToolUseChunk):
                tool_calls.append(chunk.tool_call)
            elif isinstance(chunk, ErrorChunk):
                raise Exception(chunk.error)

        return Message(
            role="assistant",
            content="".join(text_parts) if text_parts else None,
            tool_calls=tool_calls if tool_calls else None,
        )

    def count_tokens(
        self,
        messages: list[Message],
        system: str | None = None,
    ) -> int:
        """Estimate token count (rough approximation, ~4 chars per token).

        Handles both plain-string content and block-list content. The previous
        implementation did `text += msg.content or ""`, which raised TypeError
        whenever content was a list of blocks (a shape the rest of this class
        explicitly supports).
        """
        parts: list[str] = [system or ""]
        for msg in messages:
            content = msg.content
            if isinstance(content, str):
                parts.append(content)
            elif isinstance(content, list):
                for block in content:
                    if isinstance(block, dict):
                        parts.append(str(block.get("text", "") or block.get("content", "")))
                    else:
                        parts.append(str(getattr(block, "text", "") or getattr(block, "content", "")))
        # Rough estimate: ~4 chars per token.
        return len("".join(parts)) // 4
412
+
413
+
414
# Public names exported by this module.
__all__ = ["ChatGPTProvider", "CHATGPT_API_ENDPOINT"]
415
+
@@ -0,0 +1,162 @@
1
+ """Claude Code CLI provider.
2
+
3
+ This provider wraps the Anthropic Claude Code CLI (claude command).
4
+ It requires:
5
+ 1. The claude CLI to be installed
6
+ 2. Authentication via: claude setup-token
7
+
8
+ Models available:
9
+ - sonnet: Claude Sonnet (latest)
10
+ - opus: Claude Opus (latest)
11
+ - haiku: Claude Haiku (latest)
12
+ """
13
+
14
+ from __future__ import annotations
15
+
16
+ import json
17
+ import logging
18
+ from collections.abc import AsyncIterator
19
+ from typing import Any
20
+
21
+ from voxagent.providers.cli_base import CLINotFoundError, CLIProvider
22
+ from voxagent.providers.base import (
23
+ AbortSignal,
24
+ ErrorChunk,
25
+ MessageEndChunk,
26
+ StreamChunk,
27
+ TextDeltaChunk,
28
+ )
29
+ from voxagent.types import Message
30
+
31
# Module-level logger, namespaced to this module.
logger = logging.getLogger(__name__)
32
+
33
+
34
class ClaudeCodeProvider(CLIProvider):
    """Provider backed by the Anthropic Claude Code CLI (`claude`).

    Runs the CLI in non-interactive print mode with plain-text output,
    turning a one-shot subprocess invocation into the streaming interface
    the rest of voxagent expects.
    """

    CLI_NAME = "claude"
    ENV_KEY = "ANTHROPIC_API_KEY"

    SUPPORTED_MODELS = [
        "sonnet",
        "opus",
        "haiku",
    ]

    def __init__(
        self,
        model: str = "sonnet",
        api_key: str | None = None,
        base_url: str | None = None,
        **kwargs: Any,
    ) -> None:
        """Initialize the Claude Code provider.

        Args:
            model: Model alias (sonnet, opus, haiku).
            api_key: Optional Anthropic API key.
            base_url: Optional base URL override.
            **kwargs: Additional arguments forwarded to CLIProvider.
        """
        super().__init__(model=model, api_key=api_key, base_url=base_url, **kwargs)

    @property
    def name(self) -> str:
        """Provider identifier used in the registry."""
        return "claudecode"

    @property
    def models(self) -> list[str]:
        """Model aliases this provider accepts."""
        return self.SUPPORTED_MODELS

    @property
    def supports_tools(self) -> bool:
        """Tool calling is not exposed; the CLI manages its own MCP tools."""
        return False

    @property
    def context_limit(self) -> int:
        """Approximate context window, in tokens."""
        return 200000

    def _build_cli_args(
        self,
        prompt: str,
        system: str | None = None,
    ) -> list[str]:
        """Assemble argv for a one-shot `claude --print` invocation.

        The prompt is always the final positional argument.
        """
        cli_args: list[str] = ["--print", "--output-format", "text"]
        if self._model:
            cli_args += ["--model", self._model]
        if system:
            cli_args += ["--system-prompt", system]
        cli_args.append(prompt)
        return cli_args

    def _parse_output(self, stdout: str, stderr: str) -> str:
        """Extract the response text; `claude --print` emits it verbatim on stdout."""
        return stdout.strip()

    async def stream(
        self,
        messages: list[Message],
        system: str | None = None,
        tools: list[Any] | None = None,
        abort_signal: AbortSignal | None = None,
    ) -> AsyncIterator[StreamChunk]:
        """Yield the CLI's full response as a single text chunk.

        The claude CLI carries its own MCP tool configuration, so any tools
        passed in are ignored (logged at debug level). Always ends with a
        MessageEndChunk, even after an error.
        """
        if tools:
            logger.debug(
                "Claude CLI has its own MCP tools - ignoring %d passed tools",
                len(tools),
            )

        try:
            rendered = self._messages_to_prompt(messages)
            output = await self._run_cli(rendered, system)
            if output:
                yield TextDeltaChunk(delta=output)
        except CLINotFoundError as exc:
            yield ErrorChunk(error=str(exc))
        except Exception as exc:
            yield ErrorChunk(error=f"Claude Code CLI error: {exc}")

        yield MessageEndChunk()

    async def complete(
        self,
        messages: list[Message],
        system: str | None = None,
        tools: list[Any] | None = None,
    ) -> Message:
        """Collect the streamed chunks into one assistant Message.

        Raises:
            Exception: If the stream reports an ErrorChunk.
        """
        collected: list[str] = []

        async for chunk in self.stream(messages, system, tools):
            if isinstance(chunk, ErrorChunk):
                raise Exception(chunk.error)
            if isinstance(chunk, TextDeltaChunk):
                collected.append(chunk.delta)

        return Message(role="assistant", content="".join(collected))
159
+
160
+
161
# Public names exported by this module.
__all__ = ["ClaudeCodeProvider"]
162
+