cli2api-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cli2api/__init__.py ADDED
@@ -0,0 +1,3 @@
+ """CLI2API - OpenAI-compatible API over CLI tools."""
+
+ __version__ = "0.1.0"
cli2api/__main__.py ADDED
@@ -0,0 +1,22 @@
+ """Entry point for running CLI2API as a module."""
+
+ import uvicorn
+
+ from cli2api.api.dependencies import get_settings
+
+
+ def main():
+     """Run the CLI2API server."""
+     settings = get_settings()
+
+     uvicorn.run(
+         "cli2api.main:app",
+         host=settings.host,
+         port=settings.port,
+         reload=settings.debug,
+         log_level=settings.log_level.lower(),
+     )
+
+
+ if __name__ == "__main__":
+     main()
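For orientation (not part of the packaged diff): a minimal sketch of launching the server programmatically rather than via `python -m cli2api`. Only the CLI2API_CLAUDE_CLI_PATH variable name is confirmed by this diff; the path value is a placeholder.

    import os

    # Hypothetical path; point this at wherever the Claude CLI binary actually lives.
    os.environ.setdefault("CLI2API_CLAUDE_CLI_PATH", "/usr/local/bin/claude")

    from cli2api.__main__ import main

    main()  # serves "cli2api.main:app" on settings.host:settings.port until interrupted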
cli2api/api/__init__.py ADDED
@@ -0,0 +1,5 @@
+ """API module with FastAPI routers."""
+
+ from cli2api.api.router import api_router
+
+ __all__ = ["api_router"]
cli2api/api/dependencies.py ADDED
@@ -0,0 +1,38 @@
+ """FastAPI dependencies for dependency injection."""
+
+ from functools import lru_cache
+ from pathlib import Path
+
+ from cli2api.config.settings import Settings
+ from cli2api.providers.claude import ClaudeCodeProvider
+
+
+ @lru_cache
+ def get_settings() -> Settings:
+     """Get cached application settings.
+
+     Returns:
+         Singleton Settings instance.
+     """
+     return Settings()
+
+
+ @lru_cache
+ def get_provider() -> ClaudeCodeProvider:
+     """Get cached Claude provider.
+
+     Returns:
+         Singleton ClaudeCodeProvider instance.
+
+     Raises:
+         RuntimeError: If Claude CLI is not configured.
+     """
+     settings = get_settings()
+     if not settings.claude_cli_path:
+         raise RuntimeError("Claude CLI not found. Set CLI2API_CLAUDE_CLI_PATH.")
+
+     return ClaudeCodeProvider(
+         executable_path=Path(settings.claude_cli_path),
+         default_timeout=settings.default_timeout,
+         models=settings.get_claude_models(),
+     )
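A note on the @lru_cache singletons above: in tests you can either override the dependency through FastAPI or clear the cache when environment variables change. A hedged sketch, assuming the app lives at cli2api.main (as the "cli2api.main:app" target in __main__.py suggests) and that a stub provider exposes the same execute()/execute_stream() interface:

    from fastapi.testclient import TestClient

    from cli2api.api.dependencies import get_provider, get_settings
    from cli2api.main import app  # assumed location, per "cli2api.main:app" above


    def stub_provider():
        ...  # return an object exposing execute() / execute_stream()


    app.dependency_overrides[get_provider] = stub_provider
    client = TestClient(app)

    # If a test changes CLI2API_* environment variables instead,
    # drop the cached Settings so the new values are picked up:
    get_settings.cache_clear()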
cli2api/api/router.py ADDED
@@ -0,0 +1,12 @@
+ """Main API router combining all endpoints."""
+
+ from fastapi import APIRouter
+
+ from cli2api.api.v1 import chat, models, responses
+
+ api_router = APIRouter()
+
+ # Include v1 routers
+ api_router.include_router(chat.router, prefix="/v1", tags=["chat"])
+ api_router.include_router(models.router, prefix="/v1", tags=["models"])
+ api_router.include_router(responses.router, prefix="/v1", tags=["responses"])
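cli2api/main.py itself is not shown in this diff, but given the uvicorn target "cli2api.main:app", the wiring presumably looks roughly like this sketch (the title is invented):

    from fastapi import FastAPI

    from cli2api.api import api_router

    app = FastAPI(title="cli2api")  # hypothetical title
    app.include_router(api_router)  # mounts /v1/chat/completions, /v1/models, /v1/responses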
cli2api/api/utils.py ADDED
@@ -0,0 +1,15 @@
+ """Shared utilities for API endpoints."""
+
+
+ def parse_model_name(model_id: str) -> str:
+     """Extract actual model name from prefixed format.
+
+     Args:
+         model_id: Model ID like "claude: sonnet" or "sonnet".
+
+     Returns:
+         Actual model name like "sonnet".
+     """
+     if ": " in model_id:
+         return model_id.split(": ", 1)[1]
+     return model_id
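The prefix handling follows directly from the code: only the two-character separator ": " (colon plus space) triggers a split.

    assert parse_model_name("claude: sonnet") == "sonnet"
    assert parse_model_name("sonnet") == "sonnet"
    assert parse_model_name("claude:sonnet") == "claude:sonnet"  # no space, so left unchanged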
cli2api/api/v1/__init__.py ADDED
@@ -0,0 +1,5 @@
+ """API v1 endpoints."""
+
+ from cli2api.api.v1 import chat, models, responses
+
+ __all__ = ["chat", "models", "responses"]
cli2api/api/v1/chat.py ADDED
@@ -0,0 +1,378 @@
+ """Chat completions endpoint - OpenAI compatible."""
+
+ import time
+ import uuid
+ from typing import AsyncIterator
+
+ from fastapi import APIRouter, Depends, HTTPException
+ from fastapi.responses import StreamingResponse
+
+ from cli2api.api.dependencies import get_provider
+ from cli2api.api.utils import parse_model_name
+ from cli2api.providers.claude import ClaudeCodeProvider
+ from cli2api.schemas.openai import (
+     ChatCompletionChunk,
+     ChatCompletionChoice,
+     ChatCompletionRequest,
+     ChatCompletionResponse,
+     ChatMessage,
+     DeltaContent,
+     ResponseMessage,
+     StreamChoice,
+     ToolCall,
+     ToolCallFunction,
+     UsageInfo,
+ )
+ from cli2api.streaming.sse import sse_encode, sse_error
+ from cli2api.utils.logging import get_logger
+
+ logger = get_logger(__name__)
+
+ router = APIRouter()
+
+
+ @router.post("/chat/completions")
+ async def chat_completions(
+     request: ChatCompletionRequest,
+     provider: ClaudeCodeProvider = Depends(get_provider),
+ ):
+     """Create a chat completion.
+
+     OpenAI-compatible endpoint supporting both streaming and non-streaming modes.
+
+     Args:
+         request: Chat completion request.
+         provider: Claude provider (injected).
+
+     Returns:
+         ChatCompletionResponse for non-streaming, StreamingResponse for streaming.
+     """
+     actual_model = parse_model_name(request.model)
+     completion_id = f"chatcmpl-{uuid.uuid4().hex[:24]}"
+
+     if request.stream:
+         return StreamingResponse(
+             stream_completion(
+                 provider=provider,
+                 messages=request.messages,
+                 model=actual_model,
+                 completion_id=completion_id,
+                 tools=request.tools,
+                 reasoning_effort=request.reasoning_effort,
+             ),
+             media_type="text/event-stream",
+             headers={
+                 "Cache-Control": "no-cache",
+                 "Connection": "keep-alive",
+                 "X-Accel-Buffering": "no",
+             },
+         )
+     else:
+         # Non-streaming response
+         try:
+             result = await provider.execute(
+                 messages=request.messages,
+                 model=actual_model,
+                 tools=request.tools,
+             )
+         except TimeoutError as e:
+             raise HTTPException(status_code=504, detail=str(e))
+         except RuntimeError as e:
+             raise HTTPException(status_code=500, detail=str(e))
+
+         # Build usage info
+         usage = UsageInfo()
+         if result.usage:
+             usage = UsageInfo(
+                 prompt_tokens=result.usage.get("input_tokens", 0),
+                 completion_tokens=result.usage.get("output_tokens", 0),
+                 total_tokens=(
+                     result.usage.get("input_tokens", 0)
+                     + result.usage.get("output_tokens", 0)
+                 ),
+             )
+
+         # Check for tool_calls in result
+         if result.tool_calls:
+             tool_calls = [
+                 ToolCall(
+                     id=tc["id"],
+                     type=tc.get("type", "function"),
+                     function=ToolCallFunction(
+                         name=tc["function"]["name"],
+                         arguments=tc["function"]["arguments"],
+                     ),
+                 )
+                 for tc in result.tool_calls
+             ]
+             response = ChatCompletionResponse(
+                 id=completion_id,
+                 model=request.model,
+                 choices=[
+                     ChatCompletionChoice(
+                         index=0,
+                         message=ResponseMessage(
+                             role="assistant",
+                             content=result.content if result.content else None,
+                             tool_calls=tool_calls,
+                         ),
+                         finish_reason="tool_calls",
+                     )
+                 ],
+                 usage=usage,
+             )
+             return response.model_dump(exclude_none=True)
+
+         response = ChatCompletionResponse(
+             id=completion_id,
+             model=request.model,
+             choices=[
+                 ChatCompletionChoice(
+                     index=0,
+                     message=ResponseMessage(role="assistant", content=result.content),
+                     finish_reason="stop",
+                 )
+             ],
+             usage=usage,
+         )
+         return response.model_dump(exclude_none=True)
+
+
+ def split_content_chunks(content: str, max_size: int = 150) -> list[str]:
+     """Split large content into smaller chunks.
+
+     Tries to split on word boundaries for cleaner output.
+
+     Args:
+         content: Content to split.
+         max_size: Maximum chunk size in characters.
+
+     Returns:
+         List of content chunks.
+     """
+     if len(content) <= max_size:
+         return [content]
+
+     chunks = []
+     remaining = content
+
+     while remaining:
+         if len(remaining) <= max_size:
+             chunks.append(remaining)
+             break
+
+         # Try to find a good split point (space, newline)
+         split_at = max_size
+         for sep in [" ", "\n", ".", ",", ";"]:
+             pos = remaining.rfind(sep, 0, max_size)
+             if pos > max_size // 2:  # Don't split too early
+                 split_at = pos + 1
+                 break
+
+         chunks.append(remaining[:split_at])
+         remaining = remaining[split_at:]
+
+     return chunks
+
+
+ async def stream_completion(
+     provider: ClaudeCodeProvider,
+     messages: list[ChatMessage],
+     model: str,
+     completion_id: str,
+     tools: list[dict] | None = None,
+     reasoning_effort: str | None = None,
+ ) -> AsyncIterator[str]:
+     """Generate SSE events for a streaming completion.
+
+     Args:
+         provider: The Claude provider to use.
+         messages: Chat messages.
+         model: Model identifier.
+         completion_id: Unique completion ID.
+         tools: Optional tool definitions.
+         reasoning_effort: Reasoning effort for extended thinking (low/medium/high).
+
+     Yields:
+         SSE-encoded strings.
+     """
+     created = int(time.time())
+     sent_final = False
+
+     logger.info(f"[{completion_id}] Starting stream for model={model}")
+
+     try:
+         # First chunk with role
+         first_chunk = ChatCompletionChunk(
+             id=completion_id,
+             created=created,
+             model=model,
+             choices=[
+                 StreamChoice(
+                     index=0,
+                     delta=DeltaContent(role="assistant"),
+                     finish_reason=None,
+                 )
+             ],
+         )
+         yield sse_encode(first_chunk.model_dump())
+
+         # When tools are provided, buffer content to check for tool_calls before sending
+         content_buffer = "" if tools else None
+
+         # Stream content chunks
+         async for chunk in provider.execute_stream(
+             messages=messages, model=model, tools=tools, reasoning_effort=reasoning_effort
+         ):
+             if chunk.is_final:
+                 if not sent_final:
+                     # Check for tool_calls in chunk or buffered content
+                     tool_calls_data = chunk.tool_calls
+
+                     # If we buffered content, check it for tool_calls
+                     if content_buffer and not tool_calls_data:
+                         from cli2api.tools.handler import ToolHandler
+                         _, parsed_tools = ToolHandler.parse_tool_calls(content_buffer)
+                         if parsed_tools:
+                             tool_calls_data = parsed_tools
+
+                     if tool_calls_data:
+                         tool_calls = [
+                             ToolCall(
+                                 id=tc["id"],
+                                 type=tc.get("type", "function"),
+                                 function=ToolCallFunction(
+                                     name=tc["function"]["name"],
+                                     arguments=tc["function"]["arguments"],
+                                 ),
+                             )
+                             for tc in tool_calls_data
+                         ]
+                         tool_chunk = ChatCompletionChunk(
+                             id=completion_id,
+                             created=created,
+                             model=model,
+                             choices=[
+                                 StreamChoice(
+                                     index=0,
+                                     delta=DeltaContent(tool_calls=tool_calls),
+                                     finish_reason="tool_calls",
+                                 )
+                             ],
+                         )
+                         yield sse_encode(tool_chunk.model_dump())
+                     else:
+                         # No tool_calls - send buffered content if any
+                         if content_buffer:
+                             content_parts = split_content_chunks(content_buffer)
+                             for part in content_parts:
+                                 content_chunk = ChatCompletionChunk(
+                                     id=completion_id,
+                                     created=created,
+                                     model=model,
+                                     choices=[
+                                         StreamChoice(
+                                             index=0,
+                                             delta=DeltaContent(content=part),
+                                             finish_reason=None,
+                                         )
+                                     ],
+                                 )
+                                 yield sse_encode(content_chunk.model_dump())
+
+                         # Normal final chunk
+                         final_chunk = ChatCompletionChunk(
+                             id=completion_id,
+                             created=created,
+                             model=model,
+                             choices=[
+                                 StreamChoice(
+                                     index=0,
+                                     delta=DeltaContent(),
+                                     finish_reason="stop",
+                                 )
+                             ],
+                         )
+                         yield sse_encode(final_chunk.model_dump())
+                     sent_final = True
+
+             elif chunk.reasoning:
+                 # Stream reasoning/thinking content
+                 from cli2api.schemas.openai import ReasoningDetail
+                 reasoning_chunk = ChatCompletionChunk(
+                     id=completion_id,
+                     created=created,
+                     model=model,
+                     choices=[
+                         StreamChoice(
+                             index=0,
+                             delta=DeltaContent(
+                                 reasoning_details=[
+                                     ReasoningDetail(
+                                         type="reasoning.text",
+                                         text=chunk.reasoning,
+                                     )
+                                 ]
+                             ),
+                             finish_reason=None,
+                         )
+                     ],
+                 )
+                 yield sse_encode(reasoning_chunk.model_dump())
+
+             elif chunk.content:
+                 # Check if this is a step indicator (should be streamed immediately)
+                 is_step = chunk.content.startswith("`") and any(
+                     emoji in chunk.content for emoji in ["🤔", "⚡", "🔍", "📄", "🔧", "✏️"]
+                 )
+
+                 if content_buffer is not None and not is_step:
+                     # Buffer regular content when tools are active (might be tool_call JSON)
+                     content_buffer += chunk.content
+                 else:
+                     # Stream step indicators and regular content immediately
+                     content_parts = split_content_chunks(chunk.content)
+                     for part in content_parts:
+                         content_chunk = ChatCompletionChunk(
+                             id=completion_id,
+                             created=created,
+                             model=model,
+                             choices=[
+                                 StreamChoice(
+                                     index=0,
+                                     delta=DeltaContent(content=part),
+                                     finish_reason=None,
+                                 )
+                             ],
+                         )
+                         yield sse_encode(content_chunk.model_dump())
+
+         # Ensure final chunk is sent
+         if not sent_final:
+             final_chunk = ChatCompletionChunk(
+                 id=completion_id,
+                 created=created,
+                 model=model,
+                 choices=[
+                     StreamChoice(
+                         index=0,
+                         delta=DeltaContent(),
+                         finish_reason="stop",
+                     )
+                 ],
+             )
+             yield sse_encode(final_chunk.model_dump())
+
+         # Final [DONE] event
+         logger.info(f"[{completion_id}] Stream completed successfully")
+         yield "data: [DONE]\n\n"
+
+     except RuntimeError as e:
+         logger.error(f"[{completion_id}] Provider error: {e}")
+         yield sse_error(str(e))
+         yield "data: [DONE]\n\n"
+     except Exception as e:
+         logger.error(f"[{completion_id}] Stream error: {e}")
+         yield sse_error(str(e))
+         yield "data: [DONE]\n\n"
cli2api/api/v1/models.py ADDED
@@ -0,0 +1,52 @@
+ """Models endpoint - OpenAI compatible."""
+
+ from fastapi import APIRouter, Depends, HTTPException
+
+ from cli2api.api.dependencies import get_provider
+ from cli2api.providers.claude import ClaudeCodeProvider
+ from cli2api.schemas.openai import ModelInfo, ModelsResponse
+
+ router = APIRouter()
+
+
+ @router.get("/models")
+ async def list_models(
+     provider: ClaudeCodeProvider = Depends(get_provider),
+ ) -> ModelsResponse:
+     """List available models.
+
+     Returns:
+         ModelsResponse with all available Claude models.
+     """
+     models = []
+     for model_id in provider.supported_models:
+         # Format as "claude: model"
+         full_id = f"claude: {model_id}"
+         models.append(ModelInfo(id=full_id, owned_by="claude"))
+     return ModelsResponse(data=sorted(models, key=lambda m: m.id))
+
+
+ @router.get("/models/{model_id:path}")
+ async def get_model(
+     model_id: str,
+     provider: ClaudeCodeProvider = Depends(get_provider),
+ ) -> ModelInfo:
+     """Get information about a specific model.
+
+     Args:
+         model_id: The model identifier (e.g., "claude: sonnet" or "sonnet").
+         provider: Claude provider (injected).
+
+     Returns:
+         ModelInfo for the requested model.
+
+     Raises:
+         HTTPException: If model not found.
+     """
+     # Parse model name
+     actual_model = model_id.split(": ", 1)[1] if ": " in model_id else model_id
+
+     if actual_model in provider.supported_models:
+         return ModelInfo(id=f"claude: {actual_model}", owned_by="claude")
+
+     raise HTTPException(status_code=404, detail=f"Model not found: {model_id}")
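A matching sketch for the models endpoints; the host and port are assumptions:

    import httpx

    resp = httpx.get("http://localhost:8000/v1/models")
    print([m["id"] for m in resp.json()["data"]])  # e.g. ["claude: opus", "claude: sonnet"]

    # A bare name also resolves, since get_model() strips the "claude: " prefix itself:
    print(httpx.get("http://localhost:8000/v1/models/sonnet").json())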