ccproxy-api 0.1.4__py3-none-any.whl → 0.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (72)
  1. ccproxy/_version.py +2 -2
  2. ccproxy/adapters/codex/__init__.py +11 -0
  3. ccproxy/adapters/openai/adapter.py +1 -1
  4. ccproxy/adapters/openai/models.py +1 -1
  5. ccproxy/adapters/openai/response_adapter.py +355 -0
  6. ccproxy/adapters/openai/response_models.py +178 -0
  7. ccproxy/adapters/openai/streaming.py +1 -0
  8. ccproxy/api/app.py +150 -224
  9. ccproxy/api/dependencies.py +22 -2
  10. ccproxy/api/middleware/errors.py +27 -3
  11. ccproxy/api/middleware/logging.py +4 -0
  12. ccproxy/api/responses.py +6 -1
  13. ccproxy/api/routes/claude.py +222 -17
  14. ccproxy/api/routes/codex.py +1231 -0
  15. ccproxy/api/routes/health.py +228 -3
  16. ccproxy/api/routes/proxy.py +25 -6
  17. ccproxy/api/services/permission_service.py +2 -2
  18. ccproxy/auth/openai/__init__.py +13 -0
  19. ccproxy/auth/openai/credentials.py +166 -0
  20. ccproxy/auth/openai/oauth_client.py +334 -0
  21. ccproxy/auth/openai/storage.py +184 -0
  22. ccproxy/claude_sdk/__init__.py +4 -8
  23. ccproxy/claude_sdk/client.py +661 -131
  24. ccproxy/claude_sdk/exceptions.py +16 -0
  25. ccproxy/claude_sdk/manager.py +219 -0
  26. ccproxy/claude_sdk/message_queue.py +342 -0
  27. ccproxy/claude_sdk/options.py +6 -1
  28. ccproxy/claude_sdk/session_client.py +546 -0
  29. ccproxy/claude_sdk/session_pool.py +550 -0
  30. ccproxy/claude_sdk/stream_handle.py +538 -0
  31. ccproxy/claude_sdk/stream_worker.py +392 -0
  32. ccproxy/claude_sdk/streaming.py +53 -11
  33. ccproxy/cli/commands/auth.py +398 -1
  34. ccproxy/cli/commands/serve.py +99 -1
  35. ccproxy/cli/options/claude_options.py +47 -0
  36. ccproxy/config/__init__.py +0 -3
  37. ccproxy/config/claude.py +171 -23
  38. ccproxy/config/codex.py +100 -0
  39. ccproxy/config/discovery.py +10 -1
  40. ccproxy/config/scheduler.py +2 -2
  41. ccproxy/config/settings.py +38 -1
  42. ccproxy/core/codex_transformers.py +389 -0
  43. ccproxy/core/http_transformers.py +458 -75
  44. ccproxy/core/logging.py +108 -12
  45. ccproxy/core/transformers.py +5 -0
  46. ccproxy/models/claude_sdk.py +57 -0
  47. ccproxy/models/detection.py +208 -0
  48. ccproxy/models/requests.py +22 -0
  49. ccproxy/models/responses.py +16 -0
  50. ccproxy/observability/access_logger.py +72 -14
  51. ccproxy/observability/metrics.py +151 -0
  52. ccproxy/observability/storage/duckdb_simple.py +12 -0
  53. ccproxy/observability/storage/models.py +16 -0
  54. ccproxy/observability/streaming_response.py +107 -0
  55. ccproxy/scheduler/manager.py +31 -6
  56. ccproxy/scheduler/tasks.py +122 -0
  57. ccproxy/services/claude_detection_service.py +269 -0
  58. ccproxy/services/claude_sdk_service.py +333 -130
  59. ccproxy/services/codex_detection_service.py +263 -0
  60. ccproxy/services/proxy_service.py +618 -197
  61. ccproxy/utils/__init__.py +9 -1
  62. ccproxy/utils/disconnection_monitor.py +83 -0
  63. ccproxy/utils/id_generator.py +12 -0
  64. ccproxy/utils/model_mapping.py +7 -5
  65. ccproxy/utils/startup_helpers.py +470 -0
  66. ccproxy_api-0.1.6.dist-info/METADATA +615 -0
  67. {ccproxy_api-0.1.4.dist-info → ccproxy_api-0.1.6.dist-info}/RECORD +70 -47
  68. ccproxy/config/loader.py +0 -105
  69. ccproxy_api-0.1.4.dist-info/METADATA +0 -369
  70. {ccproxy_api-0.1.4.dist-info → ccproxy_api-0.1.6.dist-info}/WHEEL +0 -0
  71. {ccproxy_api-0.1.4.dist-info → ccproxy_api-0.1.6.dist-info}/entry_points.txt +0 -0
  72. {ccproxy_api-0.1.4.dist-info → ccproxy_api-0.1.6.dist-info}/licenses/LICENSE +0 -0
ccproxy/core/http_transformers.py
@@ -3,6 +3,7 @@
  from typing import TYPE_CHECKING, Any

  import structlog
+ from typing_extensions import TypedDict

  from ccproxy.core.transformers import RequestTransformer, ResponseTransformer
  from ccproxy.core.types import ProxyRequest, ProxyResponse, TransformContext
@@ -20,13 +21,64 @@ claude_code_prompt = "You are Claude Code, Anthropic's official CLI for Claude."
  # claude_code_prompt = "<system-reminder>\nAs you answer the user's questions, you can use the following context:\n# important-instruction-reminders\nDo what has been asked; nothing more, nothing less.\nNEVER create files unless they're absolutely necessary for achieving your goal.\nALWAYS prefer editing an existing file to creating a new one.\nNEVER proactively create documentation files (*.md) or README files. Only create documentation files if explicitly requested by the User.\n\n \n IMPORTANT: this context may or may not be relevant to your tasks. You should not respond to this context unless it is highly relevant to your task.\n</system-reminder>\n"


- def get_claude_code_prompt() -> dict[str, Any]:
-     """Get the Claude Code system prompt with cache control."""
-     return {
-         "type": "text",
-         "text": claude_code_prompt,
-         "cache_control": {"type": "ephemeral"},
-     }
+ def get_detected_system_field(
+     app_state: Any = None, injection_mode: str = "minimal"
+ ) -> Any:
+     """Get the detected system field for injection.
+
+     Args:
+         app_state: App state containing detection data
+         injection_mode: 'minimal' or 'full' mode
+
+     Returns:
+         The system field to inject (preserving exact Claude CLI structure), or None if no detection data available
+     """
+     if not app_state or not hasattr(app_state, "claude_detection_data"):
+         return None
+
+     claude_data = app_state.claude_detection_data
+     detected_system = claude_data.system_prompt.system_field
+
+     if injection_mode == "full":
+         # Return the complete detected system field exactly as Claude CLI sent it
+         return detected_system
+     else:
+         # Minimal mode: extract just the first system message, preserving its structure
+         if isinstance(detected_system, str):
+             return detected_system
+         elif isinstance(detected_system, list) and detected_system:
+             # Return only the first message object with its complete structure (type, text, cache_control)
+             return [detected_system[0]]
+
+     return None
+
+
+ def get_fallback_system_field() -> list[dict[str, Any]]:
+     """Get fallback system field when no detection data is available."""
+     return [
+         {
+             "type": "text",
+             "text": claude_code_prompt,
+             "cache_control": {"type": "ephemeral"},
+         }
+     ]
+
+
+ class RequestData(TypedDict):
+     """Typed structure for transformed request data."""
+
+     method: str
+     url: str
+     headers: dict[str, str]
+     body: bytes | None
+
+
+ class ResponseData(TypedDict):
+     """Typed structure for transformed response data."""
+
+     status_code: int
+     headers: dict[str, str]
+     body: bytes


  class HTTPRequestTransformer(RequestTransformer):
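Note: the helpers above drive the new system-prompt injection. A rough sketch of the intended behavior, using a hand-rolled SimpleNamespace in place of the real app_state; only the claude_detection_data.system_prompt.system_field attribute chain that the helper reads is mimicked, and the detected blocks are fabricated for illustration.

    # Illustrative stand-in only; real detection data is populated on app state elsewhere in the package.
    from types import SimpleNamespace

    detected_field = [
        {
            "type": "text",
            "text": "You are Claude Code, Anthropic's official CLI for Claude.",
            "cache_control": {"type": "ephemeral"},
        },
        {"type": "text", "text": "<second detected block>"},
    ]
    app_state = SimpleNamespace(
        claude_detection_data=SimpleNamespace(
            system_prompt=SimpleNamespace(system_field=detected_field)
        )
    )

    # "minimal" keeps only the first detected block; "full" returns the field exactly as captured.
    assert get_detected_system_field(app_state, "minimal") == [detected_field[0]]
    assert get_detected_system_field(app_state, "full") == detected_field
    # With no detection data, callers fall back to get_fallback_system_field().
    assert get_detected_system_field(None) is None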
@@ -73,24 +125,39 @@ class HTTPRequestTransformer(RequestTransformer):
          elif context and isinstance(context, dict):
              access_token = context.get("access_token", "")

-         transformed_headers = self.create_proxy_headers(request.headers, access_token)
+         # Extract app_state from context if available
+         app_state = None
+         if context and hasattr(context, "app_state"):
+             app_state = context.app_state
+         elif context and isinstance(context, dict):
+             app_state = context.get("app_state")
+
+         transformed_headers = self.create_proxy_headers(
+             request.headers, access_token, self.proxy_mode, app_state
+         )

          # Transform body
          transformed_body = request.body
          if request.body:
              if isinstance(request.body, bytes):
                  transformed_body = self.transform_request_body(
-                     request.body, transformed_path
+                     request.body, transformed_path, self.proxy_mode, app_state
                  )
              elif isinstance(request.body, str):
                  transformed_body = self.transform_request_body(
-                     request.body.encode("utf-8"), transformed_path
+                     request.body.encode("utf-8"),
+                     transformed_path,
+                     self.proxy_mode,
+                     app_state,
                  )
              elif isinstance(request.body, dict):
                  import json

                  transformed_body = self.transform_request_body(
-                     json.dumps(request.body).encode("utf-8"), transformed_path
+                     json.dumps(request.body).encode("utf-8"),
+                     transformed_path,
+                     self.proxy_mode,
+                     app_state,
                  )

          # Create new transformed request
@@ -105,6 +172,88 @@ class HTTPRequestTransformer(RequestTransformer):
              metadata=request.metadata,
          )

+     async def transform_proxy_request(
+         self,
+         method: str,
+         path: str,
+         headers: dict[str, str],
+         body: bytes | None,
+         query_params: dict[str, str | list[str]] | None,
+         access_token: str,
+         target_base_url: str = "https://api.anthropic.com",
+         app_state: Any = None,
+         injection_mode: str = "minimal",
+     ) -> RequestData:
+         """Transform request using direct parameters from ProxyService.
+
+         This method provides the same functionality as ProxyService._transform_request()
+         but is properly located in the transformer layer.
+
+         Args:
+             method: HTTP method
+             path: Request path
+             headers: Request headers
+             body: Request body
+             query_params: Query parameters
+             access_token: OAuth access token
+             target_base_url: Base URL for the target API
+             app_state: Optional app state containing detection data
+             injection_mode: System prompt injection mode
+
+         Returns:
+             Dictionary with transformed request data (method, url, headers, body)
+         """
+         import urllib.parse
+
+         # Transform path
+         transformed_path = self.transform_path(path, self.proxy_mode)
+         target_url = f"{target_base_url.rstrip('/')}{transformed_path}"
+
+         # Add beta=true query parameter for /v1/messages requests if not already present
+         if transformed_path == "/v1/messages":
+             if query_params is None:
+                 query_params = {}
+             elif "beta" not in query_params:
+                 query_params = dict(query_params)  # Make a copy
+
+             if "beta" not in query_params:
+                 query_params["beta"] = "true"
+
+         # Transform body first (as it might change size)
+         proxy_body = None
+         if body:
+             proxy_body = self.transform_request_body(
+                 body, path, self.proxy_mode, app_state, injection_mode
+             )
+
+         # Transform headers (and update Content-Length if body changed)
+         proxy_headers = self.create_proxy_headers(
+             headers, access_token, self.proxy_mode, app_state
+         )
+
+         # Update Content-Length if body was transformed and size changed
+         if proxy_body and body and len(proxy_body) != len(body):
+             # Remove any existing content-length headers (case-insensitive)
+             proxy_headers = {
+                 k: v for k, v in proxy_headers.items() if k.lower() != "content-length"
+             }
+             proxy_headers["Content-Length"] = str(len(proxy_body))
+         elif proxy_body and not body:
+             # New body was created where none existed
+             proxy_headers["Content-Length"] = str(len(proxy_body))
+
+         # Add query parameters to URL if present
+         if query_params:
+             query_string = urllib.parse.urlencode(query_params)
+             target_url = f"{target_url}?{query_string}"
+
+         return RequestData(
+             method=method,
+             url=target_url,
+             headers=proxy_headers,
+             body=proxy_body,
+         )
+
      def transform_path(self, path: str, proxy_mode: str = "full") -> str:
          """Transform request path."""
          # Remove /api prefix if present (for new proxy endpoints)
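Note: a rough usage sketch of transform_proxy_request, assuming the transformer can be constructed with its defaults and that an OAuth access token has already been resolved; the token and payload below are placeholders.

    import asyncio
    import json

    transformer = HTTPRequestTransformer()
    request_data = asyncio.run(
        transformer.transform_proxy_request(
            method="POST",
            path="/api/v1/messages",
            headers={"content-type": "application/json"},
            body=json.dumps({"model": "claude-3-5-sonnet-20241022", "messages": []}).encode(),
            query_params=None,
            access_token="<oauth-access-token>",
        )
    )
    # Expected shape: a RequestData dict whose URL targets
    # https://api.anthropic.com/v1/messages?beta=true, whose headers carry the
    # Claude CLI identity, and whose body has the system prompt injected.
    print(request_data["url"])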
@@ -122,7 +271,11 @@ class HTTPRequestTransformer(RequestTransformer):
          return path

      def create_proxy_headers(
-         self, headers: dict[str, str], access_token: str, proxy_mode: str = "full"
+         self,
+         headers: dict[str, str],
+         access_token: str,
+         proxy_mode: str = "full",
+         app_state: Any = None,
      ) -> dict[str, str]:
          """Create proxy headers from original headers with Claude CLI identity."""
          proxy_headers = {}
@@ -170,27 +323,35 @@ class HTTPRequestTransformer(RequestTransformer):
          if "connection" not in [k.lower() for k in proxy_headers]:
              proxy_headers["Connection"] = "keep-alive"

-         # Critical Claude/Anthropic headers for tools and beta features
-         proxy_headers["anthropic-beta"] = (
-             "claude-code-20250219,oauth-2025-04-20,"
-             "interleaved-thinking-2025-05-14,fine-grained-tool-streaming-2025-05-14"
-         )
-         proxy_headers["anthropic-version"] = "2023-06-01"
-         proxy_headers["anthropic-dangerous-direct-browser-access"] = "true"
-
-         # Claude CLI identity headers
-         proxy_headers["x-app"] = "cli"
-         proxy_headers["User-Agent"] = "claude-cli/1.0.60 (external, cli)"
-
-         # Stainless SDK compatibility headers
-         proxy_headers["X-Stainless-Lang"] = "js"
-         proxy_headers["X-Stainless-Retry-Count"] = "0"
-         proxy_headers["X-Stainless-Timeout"] = "60"
-         proxy_headers["X-Stainless-Package-Version"] = "0.55.1"
-         proxy_headers["X-Stainless-OS"] = "Linux"
-         proxy_headers["X-Stainless-Arch"] = "x64"
-         proxy_headers["X-Stainless-Runtime"] = "node"
-         proxy_headers["X-Stainless-Runtime-Version"] = "v24.3.0"
+         # Use detected Claude CLI headers when available
+         if app_state and hasattr(app_state, "claude_detection_data"):
+             claude_data = app_state.claude_detection_data
+             detected_headers = claude_data.headers.to_headers_dict()
+             proxy_headers.update(detected_headers)
+             logger.debug("using_detected_headers", version=claude_data.claude_version)
+         else:
+             # Fallback to hardcoded Claude/Anthropic headers
+             proxy_headers["anthropic-beta"] = (
+                 "claude-code-20250219,oauth-2025-04-20,"
+                 "interleaved-thinking-2025-05-14,fine-grained-tool-streaming-2025-05-14"
+             )
+             proxy_headers["anthropic-version"] = "2023-06-01"
+             proxy_headers["anthropic-dangerous-direct-browser-access"] = "true"
+
+             # Claude CLI identity headers
+             proxy_headers["x-app"] = "cli"
+             proxy_headers["User-Agent"] = "claude-cli/1.0.60 (external, cli)"
+
+             # Stainless SDK compatibility headers
+             proxy_headers["X-Stainless-Lang"] = "js"
+             proxy_headers["X-Stainless-Retry-Count"] = "0"
+             proxy_headers["X-Stainless-Timeout"] = "60"
+             proxy_headers["X-Stainless-Package-Version"] = "0.55.1"
+             proxy_headers["X-Stainless-OS"] = "Linux"
+             proxy_headers["X-Stainless-Arch"] = "x64"
+             proxy_headers["X-Stainless-Runtime"] = "node"
+             proxy_headers["X-Stainless-Runtime-Version"] = "v24.3.0"
+             logger.debug("using_fallback_headers")

          # Standard HTTP headers for proper API interaction
          proxy_headers["accept-language"] = "*"
@@ -200,8 +361,146 @@ class HTTPRequestTransformer(RequestTransformer):

          return proxy_headers

+     def _count_cache_control_blocks(self, data: dict[str, Any]) -> dict[str, int]:
+         """Count cache_control blocks in different parts of the request.
+
+         Returns:
+             Dictionary with counts for 'injected_system', 'user_system', and 'messages'
+         """
+         counts = {"injected_system": 0, "user_system": 0, "messages": 0}
+
+         # Count in system field
+         system = data.get("system")
+         if system:
+             if isinstance(system, str):
+                 # String system prompts don't have cache_control
+                 pass
+             elif isinstance(system, list):
+                 # Count cache_control in system prompt blocks
+                 # The first block(s) are injected, rest are user's
+                 injected_count = 0
+                 for i, block in enumerate(system):
+                     if isinstance(block, dict) and "cache_control" in block:
+                         # Check if this is the injected prompt (contains Claude Code identity)
+                         text = block.get("text", "")
+                         if "Claude Code" in text or "Anthropic's official CLI" in text:
+                             counts["injected_system"] += 1
+                             injected_count = max(injected_count, i + 1)
+                         elif i < injected_count:
+                             # Part of injected system (multiple blocks)
+                             counts["injected_system"] += 1
+                         else:
+                             counts["user_system"] += 1
+
+         # Count in messages
+         messages = data.get("messages", [])
+         for msg in messages:
+             content = msg.get("content")
+             if isinstance(content, list):
+                 for block in content:
+                     if isinstance(block, dict) and "cache_control" in block:
+                         counts["messages"] += 1
+
+         return counts
+
+     def _limit_cache_control_blocks(
+         self, data: dict[str, Any], max_blocks: int = 4
+     ) -> dict[str, Any]:
+         """Limit the number of cache_control blocks to comply with Anthropic's limit.
+
+         Priority order:
+         1. Injected system prompt cache_control (highest priority - Claude Code identity)
+         2. User's system prompt cache_control
+         3. User's message cache_control (lowest priority)
+
+         Args:
+             data: Request data dictionary
+             max_blocks: Maximum number of cache_control blocks allowed (default: 4)
+
+         Returns:
+             Modified data dictionary with cache_control blocks limited
+         """
+         import copy
+
+         # Deep copy to avoid modifying original
+         data = copy.deepcopy(data)
+
+         # Count existing blocks
+         counts = self._count_cache_control_blocks(data)
+         total = counts["injected_system"] + counts["user_system"] + counts["messages"]
+
+         if total <= max_blocks:
+             # No need to remove anything
+             return data
+
+         logger.warning(
+             "cache_control_limit_exceeded",
+             total_blocks=total,
+             max_blocks=max_blocks,
+             injected=counts["injected_system"],
+             user_system=counts["user_system"],
+             messages=counts["messages"],
+         )
+
+         # Calculate how many to remove
+         to_remove = total - max_blocks
+         removed = 0
+
+         # Remove from messages first (lowest priority)
+         if to_remove > 0 and counts["messages"] > 0:
+             messages = data.get("messages", [])
+             for msg in reversed(messages):  # Remove from end first
+                 if removed >= to_remove:
+                     break
+                 content = msg.get("content")
+                 if isinstance(content, list):
+                     for block in reversed(content):
+                         if removed >= to_remove:
+                             break
+                         if isinstance(block, dict) and "cache_control" in block:
+                             del block["cache_control"]
+                             removed += 1
+                             logger.debug("removed_cache_control", location="message")
+
+         # Remove from user system prompts next
+         if removed < to_remove and counts["user_system"] > 0:
+             system = data.get("system")
+             if isinstance(system, list):
+                 # Find and remove cache_control from user system blocks (non-injected)
+                 for block in reversed(system):
+                     if removed >= to_remove:
+                         break
+                     if isinstance(block, dict) and "cache_control" in block:
+                         text = block.get("text", "")
+                         # Skip injected prompts (highest priority)
+                         if (
+                             "Claude Code" not in text
+                             and "Anthropic's official CLI" not in text
+                         ):
+                             del block["cache_control"]
+                             removed += 1
+                             logger.debug(
+                                 "removed_cache_control", location="user_system"
+                             )
+
+         # In theory, we should never need to remove injected system cache_control
+         # but include this for completeness
+         if removed < to_remove:
+             logger.error(
+                 "cannot_preserve_injected_cache_control",
+                 needed_to_remove=to_remove,
+                 actually_removed=removed,
+             )
+
+         return data
+
      def transform_request_body(
-         self, body: bytes, path: str, proxy_mode: str = "full"
+         self,
+         body: bytes,
+         path: str,
+         proxy_mode: str = "full",
+         app_state: Any = None,
+         injection_mode: str = "minimal",
      ) -> bytes:
          """Transform request body."""
          if not body:
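Note: a toy illustration of the cache_control limiting priority described in the docstring above; the payload is fabricated and a default constructor is assumed.

    # Five cache_control blocks total, one over the default limit of four.
    payload = {
        "system": [
            {
                "type": "text",
                "text": "You are Claude Code, Anthropic's official CLI for Claude.",
                "cache_control": {"type": "ephemeral"},  # injected block, highest priority
            },
            {"type": "text", "text": "project notes", "cache_control": {"type": "ephemeral"}},
        ],
        "messages": [
            {
                "role": "user",
                "content": [
                    {"type": "text", "text": "a", "cache_control": {"type": "ephemeral"}},
                    {"type": "text", "text": "b", "cache_control": {"type": "ephemeral"}},
                    {"type": "text", "text": "c", "cache_control": {"type": "ephemeral"}},
                ],
            },
        ],
    }

    transformer = HTTPRequestTransformer()
    limited = transformer._limit_cache_control_blocks(payload)  # max_blocks defaults to 4
    # One block is dropped, starting from the last message block; both system blocks survive.
    assert "cache_control" not in limited["messages"][0]["content"][-1]
    assert all("cache_control" in block for block in limited["system"])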
@@ -213,60 +512,77 @@ class HTTPRequestTransformer(RequestTransformer):
              body = self._transform_openai_to_anthropic(body)

          # Apply system prompt transformation for Claude Code identity
-         return self.transform_system_prompt(body)
+         return self.transform_system_prompt(body, app_state, injection_mode)

-     def transform_system_prompt(self, body: bytes) -> bytes:
-         """Transform system prompt to ensure Claude Code identification comes first.
+     def transform_system_prompt(
+         self, body: bytes, app_state: Any = None, injection_mode: str = "minimal"
+     ) -> bytes:
+         """Transform system prompt based on injection mode.

          Args:
              body: Original request body as bytes
+             app_state: Optional app state containing detection data
+             injection_mode: System prompt injection mode ('minimal' or 'full')

          Returns:
-             Transformed request body as bytes with Claude Code system prompt
+             Transformed request body as bytes with system prompt injection
          """
          try:
              import json

              data = json.loads(body.decode("utf-8"))
-         except (json.JSONDecodeError, UnicodeDecodeError):
+         except (json.JSONDecodeError, UnicodeDecodeError) as e:
              # Return original if not valid JSON
+             logger.warning(
+                 "http_transform_json_decode_failed",
+                 error=str(e),
+                 body_preview=body[:200].decode("utf-8", errors="replace")
+                 if body
+                 else None,
+                 body_length=len(body) if body else 0,
+             )
              return body

-         # Check if request has a system prompt
-         if "system" not in data or (
-             isinstance(data["system"], str) and data["system"] == claude_code_prompt
-         ):
-             # No system prompt, inject Claude Code identification
-             data["system"] = [get_claude_code_prompt()]
-             return json.dumps(data).encode("utf-8")
-
-         system = data["system"]
-
-         if isinstance(system, str):
-             # Handle string system prompt
-             if system == claude_code_prompt:
-                 # Already correct, convert to proper array format
-                 data["system"] = [get_claude_code_prompt()]
-                 return json.dumps(data).encode("utf-8")
-
-             # Prepend Claude Code prompt to existing string
-             data["system"] = [
-                 get_claude_code_prompt(),
-                 {"type": "text", "text": system},
-             ]
-
-         elif isinstance(system, list):
-             # Handle array system prompt
-             if len(system) > 0:
-                 # Check if first element has correct text
-                 first = system[0]
-                 if isinstance(first, dict) and first.get("text") == claude_code_prompt:
-                     # Already has Claude Code first, ensure it has cache_control
-                     data["system"][0] = get_claude_code_prompt()
-                     return json.dumps(data).encode("utf-8")
-
-                 # Prepend Claude Code prompt
-                 data["system"] = [get_claude_code_prompt()] + system
+         # Get the system field to inject
+         detected_system = get_detected_system_field(app_state, injection_mode)
+         if detected_system is None:
+             # No detection data, use fallback
+             detected_system = get_fallback_system_field()
+
+         # Always inject the system prompt (detected or fallback)
+         if "system" not in data:
+             # No existing system prompt, inject the detected/fallback one
+             data["system"] = detected_system
+         else:
+             # Request has existing system prompt, prepend the detected/fallback one
+             existing_system = data["system"]
+
+             if isinstance(detected_system, str):
+                 # Detected system is a string
+                 if isinstance(existing_system, str):
+                     # Both are strings, convert to list format
+                     data["system"] = [
+                         {"type": "text", "text": detected_system},
+                         {"type": "text", "text": existing_system},
+                     ]
+                 elif isinstance(existing_system, list):
+                     # Detected is string, existing is list
+                     data["system"] = [
+                         {"type": "text", "text": detected_system}
+                     ] + existing_system
+             elif isinstance(detected_system, list):
+                 # Detected system is a list
+                 if isinstance(existing_system, str):
+                     # Detected is list, existing is string
+                     data["system"] = detected_system + [
+                         {"type": "text", "text": existing_system}
+                     ]
+                 elif isinstance(existing_system, list):
+                     # Both are lists, concatenate
+                     data["system"] = detected_system + existing_system
+
+         # Limit cache_control blocks to comply with Anthropic's limit
+         data = self._limit_cache_control_blocks(data)

          return json.dumps(data).encode("utf-8")

@@ -290,7 +606,14 @@ class HTTPRequestTransformer(RequestTransformer):
              messages = data.get("messages", [])
              if messages and any(msg.get("role") == "system" for msg in messages):
                  return True
-         except (json.JSONDecodeError, UnicodeDecodeError):
+         except (json.JSONDecodeError, UnicodeDecodeError) as e:
+             logger.warning(
+                 "openai_request_detection_json_decode_failed",
+                 error=str(e),
+                 body_preview=body[:100].decode("utf-8", errors="replace")
+                 if body
+                 else None,
+             )
              pass

          return False
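Note: a minimal end-to-end sketch of the injection path above when no detection data is present, so the fallback Claude Code block is prepended to the caller's system prompt; the request body is fabricated and a default constructor is assumed.

    import json

    transformer = HTTPRequestTransformer()
    original = json.dumps(
        {"model": "claude-3-5-sonnet-20241022", "system": "Answer tersely.", "messages": []}
    ).encode()
    result = json.loads(transformer.transform_system_prompt(original))
    # The system field becomes a list: the fallback block (with cache_control) first,
    # then the user's string wrapped as a text block.
    assert result["system"][0]["text"].startswith("You are Claude Code")
    assert result["system"][1] == {"type": "text", "text": "Answer tersely."}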
@@ -387,6 +710,65 @@ class HTTPResponseTransformer(ResponseTransformer):
              metadata=response.metadata,
          )

+     async def transform_proxy_response(
+         self,
+         status_code: int,
+         headers: dict[str, str],
+         body: bytes,
+         original_path: str,
+         proxy_mode: str = "full",
+     ) -> ResponseData:
+         """Transform response using direct parameters from ProxyService.
+
+         This method provides the same functionality as ProxyService._transform_response()
+         but is properly located in the transformer layer.
+
+         Args:
+             status_code: HTTP status code
+             headers: Response headers
+             body: Response body
+             original_path: Original request path for context
+             proxy_mode: Proxy transformation mode
+
+         Returns:
+             Dictionary with transformed response data (status_code, headers, body)
+         """
+         # For error responses, handle OpenAI transformation if needed
+         if status_code >= 400:
+             transformed_error_body = body
+             if self._is_openai_request(original_path):
+                 try:
+                     import json
+
+                     from ccproxy.adapters.openai.adapter import OpenAIAdapter
+
+                     error_data = json.loads(body.decode("utf-8"))
+                     openai_adapter = OpenAIAdapter()
+                     openai_error = openai_adapter.adapt_error(error_data)
+                     transformed_error_body = json.dumps(openai_error).encode("utf-8")
+                 except (json.JSONDecodeError, UnicodeDecodeError):
+                     # Keep original error if parsing fails
+                     pass
+
+             return ResponseData(
+                 status_code=status_code,
+                 headers=headers,
+                 body=transformed_error_body,
+             )
+
+         # For successful responses, transform normally
+         transformed_body = self.transform_response_body(body, original_path, proxy_mode)
+
+         transformed_headers = self.transform_response_headers(
+             headers, original_path, len(transformed_body), proxy_mode
+         )
+
+         return ResponseData(
+             status_code=status_code,
+             headers=transformed_headers,
+             body=transformed_body,
+         )
+
      def transform_response_body(
          self, body: bytes, path: str, proxy_mode: str = "full"
      ) -> bytes:
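Note: for error responses, transform_proxy_response only reshapes bodies for OpenAI-style endpoints via OpenAIAdapter.adapt_error and passes everything else through. A minimal sketch of the pass-through case, with fabricated values, a default constructor assumed, and the assumption that /v1/messages is not classified as an OpenAI route by _is_openai_request.

    import asyncio

    response_transformer = HTTPResponseTransformer()
    result = asyncio.run(
        response_transformer.transform_proxy_response(
            status_code=500,
            headers={"content-type": "application/json"},
            body=b'{"error": {"type": "api_error", "message": "upstream failure"}}',
            original_path="/v1/messages",  # not an OpenAI route, so the error body passes through unchanged
        )
    )
    assert result["status_code"] == 500
    assert result["body"] == b'{"error": {"type": "api_error", "message": "upstream failure"}}'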
@@ -411,6 +793,7 @@ class HTTPResponseTransformer(ResponseTransformer):
                  "content-length",
                  "transfer-encoding",
                  "content-encoding",
+                 "date",  # Remove upstream date header to avoid conflicts
              ]:
                  transformed_headers[key] = value