ripperdoc-0.2.7-py3-none-any.whl → ripperdoc-0.2.9-py3-none-any.whl
This diff compares the contents of two publicly released versions of this package as they appear in their public registry. It is provided for informational purposes only.
- ripperdoc/__init__.py +1 -1
- ripperdoc/cli/cli.py +33 -115
- ripperdoc/cli/commands/__init__.py +70 -6
- ripperdoc/cli/commands/agents_cmd.py +6 -3
- ripperdoc/cli/commands/clear_cmd.py +1 -4
- ripperdoc/cli/commands/config_cmd.py +1 -1
- ripperdoc/cli/commands/context_cmd.py +3 -2
- ripperdoc/cli/commands/doctor_cmd.py +18 -4
- ripperdoc/cli/commands/help_cmd.py +11 -1
- ripperdoc/cli/commands/hooks_cmd.py +610 -0
- ripperdoc/cli/commands/models_cmd.py +26 -9
- ripperdoc/cli/commands/permissions_cmd.py +57 -37
- ripperdoc/cli/commands/resume_cmd.py +6 -4
- ripperdoc/cli/commands/status_cmd.py +4 -4
- ripperdoc/cli/commands/tasks_cmd.py +8 -4
- ripperdoc/cli/ui/file_mention_completer.py +64 -8
- ripperdoc/cli/ui/interrupt_handler.py +3 -4
- ripperdoc/cli/ui/message_display.py +5 -3
- ripperdoc/cli/ui/panels.py +13 -10
- ripperdoc/cli/ui/provider_options.py +247 -0
- ripperdoc/cli/ui/rich_ui.py +196 -77
- ripperdoc/cli/ui/spinner.py +25 -1
- ripperdoc/cli/ui/tool_renderers.py +8 -2
- ripperdoc/cli/ui/wizard.py +215 -0
- ripperdoc/core/agents.py +9 -3
- ripperdoc/core/config.py +49 -12
- ripperdoc/core/custom_commands.py +412 -0
- ripperdoc/core/default_tools.py +11 -2
- ripperdoc/core/hooks/__init__.py +99 -0
- ripperdoc/core/hooks/config.py +301 -0
- ripperdoc/core/hooks/events.py +535 -0
- ripperdoc/core/hooks/executor.py +496 -0
- ripperdoc/core/hooks/integration.py +344 -0
- ripperdoc/core/hooks/manager.py +745 -0
- ripperdoc/core/permissions.py +40 -8
- ripperdoc/core/providers/anthropic.py +548 -68
- ripperdoc/core/providers/gemini.py +70 -5
- ripperdoc/core/providers/openai.py +60 -5
- ripperdoc/core/query.py +140 -39
- ripperdoc/core/query_utils.py +2 -0
- ripperdoc/core/skills.py +9 -3
- ripperdoc/core/system_prompt.py +4 -2
- ripperdoc/core/tool.py +9 -5
- ripperdoc/sdk/client.py +2 -2
- ripperdoc/tools/ask_user_question_tool.py +5 -3
- ripperdoc/tools/background_shell.py +2 -1
- ripperdoc/tools/bash_output_tool.py +1 -1
- ripperdoc/tools/bash_tool.py +30 -20
- ripperdoc/tools/dynamic_mcp_tool.py +29 -8
- ripperdoc/tools/enter_plan_mode_tool.py +1 -1
- ripperdoc/tools/exit_plan_mode_tool.py +1 -1
- ripperdoc/tools/file_edit_tool.py +8 -4
- ripperdoc/tools/file_read_tool.py +9 -5
- ripperdoc/tools/file_write_tool.py +9 -5
- ripperdoc/tools/glob_tool.py +3 -2
- ripperdoc/tools/grep_tool.py +3 -2
- ripperdoc/tools/kill_bash_tool.py +1 -1
- ripperdoc/tools/ls_tool.py +1 -1
- ripperdoc/tools/mcp_tools.py +13 -10
- ripperdoc/tools/multi_edit_tool.py +8 -7
- ripperdoc/tools/notebook_edit_tool.py +7 -4
- ripperdoc/tools/skill_tool.py +1 -1
- ripperdoc/tools/task_tool.py +5 -4
- ripperdoc/tools/todo_tool.py +2 -2
- ripperdoc/tools/tool_search_tool.py +3 -2
- ripperdoc/utils/conversation_compaction.py +11 -7
- ripperdoc/utils/file_watch.py +8 -2
- ripperdoc/utils/json_utils.py +2 -1
- ripperdoc/utils/mcp.py +11 -3
- ripperdoc/utils/memory.py +4 -2
- ripperdoc/utils/message_compaction.py +21 -7
- ripperdoc/utils/message_formatting.py +11 -7
- ripperdoc/utils/messages.py +105 -66
- ripperdoc/utils/path_ignore.py +38 -12
- ripperdoc/utils/permissions/path_validation_utils.py +2 -1
- ripperdoc/utils/permissions/shell_command_validation.py +427 -91
- ripperdoc/utils/safe_get_cwd.py +2 -1
- ripperdoc/utils/session_history.py +13 -6
- ripperdoc/utils/todo.py +2 -1
- ripperdoc/utils/token_estimation.py +6 -1
- {ripperdoc-0.2.7.dist-info → ripperdoc-0.2.9.dist-info}/METADATA +24 -3
- ripperdoc-0.2.9.dist-info/RECORD +123 -0
- ripperdoc-0.2.7.dist-info/RECORD +0 -113
- {ripperdoc-0.2.7.dist-info → ripperdoc-0.2.9.dist-info}/WHEEL +0 -0
- {ripperdoc-0.2.7.dist-info → ripperdoc-0.2.9.dist-info}/entry_points.txt +0 -0
- {ripperdoc-0.2.7.dist-info → ripperdoc-0.2.9.dist-info}/licenses/LICENSE +0 -0
- {ripperdoc-0.2.7.dist-info → ripperdoc-0.2.9.dist-info}/top_level.txt +0 -0
ripperdoc/core/providers/anthropic.py

@@ -3,10 +3,13 @@
 from __future__ import annotations
 
 import asyncio
+import json
 import time
 from typing import Any, Awaitable, Callable, Dict, List, Optional
+from uuid import uuid4
 
 import anthropic
+import httpx
 from anthropic import AsyncAnthropic
 
 from ripperdoc.core.config import ModelProfile
@@ -15,13 +18,11 @@ from ripperdoc.core.providers.base import (
     ProviderClient,
     ProviderResponse,
     call_with_timeout_and_retries,
-    iter_with_timeout,
     sanitize_tool_history,
 )
 from ripperdoc.core.query_utils import (
     anthropic_usage_tokens,
     build_anthropic_tool_schemas,
-    content_blocks_from_anthropic_response,
     estimate_cost_usd,
 )
 from ripperdoc.core.tool import Tool
@@ -63,8 +64,99 @@ def _classify_anthropic_error(exc: Exception) -> tuple[str, str]:
     return "unknown_error", f"Unexpected error ({exc_type}): {exc_msg}"
 
 
+def _content_blocks_from_stream_state(
+    collected_text: List[str],
+    collected_thinking: List[str],
+    collected_tool_calls: Dict[int, Dict[str, Any]],
+) -> List[Dict[str, Any]]:
+    """Build content blocks from accumulated stream state."""
+    blocks: List[Dict[str, Any]] = []
+
+    # Add thinking block if present
+    if collected_thinking:
+        blocks.append(
+            {
+                "type": "thinking",
+                "thinking": "".join(collected_thinking),
+            }
+        )
+
+    # Add text block if present
+    if collected_text:
+        blocks.append(
+            {
+                "type": "text",
+                "text": "".join(collected_text),
+            }
+        )
+
+    # Add tool_use blocks
+    for idx in sorted(collected_tool_calls.keys()):
+        call = collected_tool_calls[idx]
+        name = call.get("name")
+        if not name:
+            continue
+        tool_use_id = call.get("id") or str(uuid4())
+        blocks.append(
+            {
+                "type": "tool_use",
+                "tool_use_id": tool_use_id,
+                "name": name,
+                "input": call.get("input", {}),
+            }
+        )
+
+    return blocks
+
+
+def _content_blocks_from_response(response: Any) -> List[Dict[str, Any]]:
+    """Normalize Anthropic response content to our internal block format."""
+    blocks: List[Dict[str, Any]] = []
+    for block in getattr(response, "content", []) or []:
+        btype = getattr(block, "type", None)
+        if btype == "text":
+            blocks.append({"type": "text", "text": getattr(block, "text", "")})
+        elif btype == "thinking":
+            blocks.append(
+                {
+                    "type": "thinking",
+                    "thinking": getattr(block, "thinking", None) or "",
+                    "signature": getattr(block, "signature", None),
+                }
+            )
+        elif btype == "redacted_thinking":
+            blocks.append(
+                {
+                    "type": "redacted_thinking",
+                    "data": getattr(block, "data", None),
+                    "signature": getattr(block, "signature", None),
+                }
+            )
+        elif btype == "tool_use":
+            raw_input = getattr(block, "input", {}) or {}
+            blocks.append(
+                {
+                    "type": "tool_use",
+                    "tool_use_id": getattr(block, "id", None) or str(uuid4()),
+                    "name": getattr(block, "name", None),
+                    "input": raw_input if isinstance(raw_input, dict) else {},
+                }
+            )
+    return blocks
+
+
 class AnthropicClient(ProviderClient):
-    """Anthropic client with streaming and non-streaming support."""
+    """Anthropic client with streaming and non-streaming support.
+
+    Streaming mode (default):
+    - Uses event-based streaming to capture both thinking and text tokens
+    - Timeout applies per-token (chunk), not to the entire request
+    - Thinking tokens are streamed in real-time via progress_callback
+
+    Non-streaming mode:
+    - Makes a single blocking request
+    - Timeout applies to the entire request
+    """
 
     def __init__(self, client_factory: Optional[Callable[[], Awaitable[AsyncAnthropic]]] = None):
         self._client_factory = client_factory
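
Note: the two helpers above define the internal content-block shape that both request paths now return. As a minimal illustration with invented sample state (the helper is private, so this is exploration only, not a supported API):

    # Hypothetical usage of the private helper added above (assumes ripperdoc 0.2.9 installed).
    from ripperdoc.core.providers.anthropic import _content_blocks_from_stream_state

    blocks = _content_blocks_from_stream_state(
        ["Hello ", "world"],                 # collected_text fragments
        ["I should greet the user."],        # collected_thinking fragments
        {0: {"id": "toolu_01", "name": "bash", "input": {"command": "ls"}}},
    )
    # Thinking first, then text, then tool_use blocks in stream order:
    # [{'type': 'thinking', 'thinking': 'I should greet the user.'},
    #  {'type': 'text', 'text': 'Hello world'},
    #  {'type': 'tool_use', 'tool_use_id': 'toolu_01', 'name': 'bash', 'input': {'command': 'ls'}}]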
@@ -109,6 +201,15 @@ class AnthropicClient(ProviderClient):
         except Exception as exc:
             duration_ms = (time.time() - start_time) * 1000
             error_code, error_message = _classify_anthropic_error(exc)
+            logger.debug(
+                "[anthropic_client] Exception details",
+                extra={
+                    "model": model_profile.model,
+                    "exception_type": type(exc).__name__,
+                    "exception_str": str(exc),
+                    "error_code": error_code,
+                },
+            )
             logger.error(
                 "[anthropic_client] API call failed",
                 extra={
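
Note: the debug entries added here rely on standard logging semantics: keys passed via extra= become attributes on the LogRecord and only appear in output if the active formatter (or a structured-logging handler) references them. A standalone sketch with the standard library, independent of ripperdoc's own logger configuration:

    import logging

    # The format string reads the custom "model" attribute supplied via extra=.
    logging.basicConfig(format="%(levelname)s %(message)s model=%(model)s", level=logging.DEBUG)
    log = logging.getLogger("anthropic_client")
    log.debug("[anthropic_client] Exception details", extra={"model": "example-model"})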
@@ -141,95 +242,115 @@ class AnthropicClient(ProviderClient):
     ) -> ProviderResponse:
         """Internal implementation of call, may raise exceptions."""
         tool_schemas = await build_anthropic_tool_schemas(tools)
-        collected_text: List[str] = []
-        reasoning_parts: List[str] = []
         response_metadata: Dict[str, Any] = {}
 
-
+        logger.debug(
+            "[anthropic_client] Preparing request",
+            extra={
+                "model": model_profile.model,
+                "tool_mode": tool_mode,
+                "stream": stream,
+                "max_thinking_tokens": max_thinking_tokens,
+                "num_tools": len(tool_schemas),
+            },
+        )
+
+        anthropic_kwargs: Dict[str, Any] = {}
+        if model_profile.api_base:
+            anthropic_kwargs["base_url"] = model_profile.api_base
         if model_profile.api_key:
             anthropic_kwargs["api_key"] = model_profile.api_key
         auth_token = getattr(model_profile, "auth_token", None)
         if auth_token:
             anthropic_kwargs["auth_token"] = auth_token
 
+        # Set timeout for the Anthropic SDK client
+        # For streaming, we want a long timeout since models may take time to start responding
+        # httpx.Timeout: (connect, read, write, pool)
+        if stream:
+            # For streaming: long read timeout, reasonable connect timeout
+            # The read timeout applies to waiting for each chunk from the server
+            timeout_config = httpx.Timeout(
+                connect=60.0,  # 60 seconds to establish connection
+                read=600.0,  # 10 minutes to wait for each chunk (model may be thinking)
+                write=60.0,  # 60 seconds to send request
+                pool=60.0,  # 60 seconds to get connection from pool
+            )
+            anthropic_kwargs["timeout"] = timeout_config
+        elif request_timeout and request_timeout > 0:
+            # For non-streaming: use the provided timeout
+            anthropic_kwargs["timeout"] = request_timeout
+
         normalized_messages = sanitize_tool_history(list(normalized_messages))
 
         thinking_payload: Optional[Dict[str, Any]] = None
         if max_thinking_tokens > 0:
             thinking_payload = {"type": "enabled", "budget_tokens": max_thinking_tokens}
 
-
+        # Build common request kwargs
+        request_kwargs: Dict[str, Any] = {
+            "model": model_profile.model,
+            "max_tokens": model_profile.max_tokens,
+            "system": system_prompt,
+            "messages": normalized_messages,
+            "temperature": model_profile.temperature,
+        }
+        if tool_schemas:
+            request_kwargs["tools"] = tool_schemas
+        if thinking_payload:
+            request_kwargs["thinking"] = thinking_payload
 
-
-
-
-
-
-
-
-
-
+        logger.debug(
+            "[anthropic_client] Request parameters",
+            extra={
+                "model": model_profile.model,
+                "request_kwargs": json.dumps(
+                    {k: v for k, v in request_kwargs.items() if k != "messages"},
+                    ensure_ascii=False,
+                    default=str,
+                )[:1000],
+                "thinking_payload": json.dumps(thinking_payload, ensure_ascii=False)
+                if thinking_payload
+                else None,
+            },
+        )
+
+        async with await self._client(anthropic_kwargs) as client:
+            if stream:
+                # Streaming mode: use event-based streaming with per-token timeout
+                content_blocks, usage_tokens = await self._stream_request(
+                    client=client,
+                    request_kwargs=request_kwargs,
+                    progress_callback=progress_callback,
+                    request_timeout=request_timeout,
+                    max_retries=max_retries,
+                    response_metadata=response_metadata,
                 )
-
-
-
-
+            else:
+                # Non-streaming mode: single request with overall timeout
+                content_blocks, usage_tokens = await self._non_stream_request(
+                    client=client,
+                    request_kwargs=request_kwargs,
+                    request_timeout=request_timeout,
+                    max_retries=max_retries,
+                    response_metadata=response_metadata,
                 )
-            try:
-                async for text in iter_with_timeout(stream_resp.text_stream, request_timeout):
-                    if text:
-                        collected_text.append(text)
-                        if progress_callback:
-                            try:
-                                await progress_callback(text)
-                            except (RuntimeError, ValueError, TypeError, OSError) as cb_exc:
-                                logger.warning(
-                                    "[anthropic_client] Stream callback failed: %s: %s",
-                                    type(cb_exc).__name__, cb_exc,
-                                )
-                getter = getattr(stream_resp, "get_final_response", None) or getattr(
-                    stream_resp, "get_final_message", None
-                )
-                if getter:
-                    return await getter()
-                return None
-            finally:
-                await stream_cm.__aexit__(None, None, None)
-
-        async def _non_stream_request() -> Any:
-            return await client.messages.create(
-                model=model_profile.model,
-                max_tokens=model_profile.max_tokens,
-                system=system_prompt,
-                messages=normalized_messages,  # type: ignore[arg-type]
-                tools=tool_schemas if tool_schemas else None,  # type: ignore
-                temperature=model_profile.temperature,
-                thinking=thinking_payload,  # type: ignore[arg-type]
-            )
-
-        timeout_for_call = None if stream else request_timeout
-        response = await call_with_timeout_and_retries(
-            _stream_request if stream else _non_stream_request,
-            timeout_for_call,
-            max_retries,
-        )
 
         duration_ms = (time.time() - start_time) * 1000
-        usage_tokens = anthropic_usage_tokens(getattr(response, "usage", None))
         cost_usd = estimate_cost_usd(model_profile, usage_tokens)
         record_usage(
             model_profile.model, duration_ms=duration_ms, cost_usd=cost_usd, **usage_tokens
         )
 
-
-
-
-
-
-
-
-
-
+        logger.debug(
+            "[anthropic_client] Response content blocks",
+            extra={
+                "model": model_profile.model,
+                "content_blocks": json.dumps(content_blocks, ensure_ascii=False)[:1000],
+                "usage_tokens": json.dumps(usage_tokens, ensure_ascii=False),
+                "metadata": json.dumps(response_metadata, ensure_ascii=False)[:500],
+            },
+        )
 
         logger.info(
             "[anthropic_client] Response received",
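
Note: the httpx.Timeout added in this hunk is what makes streaming tolerant of long thinking pauses, since httpx applies the read limit per chunk rather than to the whole response. A standalone sketch of both configurations (values copied from the hunk; httpx requires either a single default or all four phase limits):

    import httpx

    streaming_timeout = httpx.Timeout(
        connect=60.0,  # establish the connection
        read=600.0,    # maximum wait between chunks while the model is thinking
        write=60.0,    # send the request body
        pool=60.0,     # acquire a connection from the pool
    )
    non_streaming_timeout = httpx.Timeout(120.0)  # one default applied to every phase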
@@ -238,6 +359,8 @@ class AnthropicClient(ProviderClient):
                 "duration_ms": round(duration_ms, 2),
                 "tool_mode": tool_mode,
                 "tool_schemas": len(tool_schemas),
+                "stream": stream,
+                "content_blocks": len(content_blocks),
             },
         )
 
@@ -248,3 +371,360 @@ class AnthropicClient(ProviderClient):
             duration_ms=duration_ms,
             metadata=response_metadata,
         )
+
+    async def _stream_request(
+        self,
+        *,
+        client: AsyncAnthropic,
+        request_kwargs: Dict[str, Any],
+        progress_callback: Optional[ProgressCallback],
+        request_timeout: Optional[float],
+        max_retries: int,
+        response_metadata: Dict[str, Any],
+    ) -> tuple[List[Dict[str, Any]], Dict[str, int]]:
+        """Execute a streaming request with per-token timeout.
+
+        Uses Anthropic's event-based streaming API to capture:
+        - thinking tokens (streamed in real-time)
+        - text tokens (streamed in real-time)
+        - tool_use blocks
+
+        In streaming mode:
+        - Connection timeout uses request_timeout
+        - Per-event timeout is disabled (None) because the model may take
+          a long time to generate the first token (especially during thinking)
+        - Once streaming starts, events should flow continuously
+        """
+        collected_text: List[str] = []
+        collected_thinking: List[str] = []
+        collected_tool_calls: Dict[int, Dict[str, Any]] = {}
+        usage_tokens: Dict[str, int] = {}
+
+        # Use mutable containers to track state across event handling
+        current_block_index_ref: List[int] = [-1]
+        current_block_type_ref: List[Optional[str]] = [None]
+
+        event_count = 0
+        message_stop_received = False
+
+        async def _do_stream() -> None:
+            nonlocal event_count, message_stop_received
+            event_count = 0
+            message_stop_received = False
+
+            logger.debug(
+                "[anthropic_client] Initiating stream request",
+                extra={
+                    "model": request_kwargs.get("model"),
+                },
+            )
+
+            # Create the stream - this initiates the connection
+            stream = client.messages.stream(**request_kwargs)
+
+            # Enter the stream context
+            stream_manager = await stream.__aenter__()
+
+            try:
+                # Iterate over events
+                # Some API proxies don't properly close the stream after message_stop,
+                # so we break out of the loop when we receive message_stop
+                async for event in stream_manager:
+                    event_count += 1
+                    event_type = getattr(event, "type", "unknown")
+
+                    await self._handle_stream_event(
+                        event=event,
+                        collected_text=collected_text,
+                        collected_thinking=collected_thinking,
+                        collected_tool_calls=collected_tool_calls,
+                        usage_tokens=usage_tokens,
+                        progress_callback=progress_callback,
+                        current_block_index_ref=current_block_index_ref,
+                        current_block_type_ref=current_block_type_ref,
+                    )
+
+                    # Check if we received message_stop - break out of loop
+                    # Some API proxies don't properly close the SSE stream
+                    if event_type == "message_stop":
+                        message_stop_received = True
+                        break
+
+            except Exception:
+                raise
+            finally:
+                try:
+                    # Use timeout for __aexit__ in case the stream doesn't close properly
+                    await asyncio.wait_for(stream.__aexit__(None, None, None), timeout=5.0)
+                except asyncio.TimeoutError:
+                    pass  # Stream didn't close properly, continue anyway
+                except Exception:
+                    pass  # Ignore __aexit__ errors
+
+        # For streaming, we don't use call_with_timeout_and_retries on the whole operation
+        # Instead, timeout is applied per-event inside _iter_events_with_timeout
+        # But we still want retries for connection failures
+        attempts = max(0, int(max_retries)) + 1
+        last_error: Optional[Exception] = None
+
+        for attempt in range(1, attempts + 1):
+            try:
+                # Reset state for retry
+                collected_text.clear()
+                collected_thinking.clear()
+                collected_tool_calls.clear()
+                usage_tokens.clear()
+                current_block_index_ref[0] = -1
+                current_block_type_ref[0] = None
+
+                await _do_stream()
+                break  # Success
+            except asyncio.TimeoutError as exc:
+                last_error = exc
+                if attempt == attempts:
+                    break
+                delay = 0.5 * (2 ** (attempt - 1))  # Exponential backoff
+                logger.warning(
+                    "[anthropic_client] Stream timed out; retrying",
+                    extra={
+                        "attempt": attempt,
+                        "max_retries": max_retries,
+                        "delay_seconds": delay,
+                    },
+                )
+                await asyncio.sleep(delay)
+            except asyncio.CancelledError:
+                raise
+            except (RuntimeError, ValueError, TypeError, OSError, ConnectionError) as exc:
+                # Non-timeout errors: retry for connection errors only
+                if isinstance(exc, (OSError, ConnectionError)):
+                    last_error = exc
+                    if attempt == attempts:
+                        raise
+                    delay = 0.5 * (2 ** (attempt - 1))
+                    logger.warning(
+                        "[anthropic_client] Connection error; retrying",
+                        extra={
+                            "attempt": attempt,
+                            "error": str(exc),
+                        },
+                    )
+                    await asyncio.sleep(delay)
+                else:
+                    raise
+
+        if (
+            last_error
+            and not collected_text
+            and not collected_thinking
+            and not collected_tool_calls
+        ):
+            raise RuntimeError(f"Stream failed after {attempts} attempts") from last_error
+
+        # Store reasoning content in metadata
+        if collected_thinking:
+            response_metadata["reasoning_content"] = "".join(collected_thinking)
+
+        content_blocks = _content_blocks_from_stream_state(
+            collected_text, collected_thinking, collected_tool_calls
+        )
+
+        return content_blocks, usage_tokens
+
+    async def _handle_stream_event(
+        self,
+        *,
+        event: Any,
+        collected_text: List[str],
+        collected_thinking: List[str],
+        collected_tool_calls: Dict[int, Dict[str, Any]],
+        usage_tokens: Dict[str, int],
+        progress_callback: Optional[ProgressCallback],
+        current_block_index_ref: List[int],
+        current_block_type_ref: List[Optional[str]],
+    ) -> None:
+        """Handle a single stream event.
+
+        Supports both standard Anthropic API events and non-standard formats
+        from API proxies like aiping.cn.
+
+        Standard Anthropic events:
+        - message_start, content_block_start, content_block_delta, content_block_stop
+        - message_delta, message_stop
+
+        Non-standard events (aiping.cn style):
+        - thinking (direct thinking content)
+        - text (direct text content)
+        - signature (thinking signature)
+        """
+        event_type = getattr(event, "type", None)
+
+        if event_type == "message_start":
+            # Extract initial usage info if available
+            message = getattr(event, "message", None)
+            if message:
+                usage = getattr(message, "usage", None)
+                if usage:
+                    usage_tokens.update(anthropic_usage_tokens(usage))
+
+        elif event_type == "content_block_start":
+            # New content block starting
+            index = getattr(event, "index", 0)
+            content_block = getattr(event, "content_block", None)
+            if content_block:
+                block_type = getattr(content_block, "type", None)
+                current_block_index_ref[0] = index
+                current_block_type_ref[0] = block_type
+
+                if block_type == "tool_use":
+                    # Initialize tool call state
+                    collected_tool_calls[index] = {
+                        "id": getattr(content_block, "id", None),
+                        "name": getattr(content_block, "name", None),
+                        "input_json": "",
+                        "input": {},
+                    }
+                    # Announce tool start
+                    if progress_callback:
+                        tool_name = getattr(content_block, "name", "unknown")
+                        try:
+                            await progress_callback(f"[tool:{tool_name}]")
+                        except (RuntimeError, ValueError, TypeError, OSError):
+                            pass
+
+        elif event_type == "content_block_delta":
+            # Content delta within a block
+            index = getattr(event, "index", current_block_index_ref[0])
+            delta = getattr(event, "delta", None)
+            if not delta:
+                return
+
+            delta_type = getattr(delta, "type", None)
+
+            if delta_type == "thinking_delta":
+                # Thinking content delta
+                thinking_text = getattr(delta, "thinking", "")
+                if thinking_text:
+                    collected_thinking.append(thinking_text)
+                    if progress_callback:
+                        try:
+                            await progress_callback(thinking_text)
+                        except (RuntimeError, ValueError, TypeError, OSError) as cb_exc:
+                            logger.warning(
+                                "[anthropic_client] Progress callback failed: %s: %s",
+                                type(cb_exc).__name__,
+                                cb_exc,
+                            )
+
+            elif delta_type == "text_delta":
+                # Text content delta
+                text = getattr(delta, "text", "")
+                if text:
+                    collected_text.append(text)
+                    if progress_callback:
+                        try:
+                            await progress_callback(text)
+                        except (RuntimeError, ValueError, TypeError, OSError) as cb_exc:
+                            logger.warning(
+                                "[anthropic_client] Progress callback failed: %s: %s",
+                                type(cb_exc).__name__,
+                                cb_exc,
+                            )
+
+            elif delta_type == "input_json_delta":
+                # Tool input JSON delta
+                partial_json = getattr(delta, "partial_json", "")
+                if partial_json and index in collected_tool_calls:
+                    collected_tool_calls[index]["input_json"] += partial_json
+                    if progress_callback:
+                        try:
+                            await progress_callback(partial_json)
+                        except (RuntimeError, ValueError, TypeError, OSError):
+                            pass
+
+        # ===== Non-standard events from aiping.cn and similar proxies =====
+        # NOTE: aiping.cn sends BOTH standard (content_block_delta) and non-standard
+        # (text, thinking) events. We only process the non-standard events if we
+        # haven't already collected content from standard events in this block.
+        # This is controlled by checking if the standard delta was processed.
+
+        elif event_type == "thinking":
+            # Direct thinking content (non-standard, aiping.cn style)
+            # Skip - already handled via content_block_delta (aiping.cn sends both)
+            pass
+
+        elif event_type == "text":
+            # Direct text content (non-standard, aiping.cn style)
+            # Skip - already handled via content_block_delta (aiping.cn sends both)
+            pass
+
+        elif event_type == "signature":
+            # Thinking signature (non-standard, aiping.cn style)
+            pass
+
+        # ===== Standard events continued =====
+
+        elif event_type == "content_block_stop":
+            # Content block finished
+            index = getattr(event, "index", current_block_index_ref[0])
+
+            # Parse accumulated JSON for tool calls
+            if index in collected_tool_calls:
+                import json
+
+                json_str = collected_tool_calls[index].get("input_json", "")
+                if json_str:
+                    try:
+                        collected_tool_calls[index]["input"] = json.loads(json_str)
+                    except json.JSONDecodeError:
+                        logger.warning(
+                            "[anthropic_client] Failed to parse tool input JSON",
+                            extra={"json": json_str[:200]},
+                        )
+                        collected_tool_calls[index]["input"] = {}
+
+        elif event_type == "message_delta":
+            # Message-level delta (usually contains usage info at the end)
+            usage = getattr(event, "usage", None)
+            if usage:
+                # Update with final usage - output_tokens comes here
+                usage_tokens["output_tokens"] = getattr(usage, "output_tokens", 0)
+
+        elif event_type == "message_stop":
+            # Message complete
+            pass
+
+        # Unknown event types are silently ignored
+
+    async def _non_stream_request(
+        self,
+        *,
+        client: AsyncAnthropic,
+        request_kwargs: Dict[str, Any],
+        request_timeout: Optional[float],
+        max_retries: int,
+        response_metadata: Dict[str, Any],
+    ) -> tuple[List[Dict[str, Any]], Dict[str, int]]:
+        """Execute a non-streaming request with overall timeout."""
+
+        async def _do_request() -> Any:
+            return await client.messages.create(**request_kwargs)
+
+        response = await call_with_timeout_and_retries(
+            _do_request,
+            request_timeout,
+            max_retries,
+        )
+
+        usage_tokens = anthropic_usage_tokens(getattr(response, "usage", None))
+        content_blocks = _content_blocks_from_response(response)
+
+        # Extract reasoning content for metadata
+        for block in content_blocks:
+            if block.get("type") == "thinking":
+                thinking_text = block.get("thinking") or ""
+                if thinking_text:
+                    response_metadata["reasoning_content"] = thinking_text
+                    break
+
+        return content_blocks, usage_tokens