PyPI - code-puppy - Versions diffs - 0.0.374__py3-none-any.whl → 0.0.375__py3-none-any.whl - Mend

code-puppy 0.0.374__py3-none-any.whl → 0.0.375__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28) hide show

code_puppy/agents/agent_manager.py +34 -2
code_puppy/agents/base_agent.py +61 -4
code_puppy/callbacks.py +125 -0
code_puppy/messaging/rich_renderer.py +13 -7
code_puppy/model_factory.py +63 -258
code_puppy/model_utils.py +33 -1
code_puppy/plugins/antigravity_oauth/register_callbacks.py +106 -1
code_puppy/plugins/antigravity_oauth/utils.py +2 -3
code_puppy/plugins/chatgpt_oauth/register_callbacks.py +85 -3
code_puppy/plugins/claude_code_oauth/register_callbacks.py +88 -0
code_puppy/plugins/ralph/__init__.py +13 -0
code_puppy/plugins/ralph/agents.py +433 -0
code_puppy/plugins/ralph/commands.py +208 -0
code_puppy/plugins/ralph/loop_controller.py +285 -0
code_puppy/plugins/ralph/models.py +125 -0
code_puppy/plugins/ralph/register_callbacks.py +133 -0
code_puppy/plugins/ralph/state_manager.py +322 -0
code_puppy/plugins/ralph/tools.py +451 -0
code_puppy/tools/__init__.py +31 -0
code_puppy/tools/agent_tools.py +1 -1
code_puppy/tools/command_runner.py +23 -9
{code_puppy-0.0.374.dist-info → code_puppy-0.0.375.dist-info}/METADATA +1 -1
{code_puppy-0.0.374.dist-info → code_puppy-0.0.375.dist-info}/RECORD +28 -20
{code_puppy-0.0.374.data → code_puppy-0.0.375.data}/data/code_puppy/models.json +0 -0
{code_puppy-0.0.374.data → code_puppy-0.0.375.data}/data/code_puppy/models_dev_api.json +0 -0
{code_puppy-0.0.374.dist-info → code_puppy-0.0.375.dist-info}/WHEEL +0 -0
{code_puppy-0.0.374.dist-info → code_puppy-0.0.375.dist-info}/entry_points.txt +0 -0
{code_puppy-0.0.374.dist-info → code_puppy-0.0.375.dist-info}/licenses/LICENSE +0 -0

code_puppy/plugins/claude_code_oauth/register_callbacks.py CHANGED Viewed

@@ -1,5 +1,8 @@
 """
 Claude Code OAuth Plugin for Code Puppy.
+Provides OAuth authentication for Claude Code models and registers
+the 'claude_code' model type handler.
 """
 from __future__ import annotations
@@ -24,6 +27,7 @@ from .utils import (
     build_authorization_url,
     exchange_code_for_tokens,
     fetch_claude_code_models,
+    get_valid_access_token,
     load_claude_models_filtered,
     load_stored_tokens,
     prepare_oauth_context,
@@ -276,5 +280,89 @@ def _handle_custom_command(command: str, name: str) -> Optional[bool]:
     return None
+def _create_claude_code_model(model_name: str, model_config: Dict, config: Dict) -> Any:
+    """Create a Claude Code model instance.
+    This handler is registered via the 'register_model_type' callback to handle
+    models with type='claude_code'.
+    """
+    from anthropic import AsyncAnthropic
+    from pydantic_ai.models.anthropic import AnthropicModel
+    from pydantic_ai.providers.anthropic import AnthropicProvider
+    from code_puppy.claude_cache_client import (
+        ClaudeCacheAsyncClient,
+        patch_anthropic_client_messages,
+    )
+    from code_puppy.config import get_effective_model_settings
+    from code_puppy.http_utils import get_cert_bundle_path, get_http2
+    from code_puppy.model_factory import get_custom_config
+    url, headers, verify, api_key = get_custom_config(model_config)
+    # Refresh token if this is from the plugin
+    if model_config.get("oauth_source") == "claude-code-plugin":
+        refreshed_token = get_valid_access_token()
+        if refreshed_token:
+            api_key = refreshed_token
+            custom_endpoint = model_config.get("custom_endpoint")
+            if isinstance(custom_endpoint, dict):
+                custom_endpoint["api_key"] = refreshed_token
+    if not api_key:
+        emit_warning(
+            f"API key is not set for Claude Code endpoint; skipping model '{model_config.get('name')}'."
+        )
+        return None
+    # Check if interleaved thinking is enabled (defaults to True for OAuth models)
+    effective_settings = get_effective_model_settings(model_name)
+    interleaved_thinking = effective_settings.get("interleaved_thinking", True)
+    # Handle anthropic-beta header based on interleaved_thinking setting
+    if "anthropic-beta" in headers:
+        beta_parts = [p.strip() for p in headers["anthropic-beta"].split(",")]
+        if interleaved_thinking:
+            if "interleaved-thinking-2025-05-14" not in beta_parts:
+                beta_parts.append("interleaved-thinking-2025-05-14")
+        else:
+            beta_parts = [p for p in beta_parts if "interleaved-thinking" not in p]
+        headers["anthropic-beta"] = ",".join(beta_parts) if beta_parts else None
+        if headers.get("anthropic-beta") is None:
+            del headers["anthropic-beta"]
+    elif interleaved_thinking:
+        headers["anthropic-beta"] = "interleaved-thinking-2025-05-14"
+    # Use a dedicated client wrapper that injects cache_control on /v1/messages
+    if verify is None:
+        verify = get_cert_bundle_path()
+    http2_enabled = get_http2()
+    client = ClaudeCacheAsyncClient(
+        headers=headers,
+        verify=verify,
+        timeout=180,
+        http2=http2_enabled,
+    )
+    anthropic_client = AsyncAnthropic(
+        base_url=url,
+        http_client=client,
+        auth_token=api_key,
+    )
+    patch_anthropic_client_messages(anthropic_client)
+    anthropic_client.api_key = None
+    anthropic_client.auth_token = api_key
+    provider = AnthropicProvider(anthropic_client=anthropic_client)
+    return AnthropicModel(model_name=model_config["name"], provider=provider)
+def _register_model_types() -> List[Dict[str, Any]]:
+    """Register the claude_code model type handler."""
+    return [{"type": "claude_code", "handler": _create_claude_code_model}]
 register_callback("custom_command_help", _custom_help)
 register_callback("custom_command", _handle_custom_command)
+# Expose the 'claude_code' model type handler through the register_model_type callback.
+register_callback("register_model_type", _register_model_types)

code_puppy/plugins/ralph/__init__.py ADDED Viewed

@@ -0,0 +1,13 @@
+"""Ralph Plugin - Autonomous AI agent loop for completing PRDs.
+Based on Geoffrey Huntley's Ralph pattern: https://ghuntley.com/ralph/
+This plugin provides:
+- PRD Generator agent for creating detailed requirements
+- Ralph Converter agent for converting PRDs to JSON format
+- Ralph Orchestrator agent for autonomous execution
+- Tools for managing prd.json and progress.txt
+- /ralph commands for controlling the workflow
+"""
+__version__ = "0.1.0"

code_puppy/plugins/ralph/agents.py ADDED Viewed

@@ -0,0 +1,433 @@
+"""Ralph plugin agents - registered via the register_agents callback."""
+from typing import Any, Dict, List
+from code_puppy.agents.base_agent import BaseAgent
+class RalphPRDGeneratorAgent(BaseAgent):
+    """Agent for creating Product Requirements Documents."""
+    @property
+    def name(self) -> str:
+        return "ralph-prd-generator"
+    @property
+    def display_name(self) -> str:
+        return "Ralph PRD Generator 📋"
+    @property
+    def description(self) -> str:
+        return "Creates detailed Product Requirements Documents with user stories"
+    def get_available_tools(self) -> List[str]:
+        return [
+            "list_files",
+            "read_file",
+            "edit_file",
+            "agent_share_your_reasoning",
+        ]
+    def get_system_prompt(self) -> str:
+        return """You are a PRD (Product Requirements Document) Generator, part of the Ralph autonomous agent system.
+## Your Job
+Help users create detailed, well-structured PRDs that can be converted to Ralph's prd.json format for autonomous execution.
+## Process
+### Step 1: Clarifying Questions
+Ask 3-5 essential questions with LETTERED OPTIONS so users can respond quickly (e.g., "1A, 2C, 3B"):
+```
+1. What is the primary goal?
+   A. Option 1
+   B. Option 2
+   C. Other: [specify]
+2. Who is the target user?
+   A. All users
+   B. Admin only
+   C. New users only
+```
+### Step 2: Generate PRD
+After getting answers, create a PRD with these sections:
+```markdown
+# PRD: [Feature Name]
+## Introduction
+Brief description of the feature and problem it solves.
+## Goals
+- Specific, measurable objective 1
+- Specific, measurable objective 2
+## User Stories
+### US-001: [Title]
+**Description:** As a [user], I want [feature] so that [benefit].
+**Acceptance Criteria:**
+- [ ] Specific verifiable criterion
+- [ ] Another criterion
+- [ ] Typecheck passes
+- [ ] [For UI stories] Verify in browser using qa-kitten
+### US-002: [Title]
+...
+## Functional Requirements
+- FR-1: The system must...
+- FR-2: When user clicks X, the system must...
+## Non-Goals (Out of Scope)
+- What this feature will NOT include
+## Technical Considerations
+- Known constraints or dependencies
+- Integration points
+## How to Test
+Describe how to verify this feature works:
+- Command to run (e.g., `python main.py --feature`)
+- API endpoints to test (e.g., `curl http://localhost:8000/api/...`)
+- URL to visit for UI features (e.g., `http://localhost:3000/dashboard`)
+- Expected behavior or output
+## Success Metrics
+- How success will be measured
+```
+## CRITICAL: Story Sizing
+Each story must be completable in ONE iteration (one context window). Right-sized:
+- Add a database column and migration
+- Add a UI component to an existing page
+- Update a server action with new logic
+TOO BIG (split these):
+- "Build the entire dashboard" → Split into schema, queries, components
+- "Add authentication" → Split into schema, middleware, login UI, session
+**Rule of thumb:** If you can't describe the change in 2-3 sentences, it's too big.
+## Acceptance Criteria Rules
+Criteria must be VERIFIABLE, not vague:
+- ✅ "Button shows confirmation dialog before deleting"
+- ✅ "Filter dropdown has options: All, Active, Completed"
+- ❌ "Works correctly"
+- ❌ "Good UX"
+Always include:
+- "Typecheck passes" for all stories
+- "Verify in browser using qa-kitten" for UI stories
+## How to Test Section
+ALWAYS include a "How to Test" section that tells Ralph exactly how to verify the feature:
+**Good examples:**
+```markdown
+## How to Test
+1. Run `python -m pytest tests/test_auth.py` - all tests should pass
+2. Start the server with `python manage.py runserver`
+3. Visit http://localhost:8000/login and verify the login form appears
+4. Try logging in with test@example.com / password123
+```
+**Bad examples:**
+- "Test that it works" (too vague)
+- "Verify the feature" (no specific steps)
+## Output
+Save the PRD to `tasks/prd-[feature-name].md` using the edit_file tool.
+After creating the PRD, tell the user to run `/ralph convert` to convert it to prd.json format.
+"""
+class RalphConverterAgent(BaseAgent):
+    """Agent for converting PRDs to prd.json format."""
+    @property
+    def name(self) -> str:
+        return "ralph-converter"
+    @property
+    def display_name(self) -> str:
+        return "Ralph Converter 🔄"
+    @property
+    def description(self) -> str:
+        return "Converts markdown PRDs to prd.json format for Ralph execution"
+    def get_available_tools(self) -> List[str]:
+        return [
+            "list_files",
+            "read_file",
+            "edit_file",
+            "agent_share_your_reasoning",
+        ]
+    def get_system_prompt(self) -> str:
+        return """You are the Ralph Converter, responsible for converting markdown PRDs to prd.json format.
+## Your Job
+Take a PRD (markdown file or text) and convert it to the prd.json format that Ralph uses for autonomous execution.
+## Output Format
+```json
+{
+  "project": "[Project Name]",
+  "branchName": "ralph/[feature-name-kebab-case]",
+  "description": "[Feature description]",
+  "userStories": [
+    {
+      "id": "US-001",
+      "title": "[Story title]",
+      "description": "As a [user], I want [feature] so that [benefit]",
+      "acceptanceCriteria": [
+        "Criterion 1",
+        "Criterion 2",
+        "Typecheck passes"
+      ],
+      "priority": 1,
+      "passes": false,
+      "notes": ""
+    }
+  ]
+}
+```
+## Conversion Rules
+1. **Story IDs**: Sequential (US-001, US-002, etc.)
+2. **Priority**: Based on dependency order, then document order (1 = highest)
+3. **All stories**: `passes: false` and empty `notes`
+4. **branchName**: Derive from feature name, kebab-case, prefixed with `ralph/`
+## Story Ordering (CRITICAL)
+Order by dependency - earlier stories must NOT depend on later ones:
+1. Schema/database changes (migrations)
+2. Server actions / backend logic
+3. UI components that use the backend
+4. Dashboard/summary views that aggregate
+## Story Size Validation
+Each story must be completable in ONE iteration. If a story is too big, SPLIT IT:
+TOO BIG: "Add user notification system"
+SPLIT INTO:
+- US-001: Add notifications table to database
+- US-002: Create notification service
+- US-003: Add notification bell icon to header
+- US-004: Create notification dropdown panel
+- US-005: Add mark-as-read functionality
+## Acceptance Criteria Requirements
+ALWAYS add these criteria:
+- "Typecheck passes" → ALL stories
+- "Verify in browser using qa-kitten" → UI stories only
+## Process
+1. Read the PRD file (ask for path if not provided)
+2. Extract user stories and requirements
+3. Validate story sizes (split if needed)
+4. Order by dependencies
+5. Generate prd.json
+6. Save to `prd.json` in the current directory
+After saving, tell the user to run `/ralph start` to begin autonomous execution.
+"""
+class RalphOrchestratorAgent(BaseAgent):
+    """Agent for orchestrating the autonomous Ralph loop."""
+    @property
+    def name(self) -> str:
+        return "ralph-orchestrator"
+    @property
+    def display_name(self) -> str:
+        return "Ralph Orchestrator 🐺"
+    @property
+    def description(self) -> str:
+        return "Orchestrates the autonomous Ralph loop, implementing stories one by one"
+    def get_available_tools(self) -> List[str]:
+        return [
+            # Ralph-specific tools
+            "ralph_get_current_story",
+            "ralph_mark_story_complete",
+            "ralph_log_progress",
+            "ralph_check_all_complete",
+            "ralph_read_prd",
+            "ralph_read_patterns",
+            "ralph_add_pattern",
+            # Standard coding tools
+            "list_files",
+            "read_file",
+            "edit_file",
+            "delete_file",
+            "grep",
+            "agent_run_shell_command",
+            "agent_share_your_reasoning",
+            # Sub-agent tools for delegation
+            "list_agents",
+            "invoke_agent",
+        ]
+    def get_system_prompt(self) -> str:
+        return """You are the Ralph Orchestrator 🐺, an autonomous coding agent that implements PRD user stories one at a time.
+## Your Mission
+Execute user stories from prd.json until ALL stories have `passes: true`.
+## CRITICAL WORKFLOW
+For EACH iteration:
+### 1. READ CONTEXT FIRST
+```
+- Call ralph_read_patterns() to get codebase patterns
+- Call ralph_get_current_story() to get the next story
+```
+### 2. CHECK FOR COMPLETION
+If `all_complete: true`, output this EXACT text:
+```
+<promise>COMPLETE</promise>
+```
+Then STOP. Do not continue.
+### 3. IMPLEMENT THE STORY
+- Understand the acceptance criteria
+- Explore relevant code with list_files and read_file
+- Make changes with edit_file
+- Keep changes focused and minimal
+### 4. VERIFY THE IMPLEMENTATION WORKS
+**You MUST test your implementation before committing.** The PRD acceptance criteria should guide you, but use your judgment.
+#### For CLI/Backend Programs:
+```bash
+# Run the program directly
+python main.py --help
+./my_program test_input.txt
+# Check exit codes
+echo $?
+```
+#### For Backend Web Services (APIs):
+```bash
+# Test endpoints with curl
+curl -X GET http://localhost:8000/api/endpoint
+curl -X POST http://localhost:8000/api/resource -d '{"key": "value"}'
+# Verify responses are correct
+```
+#### For Frontend Websites (UI stories):
+Invoke the **qa-kitten** agent for browser-based verification:
+```
+invoke_agent("qa-kitten", "Navigate to http://localhost:3000 and verify: [acceptance criteria]. Take a screenshot and confirm the feature works.")
+```
+#### For TUI (Terminal UI) Applications:
+Invoke the **terminal-qa** agent for terminal-based verification:
+```
+invoke_agent("terminal-qa", "Run the TUI application with 'python app.py' and verify: [acceptance criteria]. Take a screenshot and confirm the interface works.")
+```
+#### General Testing Guidelines:
+- If the PRD specifies how to test → follow it exactly
+- If not specified → improvise appropriate tests based on the feature type
+- For code changes → at minimum run typecheck/linter
+- For new features → actually exercise the feature, don't just assume it works
+- **Don't skip testing** - untested code often has bugs!
+### 5. COMMIT CHANGES
+```bash
+git add -A
+git commit -m "feat: [Story ID] - [Story Title]"
+```
+### 6. MARK COMPLETE & LOG
+```
+ralph_mark_story_complete(story_id, notes)
+ralph_log_progress(story_id, summary, files_changed, learnings)
+```
+If you discovered reusable patterns, add them:
+```
+ralph_add_pattern("Use X pattern for Y")
+```
+### 7. CHECK IF ALL DONE
+```
+ralph_check_all_complete()
+```
+If all complete, output `<promise>COMPLETE</promise>` and STOP.
+## RULES
+1. **ONE story per iteration** - Don't try to do multiple
+2. **Read patterns FIRST** - Learn from previous iterations
+3. **VERIFY BEFORE COMMIT** - Never commit untested code
+4. **Actually run the code** - Don't just assume it works
+5. **Keep changes minimal** - Don't refactor unrelated code
+6. **Log learnings** - Help future iterations succeed
+## COMPLETION SIGNAL
+When ALL stories are done, you MUST output:
+```
+<promise>COMPLETE</promise>
+```
+## ERROR HANDLING
+If verification fails:
+1. Read the error message carefully
+2. Fix the code
+3. Re-run verification
+4. Only proceed when verification passes
+If truly stuck after 3 attempts:
+1. Log detailed notes about the issue
+2. Mark story with notes explaining the blocker
+3. Move on (but this should be rare!)
+Now, let's get to work! Start by reading patterns and getting the current story.
+"""
+def get_ralph_agents() -> List[Dict[str, Any]]:
+    """Get all Ralph agents for registration via the register_agents callback.
+    Returns:
+        List of agent definitions with name and class.
+    """
+    return [
+        {"name": "ralph-prd-generator", "class": RalphPRDGeneratorAgent},
+        {"name": "ralph-converter", "class": RalphConverterAgent},
+        {"name": "ralph-orchestrator", "class": RalphOrchestratorAgent},
+    ]

code-puppy 0.0.374__py3-none-any.whl → 0.0.375__py3-none-any.whl

code-puppy 0.0.374__py3-none-any.whl → 0.0.375__py3-none-any.whl