PyPI - planner-auto - Versions diffs - 0.5.0__tar.gz - Mend

planner-auto 0.5.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

planner_auto-0.5.0/PKG-INFO +363 -0
planner_auto-0.5.0/README.md +332 -0
planner_auto-0.5.0/planner_auto/__init__.py +19 -0
planner_auto-0.5.0/planner_auto/agents.py +247 -0
planner_auto-0.5.0/planner_auto/cli.py +1131 -0
planner_auto-0.5.0/planner_auto/db.py +772 -0
planner_auto-0.5.0/planner_auto/errors.py +96 -0
planner_auto-0.5.0/planner_auto/export.py +340 -0
planner_auto-0.5.0/planner_auto/git_utils.py +50 -0
planner_auto-0.5.0/planner_auto/inspect.py +262 -0
planner_auto-0.5.0/planner_auto/logging.py +107 -0
planner_auto-0.5.0/planner_auto/loop/__init__.py +18 -0
planner_auto-0.5.0/planner_auto/loop/convergence.py +127 -0
planner_auto-0.5.0/planner_auto/loop/engine.py +745 -0
planner_auto-0.5.0/planner_auto/loop/feedback.py +219 -0
planner_auto-0.5.0/planner_auto/loop/history.py +201 -0
planner_auto-0.5.0/planner_auto/prompts.py +57 -0
planner_auto-0.5.0/planner_auto/review_workflow.py +349 -0
planner_auto-0.5.0/planner_auto/reviewer/__init__.py +21 -0
planner_auto-0.5.0/planner_auto/reviewer/contract.py +174 -0
planner_auto-0.5.0/planner_auto/reviewer/direct_api.py +245 -0
planner_auto-0.5.0/planner_auto/reviewer/parser.py +384 -0
planner_auto-0.5.0/planner_auto/reviewer/prompts.py +171 -0
planner_auto-0.5.0/planner_auto/sdk_wrapper.py +434 -0
planner_auto-0.5.0/planner_auto/session.py +192 -0
planner_auto-0.5.0/planner_auto/state.py +49 -0
planner_auto-0.5.0/planner_auto/tui/__init__.py +18 -0
planner_auto-0.5.0/planner_auto/tui/adapter.py +129 -0
planner_auto-0.5.0/planner_auto/tui/bindings.py +16 -0
planner_auto-0.5.0/planner_auto/tui/messages.py +135 -0
planner_auto-0.5.0/planner_auto/tui/review_app.py +671 -0
planner_auto-0.5.0/planner_auto/tui/screens/__init__.py +1 -0
planner_auto-0.5.0/planner_auto/tui/screens/disposition_screen.py +137 -0
planner_auto-0.5.0/planner_auto/tui/screens/help_screen.py +83 -0
planner_auto-0.5.0/planner_auto/tui/screens/plan_screen.py +93 -0
planner_auto-0.5.0/planner_auto/tui/screens/raw_response_screen.py +96 -0
planner_auto-0.5.0/planner_auto/tui/styles/theme.tcss +235 -0
planner_auto-0.5.0/planner_auto/tui/widgets/__init__.py +1 -0
planner_auto-0.5.0/planner_auto/tui/widgets/convergence_panel.py +93 -0
planner_auto-0.5.0/planner_auto/tui/widgets/current_round.py +157 -0
planner_auto-0.5.0/planner_auto/tui/widgets/log_panel.py +106 -0
planner_auto-0.5.0/planner_auto/tui/widgets/plan_panel.py +75 -0
planner_auto-0.5.0/planner_auto/tui/widgets/round_detail.py +167 -0
planner_auto-0.5.0/planner_auto/tui/widgets/round_list.py +115 -0
planner_auto-0.5.0/planner_auto/tui/widgets/session_panel.py +73 -0
planner_auto-0.5.0/planner_auto/validation.py +92 -0
planner_auto-0.5.0/planner_auto.egg-info/PKG-INFO +363 -0
planner_auto-0.5.0/planner_auto.egg-info/SOURCES.txt +85 -0
planner_auto-0.5.0/planner_auto.egg-info/dependency_links.txt +1 -0
planner_auto-0.5.0/planner_auto.egg-info/entry_points.txt +2 -0
planner_auto-0.5.0/planner_auto.egg-info/requires.txt +14 -0
planner_auto-0.5.0/planner_auto.egg-info/top_level.txt +1 -0
planner_auto-0.5.0/pyproject.toml +56 -0
planner_auto-0.5.0/setup.cfg +4 -0
planner_auto-0.5.0/tests/test_agents.py +211 -0
planner_auto-0.5.0/tests/test_backend_wiring.py +291 -0
planner_auto-0.5.0/tests/test_check.py +275 -0
planner_auto-0.5.0/tests/test_cli.py +203 -0
planner_auto-0.5.0/tests/test_context.py +174 -0
planner_auto-0.5.0/tests/test_contract.py +281 -0
planner_auto-0.5.0/tests/test_convergence.py +145 -0
planner_auto-0.5.0/tests/test_db.py +260 -0
planner_auto-0.5.0/tests/test_db_v2.py +447 -0
planner_auto-0.5.0/tests/test_direct_api.py +391 -0
planner_auto-0.5.0/tests/test_direct_backend.py +381 -0
planner_auto-0.5.0/tests/test_engine.py +869 -0
planner_auto-0.5.0/tests/test_error_diagnostics.py +295 -0
planner_auto-0.5.0/tests/test_export.py +272 -0
planner_auto-0.5.0/tests/test_git_utils.py +158 -0
planner_auto-0.5.0/tests/test_init.py +60 -0
planner_auto-0.5.0/tests/test_inspect.py +297 -0
planner_auto-0.5.0/tests/test_logging.py +212 -0
planner_auto-0.5.0/tests/test_loop_output.py +274 -0
planner_auto-0.5.0/tests/test_parser.py +380 -0
planner_auto-0.5.0/tests/test_review_cli.py +387 -0
planner_auto-0.5.0/tests/test_review_export.py +270 -0
planner_auto-0.5.0/tests/test_review_workflow.py +176 -0
planner_auto-0.5.0/tests/test_sdk_wrapper.py +126 -0
planner_auto-0.5.0/tests/test_sdk_wrapper_v2.py +173 -0
planner_auto-0.5.0/tests/test_session.py +193 -0
planner_auto-0.5.0/tests/test_structured_logging.py +251 -0
planner_auto-0.5.0/tests/test_tui_adapter.py +137 -0
planner_auto-0.5.0/tests/test_tui_keybindings.py +231 -0
planner_auto-0.5.0/tests/test_tui_live.py +365 -0
planner_auto-0.5.0/tests/test_tui_messages.py +144 -0
planner_auto-0.5.0/tests/test_tui_screens.py +231 -0
planner_auto-0.5.0/tests/test_validation.py +206 -0

planner_auto-0.5.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,363 @@
+Metadata-Version: 2.4
+Name: planner-auto
+Version: 0.5.0
+Summary: Interactive planning session manager with SQLite persistence and artifact export
+Author-email: Danny Almaden <dan@ailab.ph>
+License: MIT
+Project-URL: Homepage, https://github.com/ailabph/claude-ai-workflows
+Project-URL: Repository, https://github.com/ailabph/claude-ai-workflows
+Project-URL: Changelog, https://github.com/ailabph/claude-ai-workflows/blob/main/planner-auto/CHANGELOG.md
+Keywords: planning,claude,ai,orchestration,milestone,gpt,review
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+Requires-Dist: click>=8.0
+Requires-Dist: claude-agent-sdk<0.2.0,>=0.1.50
+Requires-Dist: anthropic>=0.40.0
+Requires-Dist: prompt_toolkit>=3.0
+Requires-Dist: openai>=2.0
+Requires-Dist: python-dotenv>=1.0
+Provides-Extra: dev
+Requires-Dist: pytest>=7.0; extra == "dev"
+Requires-Dist: pytest-asyncio>=0.21; extra == "dev"
+Requires-Dist: textual[dev]>=0.80.0; extra == "dev"
+Provides-Extra: tui
+Requires-Dist: textual>=0.80.0; extra == "tui"
+# planner-auto
+Automated planning session manager that produces milestone plans through interactive conversation with Claude, reviewed by GPT for quality. Plans are persisted in SQLite and exported as markdown artifacts ready for [orchestrator-auto](../orchestrator-auto/) to implement.
+## How It Works
+```
+You describe a feature
+    → Claude asks clarifying questions
+        → Claude generates a milestone plan
+            → GPT reviews and critiques
+                → Claude revises based on feedback
+                    → Repeat until GPT says GO
+                        → Plan exported for orchestrator-auto
+```
+Each session follows a strict lifecycle: **SETUP → CONTEXT → DISCUSSION → PLANNING → REVIEW → COMPLETE**. All state lives in SQLite. File artifacts (plans, reviews, chat logs) are exported views, not the source of truth.
+## Installation
+```bash
+cd planner-auto/
+pip install -e .           # Core (runtime dependencies only)
+pip install -e ".[dev]"    # With pytest
+pip install -e ".[tui]"    # With TUI dashboard (textual)
+# Required: set ONE of the following two credentials
+export ANTHROPIC_API_KEY="your-key"     # For Claude (planner)
+# OR
+export CLAUDE_CODE_OAUTH_TOKEN="token"  # Claude Pro/Max subscription
+# Required for Plan 2 (reviewer)
+export OPENAI_API_KEY="your-key"        # For GPT-5.4 (reviewer)
+```
+## Quick Start
+```bash
+# Start a session
+planner-auto start --project my-api
+# Add context files
+planner-auto add-context <session-id> --file src/app.py
+planner-auto add-context <session-id> --file src/models.py
+planner-auto add-context <session-id> --note "Uses PostgreSQL, deployed on AWS"
+# Discuss the feature (interactive mode)
+planner-auto discuss <session-id> --interactive
+# Type your feature description, Claude asks questions
+# Type /done when ready to move to planning
+# Or one-shot discuss with auto-advance
+planner-auto discuss <session-id> "Add user registration with email validation" --done
+# Generate the plan
+planner-auto generate <session-id>
+planner-auto generate <session-id> --model claude-opus-4-6  # Override model
+# Export artifacts
+planner-auto export <session-id>
+planner-auto export <session-id> --output-dir ./my-plans/
+# Complete the session
+planner-auto complete <session-id>
+```
+## CLI Reference
+### Session Commands (Plan 1)
+| Command | Description |
+|---------|-------------|
+| `start --project <name>` | Create a new planning session |
+| `add-context <id> --file <path>` | Add a file to session context |
+| `add-context <id> --note "text"` | Add a text note to session context |
+| `discuss <id> "message"` | Send a single discussion message |
+| `discuss <id> --interactive` | Enter interactive discussion mode (type `/done` to advance) |
+| `discuss <id> "message" --done` | Send message and advance to PLANNING |
+| `generate <id>` | Generate milestone plan from context + conversation |
+| `generate <id> --model <model>` | Generate with a specific Claude model |
+| `list` | List all sessions |
+| `list --status active` | Filter sessions by status |
+| `status <id>` | Show session details (phase, counts, blockers) |
+| `resume <id>` | Resume a paused session (answer open blockers) |
+| `export <id>` | Export session artifacts to disk |
+| `export <id> --output-dir <path>` | Export to custom directory |
+| `complete <id>` | Complete session (checks blockers, auto-exports) |
+### Global Flags
+| Flag | Description |
+|------|-------------|
+| `--db-path <path>` | Override database path (default: `~/.planner-auto/planner.db`) |
+| `--verbose` | Print detailed output |
+| `--debug` | Print debug-level output + stack traces |
+### Review Commands (Plan 2)
+| Command | Description |
+|---------|-------------|
+| `review <id>` | Run automated GPT review loop on current plan |
+| `review <id> --fast` | Fast mode: 4 rounds, no history, basic prompt |
+| `review <id> --max-rounds <n>` | Override round cap |
+| `review <id> --no-review-history` | Disable review history context |
+| `review <id> --reviewer-model <model>` | Override GPT model (default: gpt-5.4) |
+| `review <id> --reviewer-reasoning <level>` | Reasoning effort (default: high) |
+| `review <id> --complexity standard\|complex` | Override complexity detection |
+| `review <id> --repo-root <path>` | Override repo root for .kafra handoff |
+| `review <id> --tui` | Launch live TUI dashboard (requires `pip install planner-auto[tui]`) |
+**Review loop features:**
+- GPT-5.4 reviews with `resolution_guidance` + `target_section` per issue
+- `keep/trim` sections: GPT tells Claude what to preserve and what to simplify
+- `validate feedback`: Claude assesses each issue as ACCEPT / DEFER / REJECT
+- Severity filtering: only `critical` + `major` issues reach Claude
+- Review history: GPT sees previous plan + cumulative DEFER decisions across all rounds
+- Complexity detection: auto-adjusts round cap (standard=8, complex=12)
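+- Convergence: the plan is accepted when GPT returns GO, or when the round cap is reached with zero critical issues
+- If the round cap is reached with critical issues still open, the session is paused for human review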
+- Final plan copied to `<repo>/.kafra/a-01-plans/`
+- Review metadata persisted: model, cost, tokens, raw response per round
+- **TUI mode** (`--tui`): Live dashboard with round progress, convergence sparkline, disposition drill-down. Requires `pip install planner-auto[tui]`.
+## Session Lifecycle
+```
+SETUP ──► CONTEXT ──► DISCUSSION ──► PLANNING ──► REVIEW ──► COMPLETE
+                                        │            │          ▲
+                                        │            └──────────┘
+                                        │            (revise & re-review)
+                                        └───────────────────────┘
+                                        (skip review — direct complete)
+Any phase can transition to PAUSED via blockers.
+PAUSED only allows: resume, status, export.
+```
+| Phase | What Happens | Allowed Commands |
+|-------|-------------|-----------------|
+| SETUP | Session created, config saved | start, add-context, status, export |
+| CONTEXT | Files and notes loaded | add-context, status, export |
+| DISCUSSION | User describes feature, Claude asks questions | discuss, status, export |
+| PLANNING | Context synthesized, plan generated | generate, review, complete, status, export |
+| REVIEW | GPT review loop running | review, complete, status, export |
+| COMPLETE | Session finished, artifacts exported | status, export |
+## Database Schema
+All state lives in SQLite at `~/.planner-auto/planner.db`. 7 tables:
+| Table | Purpose |
+|-------|---------|
+| `sessions` | Session metadata: project, phase, status, timestamps |
+| `messages` | Append-only conversation log (user + assistant turns) |
+| `context_entries` | Loaded files, notes, and synthesized context |
+| `plan_drafts` | Versioned plan content with draft number |
+| `reviews` | Reviewer responses with verdict and issues (Plan 2) |
+| `blockers` | Pause/resume lifecycle with source, question, answer |
+| `session_config` | Config snapshot per session (models, prompt hashes) |
+### Transaction Contract
+CRUD functions do NOT auto-commit. Callers manage transactions:
+```python
+from planner_auto.db import transaction, add_message
+# Single operation — explicit commit
+add_message(conn, session_id, "user", "hello")
+conn.commit()
+# Atomic multi-operation — transaction context manager
+with transaction(conn):
+    add_message(conn, session_id, "user", user_input)
+    add_message(conn, session_id, "assistant", response)
+# Both committed together, or both rolled back on error
+```
+## Artifact Export
+Artifacts are generated from the DB on demand. They are NOT read back by the tool.
+```
+~/.planner-auto/sessions/<session-id>/
+├── chat.csv                  # Full conversation (id, timestamp, role, content)
+├── context-summary.md        # Context entries grouped by type
+├── plan-draft-1.md           # First plan draft
+├── plan-draft-2.md           # Revised draft (after review, Plan 2)
+├── ...
+└── plan-draft-N.md           # Latest draft
+```
+With Plan 2 (reviewer), additional files:
+```
+├── a-01-plan.md              # Draft 1
+├── a-02-review.md            # Review 1
+├── a-03-plan.md              # Draft 2 (revised)
+├── a-04-review.md            # Review 2
+├── ...
+└── a-<N>-plan-final.md       # GPT-approved final plan
+```
+## Architecture (For Agents & Devs)
+```
+planner_auto/
+├── cli.py              # Click CLI — all user-facing commands
+├── db.py               # SQLite schema (v2), CRUD, transaction(), schema migration
+├── session.py          # SessionManager — phase transitions, pause/resume
+├── state.py            # Phase/Status enums, transition rules, command permissions
+├── agents.py           # discuss(), synthesize_context(), generate_plan()
+├── sdk_wrapper.py      # Claude SDK wrapper — retry, timeout, effort/thinking
+├── review_workflow.py  # Shared review orchestration (prepare/run/finalize)
+├── prompts.py          # System prompts with version hashing
+├── export.py           # Artifact export — plans, reviews, .kafra handoff
+├── validation.py       # Plan format validation (milestone headers, checkboxes)
+├── errors.py           # Custom exceptions (SDK, reviewer, session errors)
+├── git_utils.py        # Repo root discovery (git rev-parse + --repo-root)
+├── logging.py          # Session-scoped log file setup
+├── inspect.py          # DB inspection queries for debugging
+├── reviewer/
+│   ├── contract.py     # ReviewerContract ABC, ReviewerResponse, ReviewIssue
+│   ├── direct_api.py   # DirectAPIAdapter — GPT-5.4 via OpenAI SDK
+│   ├── parser.py       # Response parser (JSON/XML/free-form fallback)
+│   └── prompts.py      # Reviewer system prompts (basic, guidance, keep_trim)
+├── loop/
+│   ├── engine.py       # ReviewLoopEngine — review → revise → repeat
+│   ├── feedback.py     # Validate feedback (ACCEPT/DEFER/REJECT per issue)
+│   ├── history.py      # Review context builder (cumulative deferred)
+│   └── convergence.py  # Complexity detection, caps, fast mode
+└── tui/                # TUI Review Dashboard (optional: pip install planner-auto[tui])
+    ├── review_app.py   # ReviewTUI — main Textual app
+    ├── adapter.py      # Thread-safe engine → TUI bridge
+    ├── messages.py     # 8 Textual message types
+    ├── bindings.py     # Keybinding definitions
+    ├── widgets/        # SessionPanel, ConvergencePanel, RoundList, etc.
+    ├── screens/        # DispositionScreen, PlanScreen, RawResponseScreen, HelpScreen
+    └── styles/         # theme.tcss — dark theme, 3 responsive breakpoints
+```
+### Key Design Decisions
+| Decision | Rationale |
+|----------|-----------|
+| SQLite as canonical state | Files drift from tool state. DB is authoritative, files are exports. |
+| Callers manage commits | Enables atomic multi-operation transactions without CRUD-level coupling. |
+| Phase-gated commands | Prevents out-of-order operations (e.g., generate before discuss). |
+| PLANNING→COMPLETE or PLANNING→REVIEW→COMPLETE | Direct complete skips review; `review` command runs the GPT loop. |
+| `asyncio.wait_for` on SDK calls | Prevents hung SDK subprocess from blocking forever. |
+| Prompt version hashing | Config snapshot per session enables reproducibility and regression detection. |
+### For Agents
+When working with planner-auto code:
+- All DB access goes through `db.py` functions — never raw SQL in other modules
+- All phase transitions go through `SessionManager` — never direct DB updates
+- SDK calls go through `sdk_wrapper.py` — handles retry, timeout, error mapping
+- Tests use in-memory SQLite (`:memory:`) with explicit commits
+- Tests mock all SDK calls — no real API calls in test suite
+## Development
+```bash
+# Setup
+cd planner-auto/
+pip install -e ".[dev]"
+# Run tests
+pytest tests/ -v                           # All tests
+pytest tests/test_db.py -v                 # Single file
+pytest tests/test_session.py::TestCheckCommand -v  # Single class
+pytest -k "complete" -v                    # Filter by name
+# Current test count: 464 passing
+```
+## Config Versioning
+Every session captures its configuration at creation time in `session_config`:
+```json
+{
+  "project": "my-api",
+  "model_default": "claude-sonnet-4-6",
+  "prompt_hashes": {
+    "planner": "sha256:abc123...",
+    "synthesis": "sha256:def456..."
+  }
+}
+```
+Plan 2 extends this with reviewer settings:
+```json
+{
+  "project": "my-api",
+  "model_default": "claude-opus-4-6",
+  "repo_root": "/Users/me/my-api",
+  "reviewer_model": "gpt-5.4",
+  "reasoning_effort": "high",
+  "prompt_mode": "keep_trim",
+  "review_history": true,
+  "validate_feedback": true,
+  "filter_severity": ["critical", "major"],
+  "fast_mode": false,
+  "complexity": "standard",
+  "max_rounds": 8
+}
+```
+## Known Issues
+### Claude Agent SDK Subprocess (when using `--claude-backend sdk`)
+The SDK backend (`--claude-backend sdk`) spawns a `claude` CLI subprocess, which shares rate-limit quota with active Claude Code sessions. This is **not an issue with the default `direct` backend**.
+If you need to use the SDK backend (e.g., OAuth-only auth), be aware:
+- Rate limiting when other Claude Code sessions are active
+- anyio cancel scope tracebacks on error paths (cosmetic, not harmful)
+- Opus + thinking can consume turns on tool calls, returning empty results
+**Recommendation:** Use the default `direct` backend with `ANTHROPIC_API_KEY` whenever possible.
+## Roadmap
+- [x] **Plan 1: Session Core** — CLI, DB, lifecycle, context, plan generation, export
+- [x] **Plan 2: Reviewer Adapter** — GPT review loop, convergence, .kafra handoff
+- [x] **Direct API backend** — Bypass SDK subprocess, works alongside Claude Code sessions
+- [x] **Stress testing (Level 2)** — First end-to-end success: 3-round convergence, $0.12, GPT GO
+- [x] **TUI mode** — Review dashboard with live round progress, convergence sparkline, drill-down
+- [ ] **Telegram notifications** — Notify on plan approval or blocker
+- [ ] **Homebrew formula** — `brew install planner-auto`

planner_auto-0.5.0/README.md ADDED Viewed

@@ -0,0 +1,332 @@
+# planner-auto
+Automated planning session manager that produces milestone plans through interactive conversation with Claude, reviewed by GPT for quality. Plans are persisted in SQLite and exported as markdown artifacts ready for [orchestrator-auto](../orchestrator-auto/) to implement.
+## How It Works
+```
+You describe a feature
+    → Claude asks clarifying questions
+        → Claude generates a milestone plan
+            → GPT reviews and critiques
+                → Claude revises based on feedback
+                    → Repeat until GPT says GO
+                        → Plan exported for orchestrator-auto
+```
+Each session follows a strict lifecycle: **SETUP → CONTEXT → DISCUSSION → PLANNING → REVIEW → COMPLETE**. All state lives in SQLite. File artifacts (plans, reviews, chat logs) are exported views, not the source of truth.
+## Installation
+```bash
+cd planner-auto/
+pip install -e .           # Core (runtime dependencies only)
+pip install -e ".[dev]"    # With pytest
+pip install -e ".[tui]"    # With TUI dashboard (textual)
+# Required: set ONE of the following two credentials
+export ANTHROPIC_API_KEY="your-key"     # For Claude (planner)
+# OR
+export CLAUDE_CODE_OAUTH_TOKEN="token"  # Claude Pro/Max subscription
+# Required for Plan 2 (reviewer)
+export OPENAI_API_KEY="your-key"        # For GPT-5.4 (reviewer)
+```
+## Quick Start
+```bash
+# Start a session
+planner-auto start --project my-api
+# Add context files
+planner-auto add-context <session-id> --file src/app.py
+planner-auto add-context <session-id> --file src/models.py
+planner-auto add-context <session-id> --note "Uses PostgreSQL, deployed on AWS"
+# Discuss the feature (interactive mode)
+planner-auto discuss <session-id> --interactive
+# Type your feature description, Claude asks questions
+# Type /done when ready to move to planning
+# Or one-shot discuss with auto-advance
+planner-auto discuss <session-id> "Add user registration with email validation" --done
+# Generate the plan
+planner-auto generate <session-id>
+planner-auto generate <session-id> --model claude-opus-4-6  # Override model
+# Export artifacts
+planner-auto export <session-id>
+planner-auto export <session-id> --output-dir ./my-plans/
+# Complete the session
+planner-auto complete <session-id>
+```
+## CLI Reference
+### Session Commands (Plan 1)
+| Command | Description |
+|---------|-------------|
+| `start --project <name>` | Create a new planning session |
+| `add-context <id> --file <path>` | Add a file to session context |
+| `add-context <id> --note "text"` | Add a text note to session context |
+| `discuss <id> "message"` | Send a single discussion message |
+| `discuss <id> --interactive` | Enter interactive discussion mode (type `/done` to advance) |
+| `discuss <id> "message" --done` | Send message and advance to PLANNING |
+| `generate <id>` | Generate milestone plan from context + conversation |
+| `generate <id> --model <model>` | Generate with a specific Claude model |
+| `list` | List all sessions |
+| `list --status active` | Filter sessions by status |
+| `status <id>` | Show session details (phase, counts, blockers) |
+| `resume <id>` | Resume a paused session (answer open blockers) |
+| `export <id>` | Export session artifacts to disk |
+| `export <id> --output-dir <path>` | Export to custom directory |
+| `complete <id>` | Complete session (checks blockers, auto-exports) |
+### Global Flags
+| Flag | Description |
+|------|-------------|
+| `--db-path <path>` | Override database path (default: `~/.planner-auto/planner.db`) |
+| `--verbose` | Print detailed output |
+| `--debug` | Print debug-level output + stack traces |
+### Review Commands (Plan 2)
+| Command | Description |
+|---------|-------------|
+| `review <id>` | Run automated GPT review loop on current plan |
+| `review <id> --fast` | Fast mode: 4 rounds, no history, basic prompt |
+| `review <id> --max-rounds <n>` | Override round cap |
+| `review <id> --no-review-history` | Disable review history context |
+| `review <id> --reviewer-model <model>` | Override GPT model (default: gpt-5.4) |
+| `review <id> --reviewer-reasoning <level>` | Reasoning effort (default: high) |
+| `review <id> --complexity standard\|complex` | Override complexity detection |
+| `review <id> --repo-root <path>` | Override repo root for .kafra handoff |
+| `review <id> --tui` | Launch live TUI dashboard (requires `pip install planner-auto[tui]`) |
+**Review loop features:**
+- GPT-5.4 reviews with `resolution_guidance` + `target_section` per issue
+- `keep/trim` sections: GPT tells Claude what to preserve and what to simplify
+- `validate feedback`: Claude assesses each issue as ACCEPT / DEFER / REJECT
+- Severity filtering: only `critical` + `major` issues reach Claude
+- Review history: GPT sees previous plan + cumulative DEFER decisions across all rounds
+- Complexity detection: auto-adjusts round cap (standard=8, complex=12)
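+- Convergence: the plan is accepted when GPT returns GO, or when the round cap is reached with zero critical issues
+- If the round cap is reached with critical issues still open, the session is paused for human review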
+- Final plan copied to `<repo>/.kafra/a-01-plans/`
+- Review metadata persisted: model, cost, tokens, raw response per round
+- **TUI mode** (`--tui`): Live dashboard with round progress, convergence sparkline, disposition drill-down. Requires `pip install planner-auto[tui]`.
+## Session Lifecycle
+```
+SETUP ──► CONTEXT ──► DISCUSSION ──► PLANNING ──► REVIEW ──► COMPLETE
+                                        │            │          ▲
+                                        │            └──────────┘
+                                        │            (revise & re-review)
+                                        └───────────────────────┘
+                                        (skip review — direct complete)
+Any phase can transition to PAUSED via blockers.
+PAUSED only allows: resume, status, export.
+```
+| Phase | What Happens | Allowed Commands |
+|-------|-------------|-----------------|
+| SETUP | Session created, config saved | start, add-context, status, export |
+| CONTEXT | Files and notes loaded | add-context, status, export |
+| DISCUSSION | User describes feature, Claude asks questions | discuss, status, export |
+| PLANNING | Context synthesized, plan generated | generate, review, complete, status, export |
+| REVIEW | GPT review loop running | review, complete, status, export |
+| COMPLETE | Session finished, artifacts exported | status, export |
+## Database Schema
+All state lives in SQLite at `~/.planner-auto/planner.db`. 7 tables:
+| Table | Purpose |
+|-------|---------|
+| `sessions` | Session metadata: project, phase, status, timestamps |
+| `messages` | Append-only conversation log (user + assistant turns) |
+| `context_entries` | Loaded files, notes, and synthesized context |
+| `plan_drafts` | Versioned plan content with draft number |
+| `reviews` | Reviewer responses with verdict and issues (Plan 2) |
+| `blockers` | Pause/resume lifecycle with source, question, answer |
+| `session_config` | Config snapshot per session (models, prompt hashes) |
+### Transaction Contract
+CRUD functions do NOT auto-commit. Callers manage transactions:
+```python
+from planner_auto.db import transaction, add_message
+# Single operation — explicit commit
+add_message(conn, session_id, "user", "hello")
+conn.commit()
+# Atomic multi-operation — transaction context manager
+with transaction(conn):
+    add_message(conn, session_id, "user", user_input)
+    add_message(conn, session_id, "assistant", response)
+# Both committed together, or both rolled back on error
+```
+## Artifact Export
+Artifacts are generated from the DB on demand. They are NOT read back by the tool.
+```
+~/.planner-auto/sessions/<session-id>/
+├── chat.csv                  # Full conversation (id, timestamp, role, content)
+├── context-summary.md        # Context entries grouped by type
+├── plan-draft-1.md           # First plan draft
+├── plan-draft-2.md           # Revised draft (after review, Plan 2)
+├── ...
+└── plan-draft-N.md           # Latest draft
+```
+With Plan 2 (reviewer), additional files:
+```
+├── a-01-plan.md              # Draft 1
+├── a-02-review.md            # Review 1
+├── a-03-plan.md              # Draft 2 (revised)
+├── a-04-review.md            # Review 2
+├── ...
+└── a-<N>-plan-final.md       # GPT-approved final plan
+```
+## Architecture (For Agents & Devs)
+```
+planner_auto/
+├── cli.py              # Click CLI — all user-facing commands
+├── db.py               # SQLite schema (v2), CRUD, transaction(), schema migration
+├── session.py          # SessionManager — phase transitions, pause/resume
+├── state.py            # Phase/Status enums, transition rules, command permissions
+├── agents.py           # discuss(), synthesize_context(), generate_plan()
+├── sdk_wrapper.py      # Claude SDK wrapper — retry, timeout, effort/thinking
+├── review_workflow.py  # Shared review orchestration (prepare/run/finalize)
+├── prompts.py          # System prompts with version hashing
+├── export.py           # Artifact export — plans, reviews, .kafra handoff
+├── validation.py       # Plan format validation (milestone headers, checkboxes)
+├── errors.py           # Custom exceptions (SDK, reviewer, session errors)
+├── git_utils.py        # Repo root discovery (git rev-parse + --repo-root)
+├── logging.py          # Session-scoped log file setup
+├── inspect.py          # DB inspection queries for debugging
+├── reviewer/
+│   ├── contract.py     # ReviewerContract ABC, ReviewerResponse, ReviewIssue
+│   ├── direct_api.py   # DirectAPIAdapter — GPT-5.4 via OpenAI SDK
+│   ├── parser.py       # Response parser (JSON/XML/free-form fallback)
+│   └── prompts.py      # Reviewer system prompts (basic, guidance, keep_trim)
+├── loop/
+│   ├── engine.py       # ReviewLoopEngine — review → revise → repeat
+│   ├── feedback.py     # Validate feedback (ACCEPT/DEFER/REJECT per issue)
+│   ├── history.py      # Review context builder (cumulative deferred)
+│   └── convergence.py  # Complexity detection, caps, fast mode
+└── tui/                # TUI Review Dashboard (optional: pip install planner-auto[tui])
+    ├── review_app.py   # ReviewTUI — main Textual app
+    ├── adapter.py      # Thread-safe engine → TUI bridge
+    ├── messages.py     # 8 Textual message types
+    ├── bindings.py     # Keybinding definitions
+    ├── widgets/        # SessionPanel, ConvergencePanel, RoundList, etc.
+    ├── screens/        # DispositionScreen, PlanScreen, RawResponseScreen, HelpScreen
+    └── styles/         # theme.tcss — dark theme, 3 responsive breakpoints
+```
+### Key Design Decisions
+| Decision | Rationale |
+|----------|-----------|
+| SQLite as canonical state | Files drift from tool state. DB is authoritative, files are exports. |
+| Callers manage commits | Enables atomic multi-operation transactions without CRUD-level coupling. |
+| Phase-gated commands | Prevents out-of-order operations (e.g., generate before discuss). |
+| PLANNING→COMPLETE or PLANNING→REVIEW→COMPLETE | Direct complete skips review; `review` command runs the GPT loop. |
+| `asyncio.wait_for` on SDK calls | Prevents hung SDK subprocess from blocking forever. |
+| Prompt version hashing | Config snapshot per session enables reproducibility and regression detection. |
+### For Agents
+When working with planner-auto code:
+- All DB access goes through `db.py` functions — never raw SQL in other modules
+- All phase transitions go through `SessionManager` — never direct DB updates
+- SDK calls go through `sdk_wrapper.py` — handles retry, timeout, error mapping
+- Tests use in-memory SQLite (`:memory:`) with explicit commits
+- Tests mock all SDK calls — no real API calls in test suite
+## Development
+```bash
+# Setup
+cd planner-auto/
+pip install -e ".[dev]"
+# Run tests
+pytest tests/ -v                           # All tests
+pytest tests/test_db.py -v                 # Single file
+pytest tests/test_session.py::TestCheckCommand -v  # Single class
+pytest -k "complete" -v                    # Filter by name
+# Current test count: 464 passing
+```
+## Config Versioning
+Every session captures its configuration at creation time in `session_config`:
+```json
+{
+  "project": "my-api",
+  "model_default": "claude-sonnet-4-6",
+  "prompt_hashes": {
+    "planner": "sha256:abc123...",
+    "synthesis": "sha256:def456..."
+  }
+}
+```
+Plan 2 extends this with reviewer settings:
+```json
+{
+  "project": "my-api",
+  "model_default": "claude-opus-4-6",
+  "repo_root": "/Users/me/my-api",
+  "reviewer_model": "gpt-5.4",
+  "reasoning_effort": "high",
+  "prompt_mode": "keep_trim",
+  "review_history": true,
+  "validate_feedback": true,
+  "filter_severity": ["critical", "major"],
+  "fast_mode": false,
+  "complexity": "standard",
+  "max_rounds": 8
+}
+```
+## Known Issues
+### Claude Agent SDK Subprocess (when using `--claude-backend sdk`)
+The SDK backend (`--claude-backend sdk`) spawns a `claude` CLI subprocess, which shares rate-limit quota with active Claude Code sessions. This is **not an issue with the default `direct` backend**.
+If you need to use the SDK backend (e.g., OAuth-only auth), be aware:
+- Rate limiting when other Claude Code sessions are active
+- anyio cancel scope tracebacks on error paths (cosmetic, not harmful)
+- Opus + thinking can consume turns on tool calls, returning empty results
+**Recommendation:** Use the default `direct` backend with `ANTHROPIC_API_KEY` whenever possible.
+## Roadmap
+- [x] **Plan 1: Session Core** — CLI, DB, lifecycle, context, plan generation, export
+- [x] **Plan 2: Reviewer Adapter** — GPT review loop, convergence, .kafra handoff
+- [x] **Direct API backend** — Bypass SDK subprocess, works alongside Claude Code sessions
+- [x] **Stress testing (Level 2)** — First end-to-end success: 3-round convergence, $0.12, GPT GO
+- [x] **TUI mode** — Review dashboard with live round progress, convergence sparkline, drill-down
+- [ ] **Telegram notifications** — Notify on plan approval or blocker
+- [ ] **Homebrew formula** — `brew install planner-auto`