npm - liteagents - Versions diffs - 2.4.0 - Mend

liteagents 2.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (215) hide show

package/CHANGELOG.md +441 -0
package/LICENSE +21 -0
package/README.md +179 -0
package/cli.js +230 -0
package/docs/.gitkeep +1 -0
package/docs/CONTRIBUTING.md +739 -0
package/docs/DUAL_PUBLISH_SUMMARY.md +177 -0
package/docs/ERROR_HANDLING_IMPLEMENTATION.md +327 -0
package/docs/GITHUB_PACKAGES.md +181 -0
package/docs/GITHUB_SETUP.md +158 -0
package/docs/INSTALLATION_DEMO.md +691 -0
package/docs/INSTALLATION_LOCATIONS.md +299 -0
package/docs/INSTALLER_GUIDE.md +1586 -0
package/docs/INTEGRATION_ISSUES_9.1.md +341 -0
package/docs/KNOWLEDGE_BASE.md +727 -0
package/docs/MIGRATION.md +384 -0
package/docs/PACKAGE_BASELINE.md +557 -0
package/docs/PACKAGE_VALIDATION_REPORT.md +427 -0
package/docs/PASS_INTEGRATION.md +307 -0
package/docs/PASS_QUICK_START.md +150 -0
package/docs/PRIVACY.md +203 -0
package/docs/PUBLISHING.md +494 -0
package/docs/QUICK-START.md +318 -0
package/docs/RELEASE_NOTES_1.2.0.md +323 -0
package/docs/SECURITY.md +317 -0
package/docs/SILENT_MODE_GUIDE.md +526 -0
package/docs/SKILLS_CONVERSION.md +154 -0
package/docs/TESTING.md +582 -0
package/docs/TEST_COVERAGE.md +347 -0
package/docs/TROUBLESHOOTING.md +788 -0
package/docs/UPDATED_VARIANT_CONFIGURATION.md +274 -0
package/docs/VARIANT_CONFIGURATION.md +440 -0
package/installer/cli.js +761 -0
package/installer/installation-engine.js +1536 -0
package/installer/package-manager.js +640 -0
package/installer/path-manager.js +427 -0
package/installer/report-template.js +298 -0
package/installer/verification-system.js +274 -0
package/package.json +83 -0
package/packages/ampcode/AGENT.md +58 -0
package/packages/ampcode/README.md +17 -0
package/packages/ampcode/agents/1-create-prd.md +175 -0
package/packages/ampcode/agents/2-generate-tasks.md +190 -0
package/packages/ampcode/agents/3-process-task-list.md +225 -0
package/packages/ampcode/agents/code-developer.md +198 -0
package/packages/ampcode/agents/context-builder.md +142 -0
package/packages/ampcode/agents/feature-planner.md +199 -0
package/packages/ampcode/agents/market-researcher.md +89 -0
package/packages/ampcode/agents/orchestrator.md +116 -0
package/packages/ampcode/agents/quality-assurance.md +115 -0
package/packages/ampcode/agents/system-architect.md +135 -0
package/packages/ampcode/agents/ui-designer.md +184 -0
package/packages/ampcode/commands/brainstorming.md +56 -0
package/packages/ampcode/commands/code-review.md +107 -0
package/packages/ampcode/commands/condition-based-waiting/example.ts +158 -0
package/packages/ampcode/commands/condition-based-waiting.md +122 -0
package/packages/ampcode/commands/debug.md +20 -0
package/packages/ampcode/commands/docs-builder/templates.md +572 -0
package/packages/ampcode/commands/docs-builder.md +106 -0
package/packages/ampcode/commands/explain.md +18 -0
package/packages/ampcode/commands/git-commit.md +14 -0
package/packages/ampcode/commands/optimize.md +20 -0
package/packages/ampcode/commands/refactor.md +21 -0
package/packages/ampcode/commands/review.md +18 -0
package/packages/ampcode/commands/root-cause-tracing/find-polluter.sh +63 -0
package/packages/ampcode/commands/root-cause-tracing.md +176 -0
package/packages/ampcode/commands/security.md +21 -0
package/packages/ampcode/commands/ship.md +18 -0
package/packages/ampcode/commands/skill-creator/scripts/init_skill.py +303 -0
package/packages/ampcode/commands/skill-creator/scripts/package_skill.py +110 -0
package/packages/ampcode/commands/skill-creator/scripts/quick_validate.py +65 -0
package/packages/ampcode/commands/skill-creator.md +211 -0
package/packages/ampcode/commands/stash.md +45 -0
package/packages/ampcode/commands/systematic-debugging.md +297 -0
package/packages/ampcode/commands/test-driven-development.md +390 -0
package/packages/ampcode/commands/test-generate.md +18 -0
package/packages/ampcode/commands/testing-anti-patterns.md +304 -0
package/packages/ampcode/commands/verification-before-completion.md +152 -0
package/packages/ampcode/settings.json +13 -0
package/packages/ampcode/variants.json +8 -0
package/packages/claude/CLAUDE.md +58 -0
package/packages/claude/README.md +23 -0
package/packages/claude/agents/1-create-prd.md +175 -0
package/packages/claude/agents/2-generate-tasks.md +190 -0
package/packages/claude/agents/3-process-task-list.md +225 -0
package/packages/claude/agents/code-developer.md +198 -0
package/packages/claude/agents/context-builder.md +142 -0
package/packages/claude/agents/feature-planner.md +199 -0
package/packages/claude/agents/market-researcher.md +89 -0
package/packages/claude/agents/orchestrator.md +117 -0
package/packages/claude/agents/quality-assurance.md +115 -0
package/packages/claude/agents/system-architect.md +135 -0
package/packages/claude/agents/ui-designer.md +184 -0
package/packages/claude/commands/debug.md +20 -0
package/packages/claude/commands/explain.md +18 -0
package/packages/claude/commands/git-commit.md +14 -0
package/packages/claude/commands/optimize.md +20 -0
package/packages/claude/commands/refactor.md +21 -0
package/packages/claude/commands/review.md +18 -0
package/packages/claude/commands/security.md +21 -0
package/packages/claude/commands/ship.md +18 -0
package/packages/claude/commands/stash.md +45 -0
package/packages/claude/commands/test-generate.md +18 -0
package/packages/claude/skills/brainstorming/SKILL.md +56 -0
package/packages/claude/skills/code-review/SKILL.md +107 -0
package/packages/claude/skills/code-review/code-reviewer.md +146 -0
package/packages/claude/skills/condition-based-waiting/SKILL.md +122 -0
package/packages/claude/skills/condition-based-waiting/example.ts +158 -0
package/packages/claude/skills/docs-builder/SKILL.md +106 -0
package/packages/claude/skills/docs-builder/references/templates.md +572 -0
package/packages/claude/skills/root-cause-tracing/SKILL.md +176 -0
package/packages/claude/skills/root-cause-tracing/find-polluter.sh +63 -0
package/packages/claude/skills/skill-creator/LICENSE.txt +202 -0
package/packages/claude/skills/skill-creator/SKILL.md +211 -0
package/packages/claude/skills/skill-creator/scripts/init_skill.py +303 -0
package/packages/claude/skills/skill-creator/scripts/package_skill.py +110 -0
package/packages/claude/skills/skill-creator/scripts/quick_validate.py +65 -0
package/packages/claude/skills/systematic-debugging/CREATION-LOG.md +119 -0
package/packages/claude/skills/systematic-debugging/SKILL.md +296 -0
package/packages/claude/skills/systematic-debugging/test-academic.md +14 -0
package/packages/claude/skills/systematic-debugging/test-pressure-1.md +58 -0
package/packages/claude/skills/systematic-debugging/test-pressure-2.md +68 -0
package/packages/claude/skills/systematic-debugging/test-pressure-3.md +69 -0
package/packages/claude/skills/test-driven-development/SKILL.md +392 -0
package/packages/claude/skills/testing-anti-patterns/SKILL.md +304 -0
package/packages/claude/skills/verification-before-completion/SKILL.md +152 -0
package/packages/claude/variants.json +9 -0
package/packages/droid/AGENTS.md +52 -0
package/packages/droid/README.md +17 -0
package/packages/droid/change_settings.json +61 -0
package/packages/droid/commands/brainstorming.md +56 -0
package/packages/droid/commands/code-review.md +107 -0
package/packages/droid/commands/condition-based-waiting/example.ts +158 -0
package/packages/droid/commands/condition-based-waiting.md +122 -0
package/packages/droid/commands/debug.md +20 -0
package/packages/droid/commands/docs-builder/templates.md +572 -0
package/packages/droid/commands/docs-builder.md +106 -0
package/packages/droid/commands/explain.md +18 -0
package/packages/droid/commands/git-commit.md +14 -0
package/packages/droid/commands/optimize.md +20 -0
package/packages/droid/commands/refactor.md +21 -0
package/packages/droid/commands/review.md +18 -0
package/packages/droid/commands/root-cause-tracing/find-polluter.sh +63 -0
package/packages/droid/commands/root-cause-tracing.md +176 -0
package/packages/droid/commands/security.md +21 -0
package/packages/droid/commands/ship.md +18 -0
package/packages/droid/commands/skill-creator/scripts/init_skill.py +303 -0
package/packages/droid/commands/skill-creator/scripts/package_skill.py +110 -0
package/packages/droid/commands/skill-creator/scripts/quick_validate.py +65 -0
package/packages/droid/commands/skill-creator.md +211 -0
package/packages/droid/commands/stash.md +45 -0
package/packages/droid/commands/systematic-debugging.md +297 -0
package/packages/droid/commands/test-driven-development.md +390 -0
package/packages/droid/commands/test-generate.md +18 -0
package/packages/droid/commands/testing-anti-patterns.md +304 -0
package/packages/droid/commands/verification-before-completion.md +152 -0
package/packages/droid/droids/1-create-prd.md +170 -0
package/packages/droid/droids/2-generate-tasks.md +190 -0
package/packages/droid/droids/3-process-task-list.md +225 -0
package/packages/droid/droids/code-developer.md +198 -0
package/packages/droid/droids/context-builder.md +142 -0
package/packages/droid/droids/feature-planner.md +199 -0
package/packages/droid/droids/market-researcher.md +89 -0
package/packages/droid/droids/orchestrator.md +116 -0
package/packages/droid/droids/quality-assurance.md +115 -0
package/packages/droid/droids/system-architect.md +135 -0
package/packages/droid/droids/ui-designer.md +184 -0
package/packages/droid/variants.json +8 -0
package/packages/opencode/AGENTS.md +52 -0
package/packages/opencode/README.md +17 -0
package/packages/opencode/agent/1-create-prd.md +179 -0
package/packages/opencode/agent/2-generate-tasks.md +194 -0
package/packages/opencode/agent/3-process-task-list.md +229 -0
package/packages/opencode/agent/code-developer.md +202 -0
package/packages/opencode/agent/context-builder.md +146 -0
package/packages/opencode/agent/feature-planner.md +203 -0
package/packages/opencode/agent/market-researcher.md +93 -0
package/packages/opencode/agent/orchestrator.md +120 -0
package/packages/opencode/agent/quality-assurance.md +119 -0
package/packages/opencode/agent/system-architect.md +139 -0
package/packages/opencode/agent/ui-designer.md +188 -0
package/packages/opencode/command/brainstorming.md +56 -0
package/packages/opencode/command/code-review.md +107 -0
package/packages/opencode/command/condition-based-waiting/example.ts +158 -0
package/packages/opencode/command/condition-based-waiting.md +122 -0
package/packages/opencode/command/debug.md +20 -0
package/packages/opencode/command/docs-builder/templates.md +572 -0
package/packages/opencode/command/docs-builder.md +106 -0
package/packages/opencode/command/explain.md +18 -0
package/packages/opencode/command/git-commit.md +14 -0
package/packages/opencode/command/optimize.md +20 -0
package/packages/opencode/command/refactor.md +21 -0
package/packages/opencode/command/review.md +18 -0
package/packages/opencode/command/root-cause-tracing/find-polluter.sh +63 -0
package/packages/opencode/command/root-cause-tracing.md +176 -0
package/packages/opencode/command/security.md +21 -0
package/packages/opencode/command/ship.md +18 -0
package/packages/opencode/command/skill-creator/scripts/init_skill.py +303 -0
package/packages/opencode/command/skill-creator/scripts/package_skill.py +110 -0
package/packages/opencode/command/skill-creator/scripts/quick_validate.py +65 -0
package/packages/opencode/command/skill-creator.md +211 -0
package/packages/opencode/command/stash.md +45 -0
package/packages/opencode/command/systematic-debugging.md +297 -0
package/packages/opencode/command/test-driven-development.md +390 -0
package/packages/opencode/command/test-generate.md +18 -0
package/packages/opencode/command/testing-anti-patterns.md +304 -0
package/packages/opencode/command/verification-before-completion.md +152 -0
package/packages/opencode/opencode.jsonc +201 -0
package/packages/opencode/variants.json +8 -0
package/packages/subagentic-manual.md +349 -0
package/postinstall.js +21 -0
package/tools/ampcode/manifest-template.json +14 -0
package/tools/claude/manifest-template.json +14 -0
package/tools/droid/manifest-template.json +14 -0
package/tools/opencode/manifest-template.json +14 -0

package/packages/claude/commands/ship.md ADDED Viewed

@@ -0,0 +1,18 @@
+---
+name: ship
+description: Check pre-deployment
+usage: /ship
+allowed-tools: Bash(npm *), Bash(git *)
+---
+Pre-deploy checklist:
+- [ ] Tests pass (`npm test`)
+- [ ] Lint clean (`npm run lint`)
+- [ ] Build succeeds (`npm run build`)
+- [ ] No console.log/debugger statements
+- [ ] Env vars documented
+- [ ] No hardcoded secrets
+- [ ] Error handling complete
+- [ ] Migrations ready
+Run checks and report: Ready 🚀 or Blocked 🛑 with issues.

package/packages/claude/commands/stash.md ADDED Viewed

@@ -0,0 +1,45 @@
+---
+name: stash
+description: Stash session context [name]
+usage: /stash ["optional-name"]
+argument-hint: [optional stash name]
+---
+Save session context for compaction recovery or handoffs.
+**Guardrails**
+- Favor straightforward, minimal implementations first and add complexity only when requested or clearly required.
+- Keep changes tightly scoped to the requested outcome.
+**What it does**
+1. Captures current conversation context and key decisions
+2. Records active work in progress
+3. Stores important findings and insights
+4. Creates stash file in `.claude/stash/`
+5. Enables context restoration after compaction
+**When to use**
+- Before long-running tasks that may trigger compaction
+- When handing off work to another agent or session
+- After completing major investigation or analysis
+- Before taking a break from complex multi-step work
+**Commands**
+```bash
+# Stash with auto-generated name
+/stash
+# Stash with custom name
+/stash "feature-auth-investigation"
+# List available stashes
+ls .claude/stash/
+# Restore from stash
+cat .claude/stash/<name>.md
+```
+**Reference**
+- Stashes stored in `.claude/stash/` (project-local)
+- Automatically includes: timestamp, active plan, recent decisions
+- Maximum context retention with minimal token usage

package/packages/claude/commands/test-generate.md ADDED Viewed

@@ -0,0 +1,18 @@
+---
+name: test-generate
+description: Generate tests [file]
+usage: /test-generate <code-section>
+argument-hint: [file-to-test]
+---
+Generate tests for $ARGUMENTS.
+## Include
+- Happy path (expected usage)
+- Edge cases (empty, null, boundaries)
+- Error scenarios (invalid input, failures)
+- Integration points (mocks for external deps)
+## Requirements
+- Match existing test patterns in this project
+- Use the testing framework already in use
+- Clear test names: "should [expected] when [condition]"

package/packages/claude/skills/brainstorming/SKILL.md ADDED Viewed

@@ -0,0 +1,56 @@
+---
+name: brainstorming
+description: Use when creating or developing, before writing code or implementation plans - refines rough ideas into fully-formed designs through collaborative questioning, alternative exploration, and incremental validation. Don't use during clear 'mechanical' processes
+usage: /brainstorming <session-type> <topic>
+auto_trigger: false
+---
+# Brainstorming Ideas Into Designs
+## Overview
+Help turn ideas into fully formed designs and specs through natural collaborative dialogue.
+Start by understanding the current project context, then ask questions one at a time to refine the idea. Once you understand what you're building, present the design in small sections (200-300 words), checking after each section whether it looks right so far.
+## The Process
+**Understanding the idea:**
+- Check out the current project state first (files, docs, recent commits)
+- Ask questions one at a time to refine the idea
+- Prefer multiple choice questions when possible, but open-ended is fine too
+- Only one question per message - if a topic needs more exploration, break it into multiple questions
+- Focus on understanding: purpose, constraints, success criteria
+**Exploring approaches:**
+- Propose 2-3 different approaches with trade-offs
+- Present options conversationally with your recommendation and reasoning
+- Lead with your recommended option and explain why
+**Presenting the design:**
+- Once you believe you understand what you're building, present the design
+- Break it into sections of 200-300 words
+- Ask after each section whether it looks right so far
+- Cover: architecture, components, data flow, error handling, testing
+- Be ready to go back and clarify if something doesn't make sense
+## After the Design
+**Documentation:**
+- Write the validated design to `docs/plans/YYYY-MM-DD-<topic>-design.md`
+- Use elements-of-style:writing-clearly-and-concisely skill if available
+- Commit the design document to git
+**Implementation (if continuing):**
+- Ask: "Ready to set up for implementation?"
+- Create isolated workspace for implementation
+- Create detailed implementation plan
+## Key Principles
+- **One question at a time** - Don't overwhelm with multiple questions
+- **Multiple choice preferred** - Easier to answer than open-ended when possible
+- **YAGNI ruthlessly** - Remove unnecessary features from all designs
+- **Explore alternatives** - Always propose 2-3 approaches before settling
+- **Incremental validation** - Present design in sections, validate each
+- **Be flexible** - Go back and clarify when something doesn't make sense

package/packages/claude/skills/code-review/SKILL.md ADDED Viewed

@@ -0,0 +1,107 @@
+---
+name: code-review
+description: Use when completing tasks, implementing major features, or before merging to verify work meets requirements - reviews implementation against plan or requirements before proceeding
+usage: /code-review <review-scope> <focus-areas>
+auto_trigger: false
+---
+# Requesting Code Review
+Review code thoroughly to catch issues before they cascade.
+**Core principle:** Review early, review often.
+## When to Request Review
+**Mandatory:**
+- After each task in subagent-driven development
+- After completing major feature
+- Before merge to main
+**Optional but valuable:**
+- When stuck (fresh perspective)
+- Before refactoring (baseline check)
+- After fixing complex bug
+## How to Request
+**1. Get git SHAs:**
+```bash
+BASE_SHA=$(git rev-parse HEAD~1)  # or origin/main
+HEAD_SHA=$(git rev-parse HEAD)
+```
+**2. Conduct code review:**
+Review implementation against requirements and plan
+**Placeholders:**
+- `{WHAT_WAS_IMPLEMENTED}` - What you just built
+- `{PLAN_OR_REQUIREMENTS}` - What it should do
+- `{BASE_SHA}` - Starting commit
+- `{HEAD_SHA}` - Ending commit
+- `{DESCRIPTION}` - Brief summary
+**3. Act on feedback:**
+- Fix Critical issues immediately
+- Fix Important issues before proceeding
+- Note Minor issues for later
+- Push back if reviewer is wrong (with reasoning)
+## Example
+```
+[Just completed Task 2: Add verification function]
+You: Let me request code review before proceeding.
+BASE_SHA=$(git log --oneline | grep "Task 1" | head -1 | awk '{print $1}')
+HEAD_SHA=$(git rev-parse HEAD)
+[Conduct code review]
+  WHAT_WAS_IMPLEMENTED: Verification and repair functions for conversation index
+  PLAN_OR_REQUIREMENTS: Task 2 from docs/plans/deployment-plan.md
+  BASE_SHA: a7981ec
+  HEAD_SHA: 3df7661
+  DESCRIPTION: Added verifyIndex() and repairIndex() with 4 issue types
+[Subagent returns]:
+  Strengths: Clean architecture, real tests
+  Issues:
+    Important: Missing progress indicators
+    Minor: Magic number (100) for reporting interval
+  Assessment: Ready to proceed
+You: [Fix progress indicators]
+[Continue to Task 3]
+```
+## Integration with Workflows
+**Subagent-Driven Development:**
+- Review after EACH task
+- Catch issues before they compound
+- Fix before moving to next task
+**Executing Plans:**
+- Review after each batch (3 tasks)
+- Get feedback, apply, continue
+**Ad-Hoc Development:**
+- Review before merge
+- Review when stuck
+## Red Flags
+**Never:**
+- Skip review because "it's simple"
+- Ignore Critical issues
+- Proceed with unfixed Important issues
+- Argue with valid technical feedback
+**If reviewer wrong:**
+- Push back with technical reasoning
+- Show code/tests that prove it works
+- Request clarification
+See template at: code-review/code-reviewer.md

package/packages/claude/skills/code-review/code-reviewer.md ADDED Viewed

@@ -0,0 +1,146 @@
+# Code Review Agent
+You are reviewing code changes for production readiness.
+**Your task:**
+1. Review {WHAT_WAS_IMPLEMENTED}
+2. Compare against {PLAN_OR_REQUIREMENTS}
+3. Check code quality, architecture, testing
+4. Categorize issues by severity
+5. Assess production readiness
+## What Was Implemented
+{DESCRIPTION}
+## Requirements/Plan
+{PLAN_OR_REQUIREMENTS}
+## Git Range to Review
+**Base:** {BASE_SHA}
+**Head:** {HEAD_SHA}
+```bash
+git diff --stat {BASE_SHA}..{HEAD_SHA}
+git diff {BASE_SHA}..{HEAD_SHA}
+```
+## Review Checklist
+**Code Quality:**
+- Clean separation of concerns?
+- Proper error handling?
+- Type safety (if applicable)?
+- DRY principle followed?
+- Edge cases handled?
+**Architecture:**
+- Sound design decisions?
+- Scalability considerations?
+- Performance implications?
+- Security concerns?
+**Testing:**
+- Tests actually test logic (not mocks)?
+- Edge cases covered?
+- Integration tests where needed?
+- All tests passing?
+**Requirements:**
+- All plan requirements met?
+- Implementation matches spec?
+- No scope creep?
+- Breaking changes documented?
+**Production Readiness:**
+- Migration strategy (if schema changes)?
+- Backward compatibility considered?
+- Documentation complete?
+- No obvious bugs?
+## Output Format
+### Strengths
+[What's well done? Be specific.]
+### Issues
+#### Critical (Must Fix)
+[Bugs, security issues, data loss risks, broken functionality]
+#### Important (Should Fix)
+[Architecture problems, missing features, poor error handling, test gaps]
+#### Minor (Nice to Have)
+[Code style, optimization opportunities, documentation improvements]
+**For each issue:**
+- File:line reference
+- What's wrong
+- Why it matters
+- How to fix (if not obvious)
+### Recommendations
+[Improvements for code quality, architecture, or process]
+### Assessment
+**Ready to merge?** [Yes/No/With fixes]
+**Reasoning:** [Technical assessment in 1-2 sentences]
+## Critical Rules
+**DO:**
+- Categorize by actual severity (not everything is Critical)
+- Be specific (file:line, not vague)
+- Explain WHY issues matter
+- Acknowledge strengths
+- Give clear verdict
+**DON'T:**
+- Say "looks good" without checking
+- Mark nitpicks as Critical
+- Give feedback on code you didn't review
+- Be vague ("improve error handling")
+- Avoid giving a clear verdict
+## Example Output
+```
+### Strengths
+- Clean database schema with proper migrations (db.ts:15-42)
+- Comprehensive test coverage (18 tests, all edge cases)
+- Good error handling with fallbacks (summarizer.ts:85-92)
+### Issues
+#### Important
+1. **Missing help text in CLI wrapper**
+   - File: index-conversations:1-31
+   - Issue: No --help flag, users won't discover --concurrency
+   - Fix: Add --help case with usage examples
+2. **Date validation missing**
+   - File: search.ts:25-27
+   - Issue: Invalid dates silently return no results
+   - Fix: Validate ISO format, throw error with example
+#### Minor
+1. **Progress indicators**
+   - File: indexer.ts:130
+   - Issue: No "X of Y" counter for long operations
+   - Impact: Users don't know how long to wait
+### Recommendations
+- Add progress reporting for user experience
+- Consider config file for excluded projects (portability)
+### Assessment
+**Ready to merge?** With fixes
+**Reasoning:** Core implementation is solid with good architecture and tests. Important issues (help text, date validation) are easily fixed and don't affect core functionality.
+```

package/packages/claude/skills/condition-based-waiting/SKILL.md ADDED Viewed

@@ -0,0 +1,122 @@
+---
+name: condition-based-waiting
+description: Use when tests have race conditions, timing dependencies, or inconsistent pass/fail behavior - replaces arbitrary timeouts with condition polling to wait for actual state changes, eliminating flaky tests from timing guesses
+usage: /condition-based-waiting <condition-type> <timeout-specs>
+auto_trigger: false
+---
+# Condition-Based Waiting
+## Overview
+Flaky tests often guess at timing with arbitrary delays. This creates race conditions where tests pass on fast machines but fail under load or in CI.
+**Core principle:** Wait for the actual condition you care about, not a guess about how long it takes.
+## When to Use
+```dot
+digraph when_to_use {
+    "Test uses setTimeout/sleep?" [shape=diamond];
+    "Testing timing behavior?" [shape=diamond];
+    "Document WHY timeout needed" [shape=box];
+    "Use condition-based waiting" [shape=box];
+    "Test uses setTimeout/sleep?" -> "Testing timing behavior?" [label="yes"];
+    "Testing timing behavior?" -> "Document WHY timeout needed" [label="yes"];
+    "Testing timing behavior?" -> "Use condition-based waiting" [label="no"];
+}
+```
+**Use when:**
+- Tests have arbitrary delays (`setTimeout`, `sleep`, `time.sleep()`)
+- Tests are flaky (pass sometimes, fail under load)
+- Tests timeout when run in parallel
+- Waiting for async operations to complete
+**Don't use when:**
+- Testing actual timing behavior (debounce, throttle intervals)
+  - If you do use an arbitrary timeout there, always document WHY it is needed
+## Core Pattern
+```typescript
+// ❌ BEFORE: Guessing at timing
+await new Promise(r => setTimeout(r, 50));
+const result = getResult();
+expect(result).toBeDefined();
+// ✅ AFTER: Waiting for condition
+await waitFor(() => getResult() !== undefined);
+const result = getResult();
+expect(result).toBeDefined();
+```
+## Quick Patterns
+| Scenario | Pattern |
+|----------|---------|
+| Wait for event | `waitFor(() => events.find(e => e.type === 'DONE'))` |
+| Wait for state | `waitFor(() => machine.state === 'ready')` |
+| Wait for count | `waitFor(() => items.length >= 5)` |
+| Wait for file | `waitFor(() => fs.existsSync(path))` |
+| Complex condition | `waitFor(() => obj.ready && obj.value > 10)` |
+## Implementation
+Generic polling function:
+```typescript
+/**
+ * Poll `condition` until it returns a truthy value, then resolve with that value.
+ *
+ * @param condition - Called on every poll; any falsy result (including `0` and `''`)
+ *   means "not ready yet"
+ * @param description - Label used in the timeout error message. Defaults to
+ *   'condition' so that one-argument calls such as `waitFor(() => items.length >= 5)`
+ *   are valid.
+ * @param timeoutMs - Maximum time to wait before giving up (default 5000ms)
+ * @returns Promise resolving to the first truthy value returned by `condition`
+ * @throws Error when `condition` is still falsy and more than `timeoutMs` has elapsed
+ */
+async function waitFor<T>(
+  condition: () => T | undefined | null | false,
+  description = 'condition',
+  timeoutMs = 5000
+): Promise<T> {
+  const startTime = Date.now();
+  while (true) {
+    const result = condition(); // Re-evaluated on every pass so state is never stale
+    if (result) return result;
+    if (Date.now() - startTime > timeoutMs) {
+      throw new Error(`Timeout waiting for ${description} after ${timeoutMs}ms`);
+    }
+    await new Promise(r => setTimeout(r, 10)); // Poll every 10ms
+  }
+}
+```
+See @example.ts for complete implementation with domain-specific helpers (`waitForEvent`, `waitForEventCount`, `waitForEventMatch`) from actual debugging session.
+## Common Mistakes
+**❌ Polling too fast:** `setTimeout(check, 1)` - wastes CPU
+**✅ Fix:** Poll every 10ms
+**❌ No timeout:** Loop forever if condition never met
+**✅ Fix:** Always include timeout with clear error
+**❌ Stale data:** Cache state before loop
+**✅ Fix:** Call getter inside loop for fresh data
+## When Arbitrary Timeout IS Correct
+```typescript
+// Tool ticks every 100ms - need 2 ticks to verify partial output
+await waitForEvent(manager, 'TOOL_STARTED'); // First: wait for condition
+await new Promise(r => setTimeout(r, 200));   // Then: wait for timed behavior
+// 200ms = 2 ticks at 100ms intervals - documented and justified
+```
+**Requirements:**
+1. First wait for triggering condition
+2. Based on known timing (not guessing)
+3. Comment explaining WHY
+## Real-World Impact
+From debugging session (2025-10-03):
+- Fixed 15 flaky tests across 3 files
+- Pass rate: 60% → 100%
+- Execution time: 40% faster
+- No more race conditions

package/packages/claude/skills/condition-based-waiting/example.ts ADDED Viewed

@@ -0,0 +1,158 @@
+// Complete implementation of condition-based waiting utilities
+// From: Lace test infrastructure improvements (2025-10-03)
+// Context: Fixed 15 flaky tests by replacing arbitrary timeouts
+import type { ThreadManager } from '~/threads/thread-manager';
+import type { LaceEvent, LaceEventType } from '~/threads/types';
+/**
+ * Wait for a specific event type to appear in thread
+ *
+ * Polls `threadManager.getEvents(threadId)` every 10ms. The first check runs
+ * synchronously inside the Promise executor, so an event that is already
+ * present settles the promise without waiting for a poll interval.
+ *
+ * @param threadManager - The thread manager to query
+ * @param threadId - Thread to check for events
+ * @param eventType - Type of event to wait for
+ * @param timeoutMs - Maximum time to wait (default 5000ms)
+ * @returns Promise resolving to the first matching event
+ * @throws Rejects with an Error ("Timeout waiting for <eventType> event after
+ *   <timeoutMs>ms") when a poll finds no match and more than `timeoutMs` has
+ *   elapsed since the call. A match always wins over the timeout because it
+ *   is tested first.
+ *
+ * Example:
+ *   await waitForEvent(threadManager, agentThreadId, 'TOOL_RESULT');
+ */
+export function waitForEvent(
+  threadManager: ThreadManager,
+  threadId: string,
+  eventType: LaceEventType,
+  timeoutMs = 5000
+): Promise<LaceEvent> {
+  return new Promise((resolve, reject) => {
+    const startTime = Date.now();
+    const check = () => {
+      const events = threadManager.getEvents(threadId);
+      const event = events.find((e) => e.type === eventType);
+      if (event) {
+        resolve(event);
+      } else if (Date.now() - startTime > timeoutMs) {
+        reject(new Error(`Timeout waiting for ${eventType} event after ${timeoutMs}ms`));
+      } else {
+        setTimeout(check, 10); // No match yet and still within the time budget: poll again in 10ms
+      }
+    };
+    check();
+  });
+}
+/**
+ * Wait for a specific number of events of a given type
+ *
+ * Re-reads `threadManager.getEvents(threadId)` every 10ms and counts the
+ * events whose `type` equals `eventType`. The first check runs synchronously
+ * when the function is called.
+ *
+ * @param threadManager - The thread manager to query
+ * @param threadId - Thread to check for events
+ * @param eventType - Type of event to wait for
+ * @param count - Number of events to wait for (treated as a minimum: the
+ *   promise resolves as soon as at least this many are present)
+ * @param timeoutMs - Maximum time to wait (default 5000ms)
+ * @returns Promise resolving to all matching events once count is reached;
+ *   the array may contain more than `count` entries
+ * @throws Rejects with an Error when fewer than `count` matching events exist
+ *   and more than `timeoutMs` has elapsed; the message reports how many
+ *   matching events had been seen at that point
+ *
+ * Example:
+ *   // Wait for 2 AGENT_MESSAGE events (initial response + continuation)
+ *   await waitForEventCount(threadManager, agentThreadId, 'AGENT_MESSAGE', 2);
+ */
+export function waitForEventCount(
+  threadManager: ThreadManager,
+  threadId: string,
+  eventType: LaceEventType,
+  count: number,
+  timeoutMs = 5000
+): Promise<LaceEvent[]> {
+  return new Promise((resolve, reject) => {
+    const startTime = Date.now();
+    const check = () => {
+      const events = threadManager.getEvents(threadId);
+      const matchingEvents = events.filter((e) => e.type === eventType);
+      if (matchingEvents.length >= count) {
+        resolve(matchingEvents);
+      } else if (Date.now() - startTime > timeoutMs) {
+        reject(
+          new Error(
+            `Timeout waiting for ${count} ${eventType} events after ${timeoutMs}ms (got ${matchingEvents.length})`
+          )
+        );
+      } else {
+        setTimeout(check, 10);
+      }
+    };
+    check();
+  });
+}
+/**
+ * Wait for an event matching a custom predicate
+ * Useful when you need to check event data, not just type
+ *
+ * Re-reads `threadManager.getEvents(threadId)` every 10ms and runs `predicate`
+ * over the result via `find`. The first check runs synchronously when the
+ * function is called.
+ *
+ * @param threadManager - The thread manager to query
+ * @param threadId - Thread to check for events
+ * @param predicate - Function that returns true when event matches
+ * @param description - Human-readable description for error messages; it is
+ *   only used to build the timeout message and does not affect matching
+ * @param timeoutMs - Maximum time to wait (default 5000ms)
+ * @returns Promise resolving to the first matching event
+ * @throws Rejects with an Error ("Timeout waiting for <description> after
+ *   <timeoutMs>ms") when no event matches and more than `timeoutMs` has elapsed
+ *
+ * Example:
+ *   // Wait for TOOL_RESULT with specific ID
+ *   await waitForEventMatch(
+ *     threadManager,
+ *     agentThreadId,
+ *     (e) => e.type === 'TOOL_RESULT' && e.data.id === 'call_123',
+ *     'TOOL_RESULT with id=call_123'
+ *   );
+ */
+export function waitForEventMatch(
+  threadManager: ThreadManager,
+  threadId: string,
+  predicate: (event: LaceEvent) => boolean,
+  description: string,
+  timeoutMs = 5000
+): Promise<LaceEvent> {
+  return new Promise((resolve, reject) => {
+    const startTime = Date.now();
+    const check = () => {
+      const events = threadManager.getEvents(threadId);
+      const event = events.find(predicate);
+      if (event) {
+        resolve(event);
+      } else if (Date.now() - startTime > timeoutMs) {
+        reject(new Error(`Timeout waiting for ${description} after ${timeoutMs}ms`));
+      } else {
+        setTimeout(check, 10);
+      }
+    };
+    check();
+  });
+}
+// Usage example from actual debugging session:
+//
+// BEFORE (flaky):
+// ---------------
+// const messagePromise = agent.sendMessage('Execute tools');
+// await new Promise(r => setTimeout(r, 300)); // Hope tools start in 300ms
+// agent.abort();
+// await messagePromise;
+// await new Promise(r => setTimeout(r, 50));  // Hope results arrive in 50ms
+// expect(toolResults.length).toBe(2);         // Fails randomly
+//
+// AFTER (reliable):
+// ----------------
+// const messagePromise = agent.sendMessage('Execute tools');
+// await waitForEventCount(threadManager, threadId, 'TOOL_CALL', 2); // Wait for tools to start
+// agent.abort();
+// await messagePromise;
+// await waitForEventCount(threadManager, threadId, 'TOOL_RESULT', 2); // Wait for results
+// expect(toolResults.length).toBe(2); // Always succeeds
+//
+// Result: 60% pass rate → 100%, 40% faster execution