npm - codex-workflows - Versions diffs - 0.1.0 - Mend

codex-workflows 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85)

package/.agents/skills/ai-development-guide/SKILL.md +283 -0
package/.agents/skills/ai-development-guide/agents/openai.yaml +7 -0
package/.agents/skills/ai-development-guide/references/frontend.md +135 -0
package/.agents/skills/coding-rules/SKILL.md +98 -0
package/.agents/skills/coding-rules/agents/openai.yaml +7 -0
package/.agents/skills/coding-rules/references/typescript.md +220 -0
package/.agents/skills/documentation-criteria/SKILL.md +127 -0
package/.agents/skills/documentation-criteria/agents/openai.yaml +7 -0
package/.agents/skills/documentation-criteria/references/adr-template.md +64 -0
package/.agents/skills/documentation-criteria/references/design-template.md +327 -0
package/.agents/skills/documentation-criteria/references/plan-template.md +131 -0
package/.agents/skills/documentation-criteria/references/prd-template.md +119 -0
package/.agents/skills/documentation-criteria/references/task-template.md +38 -0
package/.agents/skills/documentation-criteria/references/ui-spec-template.md +145 -0
package/.agents/skills/implementation-approach/SKILL.md +145 -0
package/.agents/skills/implementation-approach/agents/openai.yaml +7 -0
package/.agents/skills/integration-e2e-testing/SKILL.md +125 -0
package/.agents/skills/integration-e2e-testing/agents/openai.yaml +7 -0
package/.agents/skills/integration-e2e-testing/references/e2e-design.md +86 -0
package/.agents/skills/recipe-add-integration-tests/SKILL.md +128 -0
package/.agents/skills/recipe-add-integration-tests/agents/openai.yaml +7 -0
package/.agents/skills/recipe-build/SKILL.md +119 -0
package/.agents/skills/recipe-build/agents/openai.yaml +7 -0
package/.agents/skills/recipe-design/SKILL.md +90 -0
package/.agents/skills/recipe-design/agents/openai.yaml +7 -0
package/.agents/skills/recipe-diagnose/SKILL.md +187 -0
package/.agents/skills/recipe-diagnose/agents/openai.yaml +7 -0
package/.agents/skills/recipe-front-build/SKILL.md +127 -0
package/.agents/skills/recipe-front-build/agents/openai.yaml +7 -0
package/.agents/skills/recipe-front-design/SKILL.md +90 -0
package/.agents/skills/recipe-front-design/agents/openai.yaml +7 -0
package/.agents/skills/recipe-front-plan/SKILL.md +68 -0
package/.agents/skills/recipe-front-plan/agents/openai.yaml +7 -0
package/.agents/skills/recipe-front-review/SKILL.md +101 -0
package/.agents/skills/recipe-front-review/agents/openai.yaml +7 -0
package/.agents/skills/recipe-fullstack-build/SKILL.md +139 -0
package/.agents/skills/recipe-fullstack-build/agents/openai.yaml +7 -0
package/.agents/skills/recipe-fullstack-implement/SKILL.md +151 -0
package/.agents/skills/recipe-fullstack-implement/agents/openai.yaml +7 -0
package/.agents/skills/recipe-implement/SKILL.md +125 -0
package/.agents/skills/recipe-implement/agents/openai.yaml +7 -0
package/.agents/skills/recipe-plan/SKILL.md +73 -0
package/.agents/skills/recipe-plan/agents/openai.yaml +7 -0
package/.agents/skills/recipe-reverse-engineer/SKILL.md +212 -0
package/.agents/skills/recipe-reverse-engineer/agents/openai.yaml +7 -0
package/.agents/skills/recipe-review/SKILL.md +115 -0
package/.agents/skills/recipe-review/agents/openai.yaml +7 -0
package/.agents/skills/recipe-task/SKILL.md +74 -0
package/.agents/skills/recipe-task/agents/openai.yaml +7 -0
package/.agents/skills/recipe-update-doc/SKILL.md +156 -0
package/.agents/skills/recipe-update-doc/agents/openai.yaml +7 -0
package/.agents/skills/subagents-orchestration-guide/SKILL.md +354 -0
package/.agents/skills/subagents-orchestration-guide/agents/openai.yaml +7 -0
package/.agents/skills/subagents-orchestration-guide/references/monorepo-flow.md +124 -0
package/.agents/skills/task-analyzer/SKILL.md +142 -0
package/.agents/skills/task-analyzer/agents/openai.yaml +7 -0
package/.agents/skills/task-analyzer/references/skills-index.yaml +162 -0
package/.agents/skills/testing/SKILL.md +324 -0
package/.agents/skills/testing/agents/openai.yaml +7 -0
package/.agents/skills/testing/references/typescript.md +224 -0
package/.codex/agents/acceptance-test-generator.toml +310 -0
package/.codex/agents/code-reviewer.toml +228 -0
package/.codex/agents/code-verifier.toml +231 -0
package/.codex/agents/design-sync.toml +265 -0
package/.codex/agents/document-reviewer.toml +367 -0
package/.codex/agents/integration-test-reviewer.toml +178 -0
package/.codex/agents/investigator.toml +197 -0
package/.codex/agents/prd-creator.toml +250 -0
package/.codex/agents/quality-fixer-frontend.toml +356 -0
package/.codex/agents/quality-fixer.toml +249 -0
package/.codex/agents/requirement-analyzer.toml +172 -0
package/.codex/agents/rule-advisor.toml +186 -0
package/.codex/agents/scope-discoverer.toml +248 -0
package/.codex/agents/solver.toml +212 -0
package/.codex/agents/task-decomposer.toml +262 -0
package/.codex/agents/task-executor-frontend.toml +312 -0
package/.codex/agents/task-executor.toml +314 -0
package/.codex/agents/technical-designer-frontend.toml +492 -0
package/.codex/agents/technical-designer.toml +474 -0
package/.codex/agents/ui-spec-designer.toml +150 -0
package/.codex/agents/verifier.toml +228 -0
package/.codex/agents/work-planner.toml +251 -0
package/README.md +365 -0
package/bin/cli.js +249 -0
package/package.json +35 -0

package/.agents/skills/task-analyzer/references/skills-index.yaml ADDED Viewed

@@ -0,0 +1,162 @@
+# Skills Metadata Index
+# Used to select appropriate skills based on task analysis
+skills:
+  coding-rules:
+    skill: "coding-rules"
+    tags: [implementation, code-quality, refactoring, clean-code, maintainability, function-design, error-handling, parameterized-dependencies, performance, security]
+    typical-use: "Language-agnostic code creation, modification, and refactoring principles applicable to all programming languages"
+    size: medium
+    key-references:
+      - "YAGNI Principle - Kent Beck"
+      - "Clean Code - Robert C. Martin"
+      - "DRY Principle - The Pragmatic Programmer"
+      - "Refactoring - Martin Fowler"
+      - "Single Responsibility Principle - SOLID"
+    sections:
+      - "Core Philosophy [MANDATORY]"
+      - "Code Quality [MANDATORY]"
+      - "Function Design [MANDATORY]"
+      - "Error Handling [MANDATORY]"
+      - "Dependency Management"
+      - "Performance"
+      - "Code Organization"
+      - "Commenting Principles"
+      - "Refactoring [SAFE CHANGE PROTOCOL]"
+      - "Security"
+      - "Version Control [MANDATORY]"
+    references:
+      - "references/typescript.md"
+  testing:
+    skill: "testing"
+    tags: [testing, tdd, quality, unit-testing, integration-testing, e2e-testing, test-design, coverage, mocking, test-independence, ci-cd, test-quality-criteria]
+    typical-use: "Universal testing principles, TDD practice, test quality criteria, test creation and quality assurance for all programming languages"
+    size: large
+    key-references:
+      - "Test-Driven Development - Kent Beck"
+      - "Red-Green-Refactor Cycle - Kent Beck"
+      - "AAA Pattern - Arrange-Act-Assert"
+      - "Test Pyramid - Mike Cohn"
+    sections:
+      - "Core Testing Philosophy"
+      - "TDD Process [MANDATORY for all code changes]"
+      - "Quality Requirements [MANDATORY]"
+      - "Test Types"
+      - "Test Design Principles"
+      - "Test Independence"
+      - "Mocking and Test Doubles"
+      - "Test Quality Practices [MANDATORY]"
+      - "What to Test"
+      - "Test Quality Criteria [MANDATORY]"
+      - "Verification Requirements [MANDATORY for VERIFY phase]"
+      - "Test Organization"
+      - "Performance Considerations"
+      - "Common Anti-Patterns"
+      - "Regression Testing"
+    references:
+      - "references/typescript.md"
+  ai-development-guide:
+    skill: "ai-development-guide"
+    tags: [anti-patterns, technical-judgment, debugging, quality-commands, rule-of-three, implementation, refactoring, code-reading, best-practices, fail-fast, error-handling, impact-analysis]
+    typical-use: "Technical decision criteria, anti-pattern detection, debugging techniques, quality check workflows, impact analysis procedures"
+    size: large
+    key-references:
+      - "Rule of Three - Martin Fowler"
+      - "5 Whys - Toyota Production System"
+      - "DRY Principle - The Pragmatic Programmer"
+      - "YAGNI Principle - Extreme Programming"
+    sections:
+      - "Technical Anti-patterns (Red Flag Patterns) [MANDATORY]"
+      - "Fail-Fast Fallback Design Principles"
+      - "Rule of Three - Criteria for Code Duplication"
+      - "Common Failure Patterns and Avoidance Methods"
+      - "Debugging Techniques"
+      - "Quality Check Workflow [MANDATORY]"
+      - "Situations Requiring Technical Decisions"
+      - "Implementation Completeness Assurance"
+      - "Impact Analysis"
+  documentation-criteria:
+    skill: "documentation-criteria"
+    tags: [documentation, decision-making, adr, prd, design-doc, planning, process, scale-assessment]
+    typical-use: "Scale assessment at implementation start, document creation criteria, ADR/PRD/Design Doc/Work Plan creation standards"
+    size: medium
+    key-references:
+      - "ADR Method - Michael Nygard"
+      - "Design Doc Culture - Google Engineering Practices"
+      - "Single Source of Truth"
+    sections:
+      - "Templates"
+      - "Creation Decision Matrix [MANDATORY]"
+      - "ADR Creation Conditions [MANDATORY if Any Apply]"
+      - "Detailed Document Definitions"
+      - "Creation Process [MANDATORY]"
+      - "Storage Locations"
+      - "ADR Status"
+      - "AI Automation Rules [MANDATORY]"
+      - "Diagram Requirements"
+      - "Common ADR Relationships"
+  implementation-approach:
+    skill: "implementation-approach"
+    tags: [architecture, implementation, task-decomposition, strategy-patterns, strangler-pattern, facade-pattern, design, planning, verification-levels]
+    typical-use: "Implementation strategy selection, task decomposition, design decisions, large-scale change planning"
+    size: medium
+    key-references:
+      - "Strangler Fig Pattern - Martin Fowler"
+      - "Feature Slicing - Martin Fowler"
+      - "Walking Skeleton - Alistair Cockburn"
+    sections:
+      - "Meta-cognitive Strategy Selection Process [MANDATORY]"
+      - "Verification Level Definitions"
+      - "Integration Point Definitions"
+      - "Anti-patterns [MANDATORY to detect]"
+      - "Guidelines for Meta-cognitive Execution"
+  integration-e2e-testing:
+    skill: "integration-e2e-testing"
+    tags: [testing, integration-testing, e2e-testing, test-design, behavior-first, roi, test-skeleton, ears-format]
+    typical-use: "Integration and E2E test design principles, ROI-based test selection, behavior-first approach, test skeleton specification"
+    size: medium
+    key-references:
+      - "Test Pyramid - Mike Cohn"
+      - "Behavior-Driven Development"
+    sections:
+      - "References"
+      - "Test Type Definition and Limits [MANDATORY]"
+      - "Behavior-First Principle [MANDATORY]"
+      - "ROI Calculation"
+      - "Test Skeleton Specification [MANDATORY]"
+      - "EARS Format Mapping"
+      - "Test File Naming Convention"
+      - "Review Criteria"
+      - "Quality Standards [MANDATORY]"
+  subagents-orchestration-guide:
+    skill: "subagents-orchestration-guide"
+    tags: [orchestration, workflow, subagents, autonomous-execution, planning, design-flow, implementation-flow]
+    typical-use: "Orchestrating subagents through implementation workflows, scale determination, stop points, autonomous execution mode"
+    size: large
+    key-references:
+      - "Orchestrator Pattern"
+      - "Conductor Pattern"
+    sections:
+      - "Role: The Orchestrator"
+      - "Decision Flow When Receiving Tasks"
+      - "Available Subagents"
+      - "Orchestration Principles"
+      - "Constraints Between Subagents [MANDATORY]"
+      - "How to Spawn Agents"
+      - "Explicit Stop Points [MANDATORY]"
+      - "Scale Determination and Document Requirements"
+      - "Structured Response Specification"
+      - "Handling Requirement Changes"
+      - "Basic Flow for Work Planning"
+      - "Autonomous Execution Mode"
+      - "Main Orchestrator Roles"
+      - "Important Constraints [MANDATORY]"
+      - "Required Dialogue Points with Humans [MANDATORY]"
+      - "Action Checklist"
+      - "References"

package/.agents/skills/testing/SKILL.md ADDED Viewed

@@ -0,0 +1,324 @@
+---
+name: testing
+description: "Testing principles including TDD, test quality, coverage standards, and test design. Use when: writing tests, designing test strategies, reviewing test quality, or following Red-Green-Refactor cycle."
+---
+# Testing Principles
+## Language-Specific References
+For language-specific testing patterns, also read:
+- **TypeScript (Vitest/RTL/Playwright)**: [references/typescript.md](references/typescript.md)
+## Core Testing Philosophy
+1. **Tests are First-Class Code**: Maintain test quality equal to production code
+2. **Fast Feedback**: Tests should run quickly and provide immediate feedback
+3. **Reliability**: Tests should be deterministic and reproducible
+4. **Independence**: Each test should run in isolation
+## TDD Process [MANDATORY for all code changes]
+**Execute this process for every code change:**
+### RED Phase
+**STEP 1**: Write test that defines expected behavior
+**STEP 2**: Run test
+**STEP 3**: Confirm test FAILS (if it passes before the implementation exists, the test is wrong — it is not verifying the new behavior)
+### GREEN Phase
+**STEP 1**: Write MINIMAL code to make test pass
+**STEP 2**: Run test
+**STEP 3**: Confirm test PASSES
+### REFACTOR Phase
+**STEP 1**: Improve code quality (eliminate duplication, improve naming)
+**STEP 2**: Run test
+**STEP 3**: Confirm test STILL PASSES
+### VERIFY Phase [MANDATORY - 0 ERRORS REQUIRED]
+**STEP 1**: Execute ALL quality check commands for your language/project
+**STEP 2**: Fix any errors until ALL commands pass with 0 errors
+**STEP 3**: Confirm no regressions
+**ENFORCEMENT**: Cannot proceed to next phase with ANY quality check failures
+### TDD Exceptions (no TDD required)
+- Pure configuration files
+- Documentation only
+- Emergency fixes (but add tests immediately after)
+- Exploratory spikes (discard or rewrite with tests before merging)
+- Build/deployment scripts (unless they contain business logic)
+## Quality Requirements [MANDATORY]
+### Coverage Standards
+- **Minimum 80% code coverage** for production code
+- Prioritize critical paths and business logic
+- Use coverage as a guide, not a goal
+### Test Characteristics
+All tests MUST be:
+- **Independent**: No dependencies between tests
+- **Reproducible**: Same input always produces same output
+- **Fast**: Complete test suite runs in reasonable time
+- **Self-checking**: Clear pass/fail without manual verification
+- **Timely**: Written close to the code they test
+**ENFORCEMENT**: Tests failing ANY characteristic MUST be fixed immediately
+## Test Types
+### Unit Tests
+**Purpose**: Test individual components in isolation
+**Characteristics**:
+- Test single function, method, or class
+- Fast execution (milliseconds)
+- No external dependencies
+- Mock external services
+- Majority of your test suite
+### Integration Tests
+**Purpose**: Test interactions between components
+**Characteristics**:
+- Test multiple components together
+- May include database, file system, or APIs
+- Slower than unit tests
+- Verify contracts between modules
+- Smaller portion of test suite
+### End-to-End (E2E) Tests
+**Purpose**: Test complete workflows from user perspective
+**Characteristics**:
+- Test entire application stack
+- Simulate real user interactions
+- Slowest test type
+- Fewest in number
+- Highest confidence level
+### Test Pyramid
+Follow the test pyramid structure:
+```
+    /\    <- Few E2E Tests (High confidence, slow)
+   /  \
+  /    \  <- Some Integration Tests (Medium confidence, medium speed)
+ /      \
+/________\ <- Many Unit Tests (Fast, foundational)
+```
+## Test Design Principles
+### AAA Pattern (Arrange-Act-Assert)
+Structure every test in three clear phases:
+```
+// Arrange: Setup test data and conditions
+user = createTestUser()
+validator = createValidator()
+// Act: Execute the code under test
+result = validator.validate(user)
+// Assert: Verify expected outcome
+assert(result.isValid == true)
+```
+### One Assertion Per Concept
+- Test one behavior per test case
+- Multiple assertions OK if testing single concept
+- Split unrelated assertions into separate tests — one test MUST verify one behavior
+### Descriptive Test Names
+Test names should clearly describe:
+- What is being tested
+- Under what conditions
+- What the expected outcome is
+**Recommended format**: `"should [expected behavior] when [condition]"`
+## Test Independence
+### Isolation Requirements
+- Each test creates its own test data
+- No dependencies on execution order
+- Clean up own state
+- Pass when run in isolation
+### Setup and Teardown
+- Use setup hooks to prepare test environment
+- Use teardown hooks to clean up resources
+- Keep setup minimal and focused
+- Ensure teardown runs even if test fails
+## Mocking and Test Doubles
+### When to Use Mocks
+- **Mock external dependencies**: APIs, databases, file systems
+- **Mock slow operations**: Network calls, heavy computations
+- **Mock unpredictable behavior**: Random values, current time
+- **Mock unavailable services**: Third-party services
+### Mocking Principles [MANDATORY]
+- Mock at boundaries, not internally — use real implementations for internal utilities
+- Keep mocks simple and focused
+- Verify mock expectations when relevant
+- Use adapters for external libraries/frameworks you do not control
+### Types of Test Doubles
+- **Stub**: Returns predetermined values
+- **Mock**: Verifies it was called correctly
+- **Spy**: Records information about calls
+- **Fake**: Simplified working implementation
+- **Dummy**: Passed but never used
+## Test Quality Practices [MANDATORY]
+### Keep Tests Active
+- **Fix or delete failing tests**: Resolve failures immediately
+- **Remove commented-out tests**: Fix them or delete entirely
+- **Keep tests running**: Broken tests lose value quickly
+- **Maintain test suite**: Refactor tests as needed
+### Test Code Quality
+- Apply same standards as production code
+- Use descriptive variable names
+- Extract test helpers to reduce duplication
+- Keep tests readable and maintainable
+### Test Helpers and Utilities
+- Create reusable test data builders
+- Extract common setup into helper functions
+- Build test utilities for complex scenarios
+- Share helpers across test files appropriately
+## What to Test
+### Focus on Behavior
+**Test observable behavior, not implementation**:
+- Good: Test that function returns expected output
+- Good: Test that correct API endpoint is called
+- Bad: Test that internal variable was set
+- Bad: Test order of private method calls
+### Test Edge Cases
+Always test:
+- **Boundary conditions**: Min/max values, empty collections
+- **Error cases**: Invalid input, null values, missing data
+- **Edge cases**: Special characters, extreme values
+- **Happy path**: Normal, expected usage
+## Test Quality Criteria [MANDATORY]
+1. **Literal expectations**: Use hardcoded literal values in assertions — the expected value must not simply be the mock's return value, because the implementation is expected to process the data
+2. **Result verification**: Assert return values and state, not call order
+3. **Meaningful assertions**: Every test MUST have at least one assertion — a test without assertions provides zero value
+4. **Mock external I/O only**: Mock DB/API/filesystem, use real internal utilities
+5. **Boundary coverage**: Include empty/zero/max/error cases with happy paths
+**ENFORCEMENT**: Tests violating ANY criterion MUST be rewritten
+## Verification Requirements [MANDATORY for VERIFY phase]
+### Before Commit Checklist
+☐ All tests pass
+☐ No tests skipped or commented out
+☐ No debug code left in tests
+☐ Test coverage meets standards (≥ 80%)
+☐ Tests run in reasonable time
+### Zero Tolerance Policy
+- **Zero failing tests**: Fix immediately
+- **Zero skipped tests**: Delete or fix
+- **Zero flaky tests**: Make deterministic
+- **Zero slow tests**: Optimize or split
+**ENFORCEMENT**: Cannot proceed with task completion if ANY quality check fails
+## Test Organization
+### File Structure
+- **Mirror production structure**: Tests follow code organization
+- **Clear naming conventions**: Follow project's test file patterns
+- **Logical grouping**: Group related tests together
+- **Separate test types**: Unit, integration, e2e in separate directories
+### Test Suite Organization
+```
+tests/
+├── unit/           # Fast, isolated unit tests
+├── integration/    # Integration tests
+├── e2e/            # End-to-end tests
+├── fixtures/       # Test data and fixtures
+└── helpers/        # Shared test utilities
+```
+## Performance Considerations
+### Test Speed
+- **Unit tests**: < 100ms each
+- **Integration tests**: < 1s each
+- **Full suite**: Fast enough to run frequently (completes in < 10 minutes)
+## Common Anti-Patterns
+Detect and eliminate these patterns immediately:
+- Tests that test nothing (always pass)
+- Tests that depend on execution order
+- Tests that depend on external state
+- Tests with complex logic (tests that need their own tests)
+- Testing implementation details instead of observable behavior
+- Excessive mocking (mock boundaries only, use real internals)
+- Test code duplication
+### Flaky Tests
+Eliminate tests that fail intermittently:
+- Remove timing dependencies
+- Use deterministic data instead of random values
+- Ensure proper cleanup
+- Fix race conditions
+- Make all tests deterministic
+## Regression Testing
+- Add test for every bug fix
+- Maintain comprehensive test suite
+- Run full suite regularly
+- Don't delete tests without good reason
+### Legacy Code
+- Add characterization tests before refactoring
+- Test existing behavior first
+- Gradually improve coverage
+- Refactor with confidence

package/.agents/skills/testing/agents/openai.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+interface:
+  display_name: "Testing"
+  short_description: "TDD and test quality standards"
+  default_prompt: "Use $testing to guide my test implementation."
+policy:
+  allow_implicit_invocation: true