npm - @kody-ade/engine - Versions diffs - 0.1.0 - Mend

@kody-ade/engine 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93) hide show

package/LICENSE +21 -0
package/README.md +322 -0
package/dist/agent-runner.d.ts +4 -0
package/dist/agent-runner.js +122 -0
package/dist/bin/cli.js +11276 -0
package/dist/ci/parse-inputs.d.ts +6 -0
package/dist/ci/parse-inputs.js +76 -0
package/dist/ci/parse-safety.d.ts +6 -0
package/dist/ci/parse-safety.js +22 -0
package/dist/cli/args.d.ts +13 -0
package/dist/cli/args.js +42 -0
package/dist/cli/litellm.d.ts +2 -0
package/dist/cli/litellm.js +85 -0
package/dist/cli/task-resolution.d.ts +2 -0
package/dist/cli/task-resolution.js +41 -0
package/dist/config.d.ts +49 -0
package/dist/config.js +72 -0
package/dist/context.d.ts +4 -0
package/dist/context.js +83 -0
package/dist/definitions.d.ts +3 -0
package/dist/definitions.js +59 -0
package/dist/entry.d.ts +1 -0
package/dist/entry.js +236 -0
package/dist/git-utils.d.ts +13 -0
package/dist/git-utils.js +174 -0
package/dist/github-api.d.ts +14 -0
package/dist/github-api.js +114 -0
package/dist/kody-utils.d.ts +1 -0
package/dist/kody-utils.js +9 -0
package/dist/learning/auto-learn.d.ts +2 -0
package/dist/learning/auto-learn.js +169 -0
package/dist/logger.d.ts +14 -0
package/dist/logger.js +51 -0
package/dist/memory.d.ts +1 -0
package/dist/memory.js +20 -0
package/dist/observer.d.ts +9 -0
package/dist/observer.js +80 -0
package/dist/pipeline/complexity.d.ts +3 -0
package/dist/pipeline/complexity.js +12 -0
package/dist/pipeline/executor-registry.d.ts +3 -0
package/dist/pipeline/executor-registry.js +20 -0
package/dist/pipeline/hooks.d.ts +17 -0
package/dist/pipeline/hooks.js +110 -0
package/dist/pipeline/questions.d.ts +2 -0
package/dist/pipeline/questions.js +44 -0
package/dist/pipeline/runner-selection.d.ts +2 -0
package/dist/pipeline/runner-selection.js +13 -0
package/dist/pipeline/state.d.ts +4 -0
package/dist/pipeline/state.js +37 -0
package/dist/pipeline.d.ts +3 -0
package/dist/pipeline.js +213 -0
package/dist/preflight.d.ts +1 -0
package/dist/preflight.js +69 -0
package/dist/retrospective.d.ts +26 -0
package/dist/retrospective.js +211 -0
package/dist/stages/agent.d.ts +2 -0
package/dist/stages/agent.js +94 -0
package/dist/stages/gate.d.ts +2 -0
package/dist/stages/gate.js +32 -0
package/dist/stages/review.d.ts +2 -0
package/dist/stages/review.js +32 -0
package/dist/stages/ship.d.ts +3 -0
package/dist/stages/ship.js +154 -0
package/dist/stages/verify.d.ts +2 -0
package/dist/stages/verify.js +94 -0
package/dist/types.d.ts +61 -0
package/dist/types.js +1 -0
package/dist/validators.d.ts +8 -0
package/dist/validators.js +42 -0
package/dist/verify-runner.d.ts +11 -0
package/dist/verify-runner.js +110 -0
package/kody.config.schema.json +299 -0
package/package.json +39 -0
package/prompts/autofix.md +52 -0
package/prompts/build.md +26 -0
package/prompts/decompose.md +77 -0
package/prompts/plan.md +65 -0
package/prompts/review-fix.md +27 -0
package/prompts/review.md +115 -0
package/prompts/taskify-ticket.md +122 -0
package/prompts/taskify.md +70 -0
package/templates/kody-watch.yml +57 -0
package/templates/kody.yml +450 -0
package/templates/watch-agents/branch-cleanup/agent.json +7 -0
package/templates/watch-agents/branch-cleanup/agent.md +13 -0
package/templates/watch-agents/dependency-checker/agent.json +7 -0
package/templates/watch-agents/dependency-checker/agent.md +14 -0
package/templates/watch-agents/readme-health/agent.json +7 -0
package/templates/watch-agents/readme-health/agent.md +17 -0
package/templates/watch-agents/stale-pr-reviewer/agent.json +7 -0
package/templates/watch-agents/stale-pr-reviewer/agent.md +13 -0
package/templates/watch-agents/todo-scanner/agent.json +7 -0
package/templates/watch-agents/todo-scanner/agent.md +10 -0

package/prompts/review.md ADDED Viewed

@@ -0,0 +1,115 @@
+---
+name: review
+description: Review code changes for correctness, security, and quality
+mode: primary
+tools: [read, glob, grep, bash]
+---
+You are a code review agent following the Superpowers Structured Review methodology.
+Use Bash to see what changed. For PR reviews, check the Task Context below for a `Diff Command` section with the correct `git diff origin/<base>...HEAD` command. If no diff command is provided, run `git diff HEAD~1`. Do NOT use bare `git diff` — it shows only uncommitted working tree changes, not the actual code changes. Use Read to examine modified files in full context.
+When the diff introduces new enum values, status strings, or type constants — use Grep to trace ALL consumers outside the diff.
+CRITICAL: You MUST output a structured review in the EXACT format below. Do NOT output conversational text, status updates, or summaries. Your entire output must be the structured review markdown.
+Output markdown with this EXACT structure:
+## Verdict: PASS | FAIL
+## Summary
+<1-2 sentence summary of what was changed and why>
+## Findings
+### Critical
+<If none: "None.">
+### Major
+<If none: "None.">
+### Minor
+<If none: "None.">
+For each finding use: `file:line` — problem description. Suggested fix.
+---
+## Two-Pass Review
+**Pass 1 — CRITICAL (must fix before merge):**
+### SQL & Data Safety
+- String interpolation in SQL — use parameterized queries even for `.to_i`/`.to_f` values
+- TOCTOU races: check-then-set patterns that should be a single atomic conditional update (`UPDATE ... WHERE <expected state>`)
+- Bypassing model validations via direct DB writes (e.g., `update_column`, raw queries)
+- N+1 queries: missing eager loading for associations used in loops/views
+### Race Conditions & Concurrency
+- Read-check-write without uniqueness constraint or duplicate key handling
+- find-or-create without unique DB index — concurrent calls create duplicates
+- Status transitions without an atomic compare-and-set (`UPDATE ... SET status = <new_status> WHERE status = <old_status>`)
+- Unsafe HTML rendering (`dangerouslySetInnerHTML`, `v-html`, `.html_safe`) on user-controlled data (XSS)
+### LLM Output Trust Boundary
+- LLM-generated values (emails, URLs, names) written to DB without format validation
+- Structured tool output accepted without type/shape checks before DB writes
+- LLM-generated URLs fetched without allowlist — SSRF risk
+- LLM output stored in vector DBs without sanitization — stored prompt injection risk
+### Shell Injection
+- `subprocess.run()` / `os.system()` with `shell=True` AND string interpolation — use argument arrays
+- `eval()` / `exec()` on LLM-generated code without sandboxing
+### Enum & Value Completeness
+When the diff introduces a new enum value, status string, tier name, or type constant:
+- Trace it through every consumer (READ each file that switches/filters on that value)
+- Check allowlists/filter arrays containing sibling values
+- Check `case`/`if-elsif` chains — does the new value fall through to a wrong default?
+**Pass 2 — INFORMATIONAL (should review, may auto-fix):**
+### Conditional Side Effects
+- Code paths that branch but forget a side effect on one branch (e.g., promoted but URL only attached conditionally)
+- Log messages claiming an action happened when it was conditionally skipped
+### Test Gaps
+- Negative-path tests asserting type/status but not side effects
+- Security enforcement features (blocking, rate limiting, auth) without integration tests
+- Missing `.expects(:something).never` when a path should NOT call an external service
+### Dead Code & Consistency
+- Variables assigned but never read
+- Comments/docstrings describing old behavior after code changed
+- Version mismatch between PR title and VERSION/CHANGELOG
+### Crypto & Entropy
+- Truncation instead of hashing — less entropy, easier collisions
+- `rand()` / `Math.random()` for security-sensitive values — use crypto-secure alternatives
+- Non-constant-time comparisons (`==`) on secrets or tokens — timing attack risk
+### Performance & Bundle Impact
+- Known-heavy dependencies added: moment.js (→ date-fns), full lodash (→ lodash-es), jquery
+- Images without `loading="lazy"` or explicit dimensions (CLS)
+- `useEffect` fetch waterfalls — combine or parallelize
+- Synchronous `<script>` without async/defer
+### Type Coercion at Boundaries
+- Values crossing language/serialization boundaries where type could change (numeric vs string)
+- Hash/digest inputs without `.toString()` normalization before serialization
+---
+## Severity Definitions
+- **Critical**: Security vulnerability, data loss, application crash, broken authentication, injection risk, race condition. MUST fix before merge.
+- **Major**: Logic error, missing edge case, broken test, significant performance issue, missing input validation, enum completeness gap. SHOULD fix before merge.
+- **Minor**: Style issue, naming improvement, readability, micro-optimization, stale comments. NICE to fix, not blocking.
+## Suppressions — do NOT flag these:
+- Redundancy that aids readability
+- "Add a comment explaining this threshold" — thresholds change, comments rot
+- Consistency-only changes with no behavioral impact
+- Issues already addressed in the diff you are reviewing — read the FULL diff first
+- devDependencies additions (no production impact)
+{{TASK_CONTEXT}}

package/prompts/taskify-ticket.md ADDED Viewed

@@ -0,0 +1,122 @@
+You are a task decomposition agent. Your job is to break down a product spec into scoped, independently implementable tasks.
+## Input
+{{#if TICKET_ID}}
+**Mode: ticket**
+Use the available MCP tools to fetch ticket **{{TICKET_ID}}**.
+Read everything: title, description, acceptance criteria, sub-tasks, linked issues, attachments.
+{{/if}}
+{{#if FILE_CONTENT}}
+**Mode: file**
+The product spec is provided below:
+```
+{{FILE_CONTENT}}
+```
+{{/if}}
+{{#if ISSUE_BODY}}
+**Mode: issue**
+The task description from the GitHub issue is provided below. Decompose it into scoped, independently implementable sub-tasks.
+```
+{{ISSUE_BODY}}
+```
+{{/if}}
+{{#if PROJECT_CONTEXT}}
+## Existing codebase
+Use this to avoid suggesting things that already exist and to follow established conventions.
+{{PROJECT_CONTEXT}}
+{{/if}}
+## Decomposition rules
+Break the spec into implementation tasks where each task:
+- Can be implemented and reviewed independently in a single PR
+- Has clear, testable acceptance criteria
+- Contains all the context a developer needs — no references back to the original ticket
+- Is labeled appropriately (e.g. "frontend", "backend", "database", "infra")
+Each task body must follow this structure:
+```
+## Context
+Why this task exists and how it fits the bigger picture.
+## Acceptance Criteria
+Bulleted list of what "done" looks like.
+## Test Strategy
+What to test and how — unit tests, integration tests, manual verification steps.
+```
+Sizing guide:
+- A task touching 1–3 files with clear requirements = right size
+- A task requiring design decisions or touching many subsystems = too large, split it
+- A task that is just a config change or a one-liner = too small, merge with a related task
+Priority guidance — assign `priority` to each task:
+- `high` — blocks other tasks or delivers the ticket's core value
+- `medium` — important but not blocking
+- `low` — polish, edge cases, nice-to-have
+Dependency guidance — use `dependsOn` to express ordering:
+- If implementing task B requires task A's code to exist first, set `dependsOn: [indexOfA]` (0-based index into the tasks array).
+- If a task has no dependencies, omit `dependsOn` or use `[]`.
+{{#if FEEDBACK}}
+## Answers to previous questions
+The product team has provided the following answers:
+{{FEEDBACK}}
+Use these answers to resolve any previous ambiguities. Do NOT ask questions again — proceed directly to task decomposition.
+{{/if}}
+## Output
+Write ONLY to: `{{TASK_DIR}}/taskify-result.json`
+Do not write any other files. Do not print anything to stdout.
+The file must be valid JSON matching exactly one of these two schemas:
+**Schema A — tasks ready:**
+```json
+{
+  "status": "ready",
+  "tasks": [
+    {
+      "title": "string (max 72 chars, actionable verb phrase e.g. 'Add OAuth login with Google')",
+      "body": "string (full markdown spec with required sections: ## Context, ## Acceptance Criteria, ## Test Strategy)",
+      "labels": ["optional", "array", "of", "label", "strings"],
+      "priority": "high | medium | low",
+      "dependsOn": [0, 2]
+    }
+  ]
+}
+```
+**Schema B — clarifications needed:**
+```json
+{
+  "status": "questions",
+  "questions": ["string", "..."]
+}
+```
+Rules:
+- Maximum 3 questions. Only ask what genuinely cannot be determined from the spec.
+- Task titles must be actionable verb phrases ("Add X", "Fix Y", "Implement Z", "Migrate X to Y").
+- Each task body must be self-contained and include ## Context, ## Acceptance Criteria, and ## Test Strategy sections.
+- Labels are for categorization only — not implementation details.
+- `priority` must be one of: `high`, `medium`, `low`.
+- `dependsOn` uses 0-based indices into the tasks array. Omit or use `[]` if there are no dependencies.
+- If the spec is already small enough for a single PR, output one task.
+- Maximum 20 tasks. Consolidate related ones if needed.

package/prompts/taskify.md ADDED Viewed

@@ -0,0 +1,70 @@
+---
+name: taskify
+description: Classify and structure a task from free-text description
+mode: primary
+tools: [read, glob, grep]
+---
+You are a task classification agent following the Superpowers Brainstorming methodology.
+## MANDATORY: Explore Before Classifying
+Before classifying, you MUST explore the project context:
+1. **Examine the codebase** — Use Read, Glob, and Grep to understand project structure, existing patterns, and affected files.
+2. **Find existing solutions** — Search for how similar problems are already solved in this codebase. If a pattern exists, the task should reuse it.
+3. **Challenge assumptions** — Does the task description assume an approach? Are there simpler alternatives? Apply YAGNI ruthlessly.
+4. **Identify ambiguity** — Could the requirements be interpreted two ways? Are there missing edge case decisions?
+## Output
+Output ONLY valid JSON. No markdown fences. No explanation. No extra text before or after the JSON.
+Required JSON format:
+{
+  "task_type": "feature | bugfix | refactor | docs | chore",
+  "title": "Brief title, max 72 characters",
+  "description": "Clear description of what the task requires",
+  "scope": ["list", "of", "exact/file/paths", "affected"],
+  "risk_level": "low | medium | high",
+  "existing_patterns": ["list of existing patterns found that the implementation should reuse"],
+  "questions": []
+}
+Risk level heuristics:
+- low: single file change, no breaking changes, docs, config, isolated scripts, test additions, style changes
+- medium: 2-3 files, possible side effects, API changes, new dependencies, refactoring existing logic, adding a new utility/middleware with tests
+- high: 4+ files across multiple directories, core business logic, data migrations, security, authentication, payment processing, database schema changes, cross-cutting concerns, system redesigns
+existing_patterns rules:
+- List patterns found in the codebase that are relevant to this task
+- Include the file path and a brief description of the pattern
+- If no relevant patterns exist, use an empty array []
+- These inform the planner — reuse existing solutions, don't invent new ones
+Questions rules (Superpowers Brainstorming discipline):
+- ONLY ask product/requirements questions — things you CANNOT determine by reading code
+- Ask about: unclear scope, missing acceptance criteria, ambiguous user behavior, missing edge case decisions
+- Challenge assumptions — if the task implies an approach, consider simpler alternatives
+- Check for ambiguity — could requirements be interpreted two ways?
+- Do NOT ask about technical implementation — that is the planner's job
+- Do NOT ask about things you can find by reading the codebase (file structure, frameworks, patterns)
+- If the task is clear and complete, leave questions as an empty array []
+- Maximum 3 questions — only the most important ones
+Good questions: "Should the search be case-sensitive?", "Which users should have access?", "Should this work offline?"
+Bad questions: "What framework should I use?", "Where should I put the file?", "What's the project structure?"
+If the task is already implemented (files exist, tests pass):
+- Still output valid JSON — never output plain text
+- Set task_type to "chore"
+- Set risk_level to "low"
+- Set title to "Verify existing implementation of <feature>"
+- Set description to explain that the work already exists and what was verified
+- Set scope to the existing file paths
+Guidelines:
+- scope must contain exact file paths (use Glob to discover them)
+- title must be actionable ("Add X", "Fix Y", "Refactor Z")
+- description should capture the intent, not just restate the title
+{{TASK_CONTEXT}}

package/templates/kody-watch.yml ADDED Viewed

@@ -0,0 +1,57 @@
+# Kody watch workflow: runs on a 30-minute schedule and can also be started manually.
+name: kody-watch
+on:
+  workflow_dispatch:
+    inputs:
+      # Manual runs may opt into a dry run; the input defaults to false.
+      dry_run:
+        description: 'Run without executing actions'
+        type: boolean
+        default: false
+  schedule:
+    - cron: '*/30 * * * *'
+# All runs share one concurrency group; a newer run does not cancel one already in progress.
+concurrency:
+  cancel-in-progress: false
+  group: kody-watch
+jobs:
+  watch:
+    # Single job, capped at 15 minutes, with read access to contents and write access to issues.
+    timeout-minutes: 15
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      issues: write
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-node@v4
+        with:
+          node-version: 22
+      # Claude Code is installed only when at least one .kody/watch/agents/*/agent.json file exists.
+      - name: Install Claude Code
+        run: npm install -g @anthropic-ai/claude-code
+        if: hashFiles('.kody/watch/agents/*/agent.json') != ''
+      # NOTE(review): this template is published inside @kody-ade/engine, yet the
+      # step installs @kody-ade/kody-engine-lite — confirm the package name is intended.
+      - name: Install Kody Engine
+        run: npm install -g @kody-ade/kody-engine-lite
+      - name: Export project secrets
+        env:
+          ALL_SECRETS: ${{ toJSON(secrets) }}
+        run: |
+          # Re-export every repository secret, except the built-in GITHUB_TOKEN, as an
+          # environment variable for the steps that follow. The token key is matched
+          # case-insensitively so it is skipped however the secrets context spells it.
+          printf '%s\n' "$ALL_SECRETS" | jq -r 'to_entries[] | select(.key | test("^(GITHUB_TOKEN)$"; "i") | not) | @json' | while IFS= read -r entry; do
+            KEY=$(printf '%s' "$entry" | jq -r '.key')
+            VALUE=$(printf '%s' "$entry" | jq -r '.value')
+            # Use a random heredoc delimiter: a predictable one could appear on its own
+            # line inside a secret value, ending the block early and letting the rest
+            # of the value define additional variables.
+            DELIM="KODY_EOF_$(dd if=/dev/urandom bs=15 count=1 status=none | base64)"
+            # printf (not echo) so values such as "-n" or "-e" are written verbatim.
+            {
+              printf '%s<<%s\n' "$KEY" "$DELIM"
+              printf '%s\n' "$VALUE"
+              printf '%s\n' "$DELIM"
+            } >> "$GITHUB_ENV"
+          done
+      - name: Run Kody Watch
+        env:
+          GH_TOKEN: ${{ github.token }}
+          REPO: ${{ github.repository }}
+          WATCH_DIGEST_ISSUE: ${{ vars.WATCH_DIGEST_ISSUE }}
+          DRY_RUN: ${{ inputs.dry_run || 'false' }}
+        # `inputs.dry_run` is a real boolean in the `inputs` context, so it is compared
+        # with `true`. Comparing it with the string 'true' is always false under the
+        # expression language's loose-equality coercion, which meant --dry-run was
+        # never passed. On scheduled runs the input is empty and the flag is omitted.
+        run: npx kody-engine-lite watch ${{ inputs.dry_run == true && '--dry-run' || '' }}