npm - @kody-ade/kody-engine-lite - Versions diffs - 0.1.29 → 0.1.31 - Mend

@kody-ade/kody-engine-lite 0.1.29 → 0.1.31

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/README.md CHANGED Viewed

@@ -1,130 +1,163 @@
 # Kody Engine Lite
-**Issue → PR in one command.** Comment `@kody` on a GitHub issue and Kody autonomously classifies, plans, builds, tests, reviews, fixes, and ships a pull request.
-Kody is a 7-stage autonomous SDLC pipeline that runs in GitHub Actions. It uses Claude Code (or any LLM via LiteLLM) to turn issues into production-ready PRs — with quality gates, AI-powered failure diagnosis, risk-based human approval, and self-improving memory.
-## Pipeline
+[![npm](https://img.shields.io/npm/v/@kody-ade/kody-engine-lite)](https://www.npmjs.com/package/@kody-ade/kody-engine-lite)
+[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE)
-```
-                        ┌─────────────────────────────────────────────────────────┐
-                        │                    @kody on issue                        │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ① TASKIFY                                              │
-                        │  Classify task, detect complexity, ask questions         │
-                        │  Model: haiku │ Output: task.json                       │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                                    ┌────────────▼────────────┐
-                                    │  LOW?  skip to ④        │
-                                    │  MEDIUM?  continue      │
-                                    │  HIGH?  continue        │
-                                    └────────────┬────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ② PLAN                                                 │
-                        │  TDD implementation plan (deep reasoning)               │
-                        │  Model: opus │ Output: plan.md                          │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                                    ┌────────────▼────────────┐
-                                    │  HIGH risk?             │
-                                    │  🛑 Pause for approval  │──── @kody approve
-                                    └────────────┬────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ③ BUILD                                                │
-                        │  Implement code via Claude Code tools                   │
-                        │  Model: sonnet │ Output: code changes + git commit      │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ④ VERIFY                                               │
-                        │  typecheck + tests + lint                               │
-                        │  ┌──────────────────────────────────────────────┐       │
-                        │  │  Fail? → AI diagnosis → autofix → retry ×2  │       │
-                        │  └──────────────────────────────────────────────┘       │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ⑤ REVIEW                                               │
-                        │  Code review: PASS/FAIL + Critical/Major/Minor          │
-                        │  Model: opus │ Output: review.md                        │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ⑥ REVIEW-FIX                                           │
-                        │  Fix Critical and Major findings                        │
-                        │  Model: sonnet │ Output: code changes + git commit      │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │  ⑦ SHIP                                                 │
-                        │  Push branch + create PR with Closes #N                 │
-                        │  Output: ship.md + PR link                              │
-                        └────────────────────────┬────────────────────────────────┘
-                                                 │
-                        ┌────────────────────────▼────────────────────────────────┐
-                        │                ✅ PR created & ready for review          │
-                        └─────────────────────────────────────────────────────────┘
-```
-Each stage runs in a **fresh context window** with **accumulated context** from previous stages — so complex tasks (auth systems, CRUD features, API clients) don't lose track of earlier decisions.
+**Issue → PR in one command.** Comment `@kody` on a GitHub issue and Kody autonomously classifies, plans, builds, tests, reviews, fixes, and ships a pull request.
-[Pipeline details →](docs/PIPELINE.md)
+Kody is a 7-stage autonomous SDLC pipeline that runs in GitHub Actions. It uses Claude Code (or any LLM via LiteLLM) to turn issues into production-ready PRs — with quality gates, AI-powered failure diagnosis, risk-based human approval, and shared context between stages.
 ## Why Kody?
-Most AI coding tools are **autocomplete** (Copilot) or **chat-based** (Cursor, Cline). You still drive. Kody is different: it's an **autonomous pipeline** that takes an issue and delivers a tested, reviewed PR — even for complex, multi-file features that single-agent tools choke on.
+Most AI coding tools are **autocomplete** (Copilot) or **chat-based** (Cursor, Cline). You still drive. Kody is an **autonomous pipeline** — comment `@kody`, walk away, come back to a PR.
 | | Kody | Copilot Workspace | Devin | Cursor Agent |
 |---|---|---|---|---|
 | **Runs in CI** | GitHub Actions | GitHub Cloud | Devin Cloud | Local IDE |
-| **Fire and forget** | Comment `@kody`, walk away | Must interact | Must interact | Must be open |
-| **Quality gates** | typecheck + tests + lint + AI diagnosis + auto-retry | Basic | Runs tests | Runs tests |
+| **Fire and forget** | Yes | No — interactive | Partially | No — IDE must be open |
+| **Pipeline stages** | 7 stages with quality gates | Plan → implement | Single agent | Single agent |
+| **Shared sessions** | Stages share Claude Code sessions (no cold starts) | Single conversation | Single conversation | Single conversation |
 | **Risk gate** | Pauses HIGH-risk for human approval | No | No | No |
+| **AI failure diagnosis** | Classifies errors before retry (fixable/infra/abort) | No | No | No |
 | **Model flexible** | Any LLM via LiteLLM | GitHub models only | Proprietary | Cursor models |
 | **Open source** | MIT | Proprietary | Proprietary | Proprietary |
-| **Accumulated context** | Curated context flows between stages | Single bloated conversation | Single agent | Single agent |
-| **Complex tasks** | Full auth system: 7 stages + 3 autofix retries | Struggles with large scope | Better | Struggles with large scope |
 | **Cost** | Your API costs only | $10-39/month | $20-500/month | Subscription |
 [Full comparison →](docs/COMPARISON.md)
+## Pipeline
+```
+  ┌─────────────────────────────────────────────────────────────┐
+  │                      @kody on issue                         │
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ① TASKIFY         Tier: cheap                              │
+  │  Classify task, detect complexity, ask questions → task.json │
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+                ┌────────────▼────────────┐
+                │  LOW?  skip to ④        │
+                │  MEDIUM?  continue      │
+                │  HIGH?  continue        │
+                └────────────┬────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ② PLAN            Tier: strong                             │
+  │  TDD implementation plan (deep reasoning)        → plan.md  │
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+                ┌────────────▼────────────┐
+                │  HIGH risk?             │
+                │  🛑 Pause for approval  │──── @kody approve
+                └────────────┬────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ③ BUILD           Tier: mid                                │
+  │  Implement code via Claude Code tools    → code + git commit│
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ④ VERIFY          (deterministic gate)                     │
+  │  typecheck + tests + lint                                   │
+  │  ┌───────────────────────────────────────────────────┐      │
+  │  │  Fail? → AI diagnosis → autofix → retry (up to 2) │      │
+  │  └───────────────────────────────────────────────────┘      │
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ⑤ REVIEW          Tier: strong                             │
+  │  Code review: PASS/FAIL + Critical/Major/Minor  → review.md │
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ⑥ REVIEW-FIX      Tier: mid                                │
+  │  Fix Critical and Major findings             → code + commit│
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │  ⑦ SHIP            (deterministic)                          │
+  │  Push branch + create PR with Closes #N       → ship.md + PR│
+  └──────────────────────────┬──────────────────────────────────┘
+                             │
+  ┌──────────────────────────▼──────────────────────────────────┐
+  │                 ✅ PR created & ready for review             │
+  └─────────────────────────────────────────────────────────────┘
+```
+**Tiers are configurable** — cheap/mid/strong map to any model via `modelMap` in config. Defaults: haiku/sonnet/opus. Route to MiniMax, GPT, Gemini, or local models via [LiteLLM](docs/LITELLM.md).
+**Shared sessions** — stages in the same group share a Claude Code session: taskify+plan (explore), build+autofix+review-fix (implementation), review (fresh perspective). No cold-start re-exploration between stages.
+[Pipeline details →](docs/PIPELINE.md)
 ## Quick Start
+**Prerequisites:** Node.js >= 22, [Claude Code CLI](https://docs.anthropic.com/en/docs/claude-code), [GitHub CLI](https://cli.github.com/), git
+### 1. Install
 ```bash
-# 1. Install
 npm install -g @kody-ade/kody-engine-lite
+```
-# 2. Set up GitHub secret
+### 2. Set up GitHub
+```bash
 gh secret set ANTHROPIC_API_KEY --repo owner/repo
-# Settings → Actions → "Allow GitHub Actions to create and approve pull requests"
+```
-# 3. Initialize (auto-detects, commits, and pushes)
+Then in GitHub: **Settings → Actions → General → "Allow GitHub Actions to create and approve pull requests"**
+### 3. Initialize
+```bash
 cd your-project
 kody-engine-lite init
+```
+This analyzes your project and generates workflow, config, memory, and labels — then commits and pushes.
+### 4. Use
-# 4. Comment on any issue
+Comment on any GitHub issue:
+```
 @kody
 ```
-`init` spawns Claude Code to analyze your project and generates: workflow file, config with auto-detected quality commands, project memory (architecture + conventions), 14 GitHub labels — then commits and pushes everything.
+### Switch to a different model (optional)
-**Prerequisites:** Node.js >= 22, [Claude Code CLI](https://docs.anthropic.com/en/docs/claude-code), [GitHub CLI](https://cli.github.com/), git
+Add `litellm-config.yaml` to route all tiers through MiniMax (or any LLM):
+```yaml
+# litellm-config.yaml
+model_list:
+  - model_name: claude-haiku-4-5-20251001
+    litellm_params:
+      model: minimax/MiniMax-M2.7-highspeed
+      api_key: os.environ/MINIMAX_API_KEY
+```
+```jsonc
+// kody.config.json — add litellmUrl
+{ "agent": { "litellmUrl": "http://localhost:4000" } }
+```
+Kody auto-starts the proxy and loads API keys from `.env`. [Full LiteLLM guide →](docs/LITELLM.md)
 ## Commands
 ### GitHub Comments
-```bash
-@kody                              # Full pipeline
-@kody approve                      # Resume after questions or risk gate
-@kody fix                          # Re-build (comment body = feedback)
-@kody rerun --from <stage>         # Resume from specific stage
-```
+| Command | What it does |
+|---------|-------------|
+| `@kody` | Run full pipeline |
+| `@kody approve` | Resume after questions or risk gate |
+| `@kody fix` | Re-run from build stage. Write feedback in the comment body — it gets injected into the build prompt |
+| `@kody rerun` | Resume from the failed or paused stage |
+| `@kody rerun --from <stage>` | Resume from a specific stage |
 ### CLI
@@ -139,20 +172,20 @@ kody-engine-lite init [--force]
 ## Key Features
+- **Shared Sessions** — stages in the same group share a Claude Code session, eliminating cold-start codebase re-exploration ([details](docs/FEATURES.md#shared-sessions))
 - **Risk Gate** — HIGH-risk tasks pause for human plan approval before building ([details](docs/FEATURES.md#risk-gate))
 - **AI Failure Diagnosis** — classifies errors as fixable/infrastructure/pre-existing/abort before retry ([details](docs/FEATURES.md#ai-powered-failure-diagnosis))
 - **Question Gates** — asks product/architecture questions when the task is unclear ([details](docs/FEATURES.md#question-gates))
-- **Accumulated Context** — each stage passes curated context to the next — fresh window, shared knowledge ([details](docs/FEATURES.md#accumulated-context))
+- **Any LLM** — route through LiteLLM to use MiniMax, GPT, Gemini, local models ([setup guide](docs/LITELLM.md))
 - **Retrospective** — analyzes each run, identifies patterns, suggests improvements ([details](docs/FEATURES.md#retrospective-system))
 - **Auto-Learning** — extracts coding conventions from each successful run ([details](docs/FEATURES.md#auto-learning-memory))
-- **Any LLM** — route through LiteLLM to use MiniMax, GPT, Gemini, local models ([setup guide](docs/LITELLM.md))
 ## Documentation
 | Doc | What's in it |
 |-----|-------------|
-| [Pipeline](docs/PIPELINE.md) | Stage details, complexity skipping, accumulated context, artifacts |
-| [Features](docs/FEATURES.md) | Risk gate, diagnosis, retrospective, auto-learn, labels |
+| [Pipeline](docs/PIPELINE.md) | Stage details, shared sessions, complexity skipping, artifacts |
+| [Features](docs/FEATURES.md) | Risk gate, diagnosis, sessions, retrospective, auto-learn, labels |
 | [LiteLLM](docs/LITELLM.md) | Non-Anthropic model setup, auto-start, tested providers |
 | [Configuration](docs/CONFIGURATION.md) | Full config reference, env vars, workflow setup |
 | [Comparison](docs/COMPARISON.md) | vs Copilot, Devin, Cursor, Cline, SWE-agent, OpenHands |

package/dist/bin/cli.js CHANGED Viewed

@@ -1034,6 +1034,7 @@ function runQualityGates(taskDir, projectRoot) {
   const cwd = projectRoot ?? process.cwd();
   const allErrors = [];
   const allSummary = [];
+  const rawOutputs = [];
   let allPass = true;
   const commands = [
     { name: "typecheck", cmd: config.quality.typecheck },
@@ -1055,10 +1056,11 @@ function runQualityGates(taskDir, projectRoot) {
       allPass = false;
       const errors = parseErrors(result.output);
       allErrors.push(...errors.map((e) => `[${name}] ${e}`));
+      rawOutputs.push({ name, output: result.output.slice(-3e3) });
     }
     allSummary.push(...extractSummary(result.output, name));
   }
-  return { pass: allPass, errors: allErrors, summary: allSummary };
+  return { pass: allPass, errors: allErrors, summary: allSummary, rawOutputs };
 }
 var init_verify_runner = __esm({
   "src/verify-runner.ts"() {
@@ -1190,6 +1192,18 @@ function executeGateStage(ctx, def) {
 `);
     for (const s of verifyResult.summary) {
       lines.push(`- ${s}
+`);
+    }
+  }
+  if (verifyResult.rawOutputs.length > 0) {
+    lines.push(`
+## Raw Output
+`);
+    for (const { name, output } of verifyResult.rawOutputs) {
+      lines.push(`### ${name}
+\`\`\`
+${output}
+\`\`\`
 `);
     }
   }
@@ -2393,21 +2407,26 @@ async function tryStartLitellm(url, projectDir) {
   }
   const portMatch = url.match(/:(\d+)/);
   const port = portMatch ? portMatch[1] : "4000";
+  let litellmFound = false;
   try {
-    execFileSync9("litellm", ["--version"], { timeout: 5e3, stdio: "pipe" });
+    execFileSync9("which", ["litellm"], { timeout: 3e3, stdio: "pipe" });
+    litellmFound = true;
   } catch {
     try {
-      execFileSync9("python3", ["-m", "litellm", "--version"], { timeout: 5e3, stdio: "pipe" });
+      execFileSync9("python3", ["-c", "import litellm"], { timeout: 1e4, stdio: "pipe" });
+      litellmFound = true;
     } catch {
-      logger.warn("litellm not installed (pip install 'litellm[proxy]')");
-      return null;
     }
   }
+  if (!litellmFound) {
+    logger.warn("litellm not installed (pip install 'litellm[proxy]')");
+    return null;
+  }
   logger.info(`Starting LiteLLM proxy on port ${port}...`);
   let cmd;
   let args2;
   try {
-    execFileSync9("litellm", ["--version"], { timeout: 5e3, stdio: "pipe" });
+    execFileSync9("which", ["litellm"], { timeout: 3e3, stdio: "pipe" });
     cmd = "litellm";
     args2 = ["--config", configPath, "--port", port];
   } catch {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@kody-ade/kody-engine-lite",
-  "version": "0.1.29",
+  "version": "0.1.31",
   "description": "Autonomous SDLC pipeline: Kody orchestration + Claude Code + LiteLLM",
   "license": "MIT",
   "type": "module",