npm - @kody-ade/kody-engine-lite - Versions diffs - 0.1.28 → 0.1.29 - Mend

@kody-ade/kody-engine-lite 0.1.28 → 0.1.29

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (3)

package/README.md (changed)

@@ -2,28 +2,93 @@
 **Issue → PR in one command.** Comment `@kody` on a GitHub issue and Kody autonomously classifies, plans, builds, tests, reviews, fixes, and ships a pull request.
+Kody is a 7-stage autonomous SDLC pipeline that runs in GitHub Actions. It uses Claude Code (or any LLM via LiteLLM) to turn issues into production-ready PRs — with quality gates, AI-powered failure diagnosis, risk-based human approval, and self-improving memory.
+## Pipeline
 ```
-@kody  →  taskify → plan → build → verify → review → fix → ship  →  PR created
+                        ┌─────────────────────────────────────────────────────────┐
+                        │                    @kody on issue                        │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ① TASKIFY                                              │
+                        │  Classify task, detect complexity, ask questions         │
+                        │  Model: haiku │ Output: task.json                       │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                                    ┌────────────▼────────────┐
+                                    │  LOW?  skip to ④        │
+                                    │  MEDIUM?  continue      │
+                                    │  HIGH?  continue        │
+                                    └────────────┬────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ② PLAN                                                 │
+                        │  TDD implementation plan (deep reasoning)               │
+                        │  Model: opus │ Output: plan.md                          │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                                    ┌────────────▼────────────┐
+                                    │  HIGH risk?             │
+                                    │  🛑 Pause for approval  │──── @kody approve
+                                    └────────────┬────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ③ BUILD                                                │
+                        │  Implement code via Claude Code tools                   │
+                        │  Model: sonnet │ Output: code changes + git commit      │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ④ VERIFY                                               │
+                        │  typecheck + tests + lint                               │
+                        │  ┌──────────────────────────────────────────────┐       │
+                        │  │  Fail? → AI diagnosis → autofix → retry ×2  │       │
+                        │  └──────────────────────────────────────────────┘       │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ⑤ REVIEW                                               │
+                        │  Code review: PASS/FAIL + Critical/Major/Minor          │
+                        │  Model: opus │ Output: review.md                        │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ⑥ REVIEW-FIX                                           │
+                        │  Fix Critical and Major findings                        │
+                        │  Model: sonnet │ Output: code changes + git commit      │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │  ⑦ SHIP                                                 │
+                        │  Push branch + create PR with Closes #N                 │
+                        │  Output: ship.md + PR link                              │
+                        └────────────────────────┬────────────────────────────────┘
+                                                 │
+                        ┌────────────────────────▼────────────────────────────────┐
+                        │                ✅ PR created & ready for review          │
+                        └─────────────────────────────────────────────────────────┘
 ```
-Kody is a 7-stage autonomous SDLC pipeline that runs in GitHub Actions. It uses Claude Code (or any LLM via LiteLLM) to turn issues into production-ready PRs — with quality gates, AI-powered failure diagnosis, risk-based human approval, and self-improving memory.
+Each stage runs in a **fresh context window** with **accumulated context** from previous stages — so complex tasks (auth systems, CRUD features, API clients) don't lose track of earlier decisions.
+[Pipeline details →](docs/PIPELINE.md)
 ## Why Kody?
 Most AI coding tools are **autocomplete** (Copilot) or **chat-based** (Cursor, Cline). You still drive. Kody is different: it's an **autonomous pipeline** that takes an issue and delivers a tested, reviewed PR — even for complex, multi-file features that single-agent tools choke on.
-Single agents hit context limits on large tasks. Kody splits work into focused stages — each with a fresh context window but access to curated context from previous stages. A 27-minute auth system build (JWT, sessions, middleware, RBAC, 7 stages, 3 autofix retries) completes end-to-end without losing track.
 | | Kody | Copilot Workspace | Devin | Cursor Agent |
 |---|---|---|---|---|
 | **Runs in CI** | GitHub Actions | GitHub Cloud | Devin Cloud | Local IDE |
 | **Fire and forget** | Comment `@kody`, walk away | Must interact | Must interact | Must be open |
 | **Quality gates** | typecheck + tests + lint + AI diagnosis + auto-retry | Basic | Runs tests | Runs tests |
-| **Risk gate** | Pauses HIGH-risk tasks for human approval | No | No | No |
+| **Risk gate** | Pauses HIGH-risk for human approval | No | No | No |
 | **Model flexible** | Any LLM via LiteLLM | GitHub models only | Proprietary | Cursor models |
 | **Open source** | MIT | Proprietary | Proprietary | Proprietary |
-| **Accumulated context** | Curated context flows between stages | Single conversation | Single agent | Single agent |
-| **Complex tasks** | 27-min auth system with 7 stages + autofix | Struggles with large scope | Better | Struggles with large scope |
+| **Accumulated context** | Curated context flows between stages | Single bloated conversation | Single agent | Single agent |
+| **Complex tasks** | Full auth system: 7 stages + 3 autofix retries | Struggles with large scope | Better | Struggles with large scope |
 | **Cost** | Your API costs only | $10-39/month | $20-500/month | Subscription |
 [Full comparison →](docs/COMPARISON.md)
@@ -50,27 +115,6 @@ kody-engine-lite init
 **Prerequisites:** Node.js >= 22, [Claude Code CLI](https://docs.anthropic.com/en/docs/claude-code), [GitHub CLI](https://cli.github.com/), git
-## Pipeline
-```
-@kody on issue
-  ↓
-1. taskify   — classify task, detect complexity, ask questions     → task.json
-2. plan      — TDD implementation plan (deep reasoning)           → plan.md
-   ↓ HIGH risk? pause for human approval
-3. build     — implement code via Claude Code tools                → code changes
-4. verify    — typecheck + tests + lint (AI diagnosis + autofix)   → verify.md
-5. review    — code review: PASS/FAIL + Critical/Major/Minor      → review.md
-6. review-fix — fix Critical and Major findings                    → code changes
-7. ship      — push branch + create PR with Closes #N             → ship.md
-  ↓
-PR created
-```
-Complexity auto-detected: **low** skips plan/review (4 stages), **medium** skips review-fix (6 stages), **high** runs all 7.
-[Pipeline details →](docs/PIPELINE.md)
 ## Commands
 ### GitHub Comments
@@ -98,16 +142,16 @@ kody-engine-lite init [--force]
 - **Risk Gate** — HIGH-risk tasks pause for human plan approval before building ([details](docs/FEATURES.md#risk-gate))
 - **AI Failure Diagnosis** — classifies errors as fixable/infrastructure/pre-existing/abort before retry ([details](docs/FEATURES.md#ai-powered-failure-diagnosis))
 - **Question Gates** — asks product/architecture questions when the task is unclear ([details](docs/FEATURES.md#question-gates))
+- **Accumulated Context** — each stage passes curated context to the next — fresh window, shared knowledge ([details](docs/FEATURES.md#accumulated-context))
 - **Retrospective** — analyzes each run, identifies patterns, suggests improvements ([details](docs/FEATURES.md#retrospective-system))
 - **Auto-Learning** — extracts coding conventions from each successful run ([details](docs/FEATURES.md#auto-learning-memory))
-- **Accumulated Context** — each stage passes curated context to the next — fresh window, shared knowledge ([details](docs/FEATURES.md#accumulated-context))
 - **Any LLM** — route through LiteLLM to use MiniMax, GPT, Gemini, local models ([setup guide](docs/LITELLM.md))
 ## Documentation
 | Doc | What's in it |
 |-----|-------------|
-| [Pipeline](docs/PIPELINE.md) | Stage details, complexity skipping, artifacts, state machine |
+| [Pipeline](docs/PIPELINE.md) | Stage details, complexity skipping, accumulated context, artifacts |
 | [Features](docs/FEATURES.md) | Risk gate, diagnosis, retrospective, auto-learn, labels |
 | [LiteLLM](docs/LITELLM.md) | Non-Anthropic model setup, auto-start, tested providers |
 | [Configuration](docs/CONFIGURATION.md) | Full config reference, env vars, workflow setup |

package/dist/bin/cli.js (changed)

@@ -87,20 +87,22 @@ function checkCommand(command2, args2) {
 function createClaudeCodeRunner() {
   return {
     async run(_stageName, prompt, model, timeout, _taskDir, options) {
-      return runSubprocess(
-        "claude",
-        [
-          "--print",
-          "--model",
-          model,
-          "--dangerously-skip-permissions",
-          "--allowedTools",
-          "Bash,Edit,Read,Write,Glob,Grep"
-        ],
-        prompt,
-        timeout,
-        options
-      );
+      const args2 = [
+        "--print",
+        "--model",
+        model,
+        "--dangerously-skip-permissions",
+        "--allowedTools",
+        "Bash,Edit,Read,Write,Glob,Grep"
+      ];
+      if (options?.sessionId) {
+        if (options.resumeSession) {
+          args2.push("--resume", options.sessionId);
+        } else {
+          args2.push("--session-id", options.sessionId);
+        }
+      }
+      return runSubprocess("claude", args2, prompt, timeout, options);
     },
     async healthCheck() {
       return checkCommand("claude", ["--version"]);
@@ -824,6 +826,17 @@ var init_runner_selection = __esm({
 // src/stages/agent.ts
 import * as fs5 from "fs";
 import * as path5 from "path";
+function getSessionInfo(stageName, sessions) {
+  const group = SESSION_GROUP[stageName];
+  if (!group) return void 0;
+  const existing = sessions[group];
+  if (existing) {
+    return { sessionId: existing, resumeSession: true };
+  }
+  const newId = crypto.randomUUID();
+  sessions[group] = newId;
+  return { sessionId: newId, resumeSession: false };
+}
 function validateStageOutput(stageName, content) {
   switch (stageName) {
     case "taskify":
@@ -850,10 +863,16 @@ async function executeAgentStage(ctx, def) {
   if (config.agent.litellmUrl) {
     extraEnv.ANTHROPIC_BASE_URL = config.agent.litellmUrl;
   }
+  const sessions = ctx.sessions ?? {};
+  const sessionInfo = getSessionInfo(def.name, sessions);
+  if (sessionInfo) {
+    logger.info(`  session: ${SESSION_GROUP[def.name]} (${sessionInfo.resumeSession ? "resume" : "new"})`);
+  }
   const runner = getRunnerForStage(ctx, def.name);
   const result = await runner.run(def.name, prompt, model, def.timeout, ctx.taskDir, {
     cwd: ctx.projectDir,
-    env: extraEnv
+    env: extraEnv,
+    ...sessionInfo
   });
   if (result.outcome !== "completed") {
     return { outcome: result.outcome, error: result.error, retries: 0 };
@@ -924,6 +943,7 @@ ${summary}
 `;
   fs5.appendFileSync(contextPath, entry);
 }
+var SESSION_GROUP;
 var init_agent = __esm({
   "src/stages/agent.ts"() {
     "use strict";
@@ -932,6 +952,14 @@ var init_agent = __esm({
     init_config();
     init_runner_selection();
     init_logger();
+    SESSION_GROUP = {
+      taskify: "explore",
+      plan: "explore",
+      build: "build",
+      autofix: "build",
+      "review-fix": "build",
+      review: "review"
+    };
   }
 });
@@ -2072,6 +2100,7 @@ async function runPipelineInner(ctx) {
     state = initState(ctx.taskId);
     writeState(state, ctx.taskDir);
   }
+  ctx.sessions = state.sessions ?? {};
   if (state.state !== "running") {
     state.state = "running";
     for (const stage of STAGES) {
@@ -2159,6 +2188,7 @@ async function runPipelineInner(ctx) {
         error: isTimeout ? "Stage timed out" : result.error ?? "Stage failed"
       };
       state.state = "failed";
+      state.sessions = ctx.sessions;
       writeState(state, ctx.taskDir);
       logger.error(`[${def.name}] ${isTimeout ? "\u23F1 timed out" : `\u2717 failed: ${result.error}`}`);
       if (ctx.input.issueNumber && !ctx.input.local) {
@@ -2166,6 +2196,7 @@ async function runPipelineInner(ctx) {
       }
       break;
     }
+    state.sessions = ctx.sessions;
     writeState(state, ctx.taskDir);
   }
   const allCompleted = STAGES.every((s) => state.stages[s.name].state === "completed");

package/package.json (changed)

@@ -1,6 +1,6 @@
 {
   "name": "@kody-ade/kody-engine-lite",
-  "version": "0.1.28",
+  "version": "0.1.29",
   "description": "Autonomous SDLC pipeline: Kody orchestration + Claude Code + LiteLLM",
   "license": "MIT",
   "type": "module",