npm - kc-beta - Versions diffs - 0.7.5 → 0.8.3 - Mend

kc-beta 0.7.5 → 0.8.3

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (81) hide show

package/README.md +47 -0
package/package.json +3 -2
package/src/agent/context.js +17 -1
package/src/agent/engine.js +467 -100
package/src/agent/llm-client.js +24 -1
package/src/agent/pipelines/_advance-hints.js +92 -0
package/src/agent/pipelines/_milestone-derive.js +325 -20
package/src/agent/pipelines/skill-authoring.js +49 -3
package/src/agent/tools/agent-tool.js +2 -2
package/src/agent/tools/consult-skill.js +15 -0
package/src/agent/tools/dashboard-render.js +48 -1
package/src/agent/tools/document-parse.js +31 -2
package/src/agent/tools/phase-advance.js +17 -13
package/src/agent/tools/release.js +343 -7
package/src/agent/tools/sandbox-exec.js +65 -8
package/src/agent/tools/worker-llm-call.js +95 -15
package/src/agent/workspace.js +25 -4
package/src/cli/components.js +4 -1
package/src/cli/index.js +125 -8
package/src/config.js +19 -2
package/src/marathon/driver.js +217 -0
package/src/marathon/prompts.js +93 -0
package/template/.env.template +17 -1
package/template/AGENT.md +2 -2
package/template/skills/en/auto-model-selection/SKILL.md +55 -35
package/template/skills/en/bootstrap-workspace/SKILL.md +27 -0
package/template/skills/en/compliance-judgment/SKILL.md +14 -0
package/template/skills/en/confidence-system/SKILL.md +30 -8
package/template/skills/en/corner-case-management/SKILL.md +53 -33
package/template/skills/en/cross-document-verification/SKILL.md +88 -83
package/template/skills/en/dashboard-reporting/SKILL.md +91 -66
package/template/skills/en/dashboard-reporting/scripts/generate_dashboard.py +1 -1
package/template/skills/en/data-sensibility/SKILL.md +19 -12
package/template/skills/en/document-chunking/SKILL.md +99 -15
package/template/skills/en/entity-extraction/SKILL.md +14 -4
package/template/skills/en/quality-control/SKILL.md +23 -0
package/template/skills/en/rule-extraction/SKILL.md +92 -94
package/template/skills/en/rule-extraction/references/chunking-strategies.md +7 -78
package/template/skills/en/skill-authoring/SKILL.md +85 -2
package/template/skills/en/skill-creator/SKILL.md +25 -3
package/template/skills/en/skill-to-workflow/SKILL.md +73 -1
package/template/skills/en/task-decomposition/SKILL.md +1 -1
package/template/skills/en/tree-processing/SKILL.md +1 -1
package/template/skills/en/version-control/SKILL.md +15 -0
package/template/skills/en/work-decomposition/SKILL.md +52 -32
package/template/skills/phase_skills.yaml +5 -0
package/template/skills/zh/auto-model-selection/SKILL.md +54 -33
package/template/skills/zh/bootstrap-workspace/SKILL.md +27 -0
package/template/skills/zh/compliance-judgment/SKILL.md +51 -37
package/template/skills/zh/compliance-judgment/references/output-format.md +62 -62
package/template/skills/zh/confidence-system/SKILL.md +34 -9
package/template/skills/zh/corner-case-management/SKILL.md +71 -104
package/template/skills/zh/cross-document-verification/SKILL.md +90 -195
package/template/skills/zh/cross-document-verification/references/contradiction-taxonomy.md +36 -36
package/template/skills/zh/dashboard-reporting/SKILL.md +82 -232
package/template/skills/zh/dashboard-reporting/scripts/generate_dashboard.py +1 -1
package/template/skills/zh/data-sensibility/SKILL.md +13 -0
package/template/skills/zh/document-chunking/SKILL.md +101 -18
package/template/skills/zh/document-parsing/SKILL.md +65 -65
package/template/skills/zh/document-parsing/references/parser-catalog.md +26 -26
package/template/skills/zh/entity-extraction/SKILL.md +78 -68
package/template/skills/zh/evolution-loop/references/convergence-guide.md +38 -38
package/template/skills/zh/quality-control/SKILL.md +23 -0
package/template/skills/zh/quality-control/references/qa-layers.md +65 -65
package/template/skills/zh/quality-control/references/sampling-strategies.md +49 -49
package/template/skills/zh/rule-extraction/SKILL.md +199 -188
package/template/skills/zh/rule-extraction/references/chunking-strategies.md +5 -78
package/template/skills/zh/skill-authoring/SKILL.md +136 -58
package/template/skills/zh/skill-authoring/references/skill-format-spec.md +39 -39
package/template/skills/zh/skill-creator/SKILL.md +215 -201
package/template/skills/zh/skill-creator/references/schemas.md +60 -60
package/template/skills/zh/skill-to-workflow/SKILL.md +73 -1
package/template/skills/zh/skill-to-workflow/references/worker-llm-catalog.md +24 -24
package/template/skills/zh/task-decomposition/SKILL.md +1 -1
package/template/skills/zh/task-decomposition/references/decision-matrix.md +54 -54
package/template/skills/zh/tree-processing/SKILL.md +67 -63
package/template/skills/zh/version-control/SKILL.md +15 -0
package/template/skills/zh/version-control/references/trace-id-spec.md +34 -34
package/template/skills/zh/work-decomposition/SKILL.md +52 -30
package/template/workflows/common/llm_client.py +168 -0
package/template/workflows/common/utils.py +132 -0

package/README.md CHANGED Viewed

@@ -21,12 +21,59 @@ npm install -g kc-beta
 kc-beta onboard      # configure provider + API key
 cd my-project        # a folder containing rules/ and samples/
 kc-beta              # launch the agent
+# v0.8.1+ unattended runs: type the slash command inside the kc-beta TUI
+> /marathon Verify the new regulation against samples/. Iterate twice. If
+  most workflows work with regex, build another version using tier1+tier2
+  worker LLMs more aggressively.
+# Marathon mode chains turns automatically. /marathon off disengages.
+# /marathon status shows the driver state.
 ```
 Requires **Node.js 20+**. See [QUICKSTART.md](./QUICKSTART.md) for the full setup walkthrough.
 ---
+## v0.8 Highlights
+- **`/marathon <goal>` slash command** (v0.8.1; replaces the v0.8.0
+  separate-process `kc-marathon` CLI). Activates an inline driver inside
+  the running kc-beta TUI. The goal is embedded in the command. Use
+  `/marathon off` to disengage manually and `/marathon status` to inspect.
+  F5 one-phase-per-prompt stays enabled for interactive sessions and is
+  bypassed cleanly when marathon is active. The status bar shows
+  `🏃 MARATHON` only when active — no clutter in normal mode. v0.8.0's
+  separate-process driver was scrapped after E2E #11 found that drivers
+  died silently when their parent terminal closed (SIGHUP unhandled).
+- **Skill usage counter** — passive Layer-B measurement of which skills
+  the engine actually ships to the LLM. `skill_byte_send` events go to
+  events.jsonl; the audit script aggregates per-phase × per-skill.
+  Agent-blind by design.
+- **`worker_llm_call` batch mode** — `prompts: [...]` array input with
+  concurrency control (default 5, max 10). Pairs with a canonical
+  `workflows/common/llm_client.py` shim (taught in `skill-to-workflow`)
+  so distilled workflows route through the engine where possible and
+  log to `output/llm_ledger.jsonl` when they don't.
+- **`sandbox_exec` timeout model** — default 120s (was 30s); per-call
+  `timeout_ms` up to 600s for known-slow commands. Configurable via
+  `KC_EXEC_DEFAULT_TIMEOUT_MS` + `KC_EXEC_MAX_TIMEOUT_MS`.
+- **Prescriptive phase-advance hints** — refusal messages now name
+  concrete next-action artifacts (`workflows/<rule_id>/workflow_v1.py`,
+  `output/results/production_qc_results.json`, etc.) rather than only
+  reporting descriptive `engineCounts`.
+- **`check.py` substantiveness audit** — the engine detects stub-shaped
+  `rule_skills/<id>/check.py` files (NOT_APPLICABLE-only returns with no
+  workflow delegation). Surfaced in milestones; opt-in enforcement via
+  `KC_ENFORCE_CHECK_PY_SUBSTANTIVE=1`.
+Plus engine-fix carryover from the v0.7.5 audit cycle: H3 calibration
+aggregator schema, milestone-derivation gaps (review_001.json +
+multi-path coverage_report.md), VLM runtime hardcode (workspace .env
+overlay), heap_mb periodic-write fix, stale release detection, taskboard
+skill availability in every phase. Full list: see DEV_LOG v0.8 entry.
+---
 ## What It Does
 KC drives a single coding agent through seven phases:

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "kc-beta",
-  "version": "0.7.5",
+  "version": "0.8.3",
   "description": "KC Agent — LLM document verification agent (pure Node.js CLI). Dual-licensed: PolyForm Noncommercial 1.0.0 for personal/noncommercial use; commercial license required for enterprise production. See LICENSE and LICENSE-COMMERCIAL.md.",
   "type": "module",
   "bin": {
@@ -18,7 +18,8 @@
   ],
   "scripts": {
     "build:meme": "node scripts/build-meme.js",
-    "prepublishOnly": "node scripts/build-meme.js"
+    "prepublishOnly": "node scripts/build-meme.js",
+    "test": "node scripts/run-tests.js"
   },
   "homepage": "https://github.com/kitchen-engineer42/kc-cli",
   "repository": {

package/src/agent/context.js CHANGED Viewed

@@ -152,10 +152,26 @@ export class ContextAssembler {
    * @param {string} [opts.projectMemory] - v0.7.0 B3: rules/PATTERNS.md
    *   content. Capped at ~5 KB by the caller. Surfaced for phases the
    *   work-decomposition skill operates in (skill_authoring + skill_testing).
+   * @param {string} [opts.marathonGoal] - v0.8.2 P12-A: the active marathon
+   *   goal text. Pinned at the system-prompt layer (never windowed) for the
+   *   duration of the marathon session. Surfaced only when marathon mode is
+   *   active; absent otherwise. Fixes the v0.8.1 regression where the goal
+   *   user_message got evicted by context_windowed before distillation, so
+   *   agents reverted to default behavior mid-run.
    * @returns {string}
    */
-  build({ agentMd, pipelineState, workspaceState, skillIndex, projectMemory } = {}) {
+  build({ agentMd, pipelineState, workspaceState, skillIndex, projectMemory, marathonGoal } = {}) {
     const parts = [AGENT_IDENTITY];
+    if (marathonGoal) {
+      parts.push(
+        "## Marathon goal (pinned for the duration of this session)\n\n" +
+        marathonGoal.trim() + "\n\n" +
+        "You are running in marathon mode — no manual user check-ins between " +
+        "phases. This goal is your north star; keep returning to it as you " +
+        "advance through the pipeline. If a continuation prompt focuses on " +
+        "phase mechanics, the goal above tells you *why*.",
+      );
+    }
     if (agentMd) parts.push(agentMd);
     if (skillIndex) parts.push(skillIndex);
     if (projectMemory) {