npm - @kkelly-offical/kkcode - Versions diffs - 0.1.7 → 0.2.1 - Mend

@kkelly-offical/kkcode 0.1.7 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (163) hide show

package/LICENSE +674 -674
package/README.md +452 -387
package/package.json +50 -46
package/src/agent/agent.mjs +228 -220
package/src/agent/custom-agent-loader.mjs +6 -3
package/src/agent/generator.mjs +2 -2
package/src/agent/prompt/assistant.txt +12 -0
package/src/agent/prompt/bug-hunter.txt +89 -89
package/src/agent/prompt/frontend-designer.txt +58 -58
package/src/agent/prompt/guide.txt +1 -1
package/src/agent/prompt/longagent-blueprint-agent.txt +83 -83
package/src/agent/prompt/longagent-coding-agent.txt +37 -37
package/src/agent/prompt/longagent-debugging-agent.txt +46 -46
package/src/agent/prompt/longagent-preview-agent.txt +63 -63
package/src/command/custom-commands.mjs +2 -2
package/src/commands/agent.mjs +1 -1
package/src/commands/background.mjs +145 -4
package/src/commands/chat.mjs +117 -76
package/src/commands/config.mjs +148 -1
package/src/commands/doctor.mjs +30 -6
package/src/commands/init.mjs +32 -6
package/src/commands/longagent.mjs +117 -0
package/src/commands/mcp.mjs +275 -43
package/src/commands/permission.mjs +1 -1
package/src/commands/session.mjs +195 -140
package/src/commands/skill.mjs +63 -0
package/src/commands/theme.mjs +1 -1
package/src/config/defaults.mjs +280 -260
package/src/config/import-config.mjs +1 -1
package/src/config/load-config.mjs +61 -4
package/src/config/schema.mjs +591 -574
package/src/context.mjs +4 -1
package/src/core/constants.mjs +97 -91
package/src/core/types.mjs +1 -1
package/src/github/api.mjs +78 -78
package/src/github/auth.mjs +294 -286
package/src/github/flow.mjs +298 -298
package/src/github/workspace.mjs +225 -212
package/src/index.mjs +84 -82
package/src/knowledge/frontend-aesthetics.txt +38 -38
package/src/mcp/client-http.mjs +139 -141
package/src/mcp/client-sse.mjs +297 -288
package/src/mcp/client-stdio.mjs +534 -533
package/src/mcp/constants.mjs +2 -2
package/src/mcp/registry.mjs +498 -479
package/src/mcp/stdio-framing.mjs +135 -133
package/src/mcp/tool-result.mjs +24 -24
package/src/observability/edit-diagnostics.mjs +449 -0
package/src/observability/index.mjs +42 -42
package/src/observability/metrics.mjs +165 -137
package/src/observability/tracer.mjs +137 -137
package/src/onboarding.mjs +209 -0
package/src/orchestration/background-manager.mjs +567 -372
package/src/orchestration/background-worker.mjs +419 -305
package/src/orchestration/interruption-reason.mjs +21 -0
package/src/orchestration/longagent-manager.mjs +197 -171
package/src/orchestration/stage-scheduler.mjs +733 -728
package/src/orchestration/subagent-router.mjs +7 -1
package/src/orchestration/task-scheduler.mjs +219 -7
package/src/permission/engine.mjs +1 -1
package/src/permission/exec-policy.mjs +370 -370
package/src/permission/file-edit-policy.mjs +108 -0
package/src/permission/prompt.mjs +1 -1
package/src/permission/rules.mjs +116 -7
package/src/plugin/builtin-hooks/post-edit-format.mjs +2 -1
package/src/plugin/builtin-hooks/post-edit-typecheck.mjs +104 -40
package/src/plugin/hook-bus.mjs +19 -5
package/src/plugin/manifest-loader.mjs +222 -0
package/src/provider/anthropic.mjs +396 -390
package/src/provider/ollama.mjs +7 -1
package/src/provider/openai.mjs +382 -340
package/src/provider/retry-policy.mjs +74 -68
package/src/provider/router.mjs +242 -241
package/src/provider/sse.mjs +104 -104
package/src/provider/wizard.mjs +556 -0
package/src/repl/capability-facade.mjs +30 -0
package/src/repl/command-surface.mjs +23 -0
package/src/repl/controller-entry.mjs +40 -0
package/src/repl/core-shell.mjs +208 -0
package/src/repl/dialog-router.mjs +87 -0
package/src/repl/input-engine.mjs +76 -0
package/src/repl/keymap.mjs +7 -0
package/src/repl/operator-surface.mjs +15 -0
package/src/repl/permission-flow.mjs +49 -0
package/src/repl/runtime-facade.mjs +36 -0
package/src/repl/slash-router.mjs +62 -0
package/src/repl/state-store.mjs +29 -0
package/src/repl/turn-controller.mjs +58 -0
package/src/repl/verification.mjs +23 -0
package/src/repl.mjs +3368 -2981
package/src/rules/load-rules.mjs +3 -3
package/src/runtime.mjs +1 -1
package/src/session/agent-transaction.mjs +86 -0
package/src/session/checkpoint.mjs +302 -302
package/src/session/compaction.mjs +298 -298
package/src/session/engine.mjs +417 -232
package/src/session/longagent-4stage.mjs +467 -460
package/src/session/longagent-hybrid.mjs +1344 -1097
package/src/session/longagent-plan.mjs +376 -365
package/src/session/longagent-project-memory.mjs +53 -53
package/src/session/longagent-scaffold.mjs +291 -291
package/src/session/longagent-task-bus.mjs +138 -54
package/src/session/longagent-utils.mjs +828 -472
package/src/session/longagent.mjs +911 -900
package/src/session/loop.mjs +1005 -930
package/src/session/prompt/agent.txt +25 -25
package/src/session/prompt/anthropic.txt +150 -150
package/src/session/prompt/beast.txt +1 -1
package/src/session/prompt/plan.txt +31 -31
package/src/session/prompt/qwen.txt +46 -46
package/src/session/recovery.mjs +21 -0
package/src/session/rollback.mjs +196 -195
package/src/session/routing-observability.mjs +72 -0
package/src/session/runtime-state.mjs +47 -0
package/src/session/store.mjs +523 -519
package/src/session/system-prompt.mjs +308 -273
package/src/session/task-validator.mjs +267 -267
package/src/session/usability-gates.mjs +2 -2
package/src/skill/builtin/commit.mjs +64 -64
package/src/skill/builtin/design.mjs +76 -76
package/src/skill/generator.mjs +18 -2
package/src/skill/registry.mjs +642 -390
package/src/storage/audit-store.mjs +18 -11
package/src/storage/event-log.mjs +7 -1
package/src/storage/ghost-commit-store.mjs +243 -245
package/src/storage/paths.mjs +13 -0
package/src/theme/default-theme.mjs +1 -1
package/src/theme/markdown.mjs +4 -0
package/src/theme/schema.mjs +1 -1
package/src/theme/status-bar.mjs +162 -158
package/src/tool/audit-wrapper.mjs +18 -2
package/src/tool/edit-transaction.mjs +23 -0
package/src/tool/executor.mjs +26 -1
package/src/tool/file-read-state.mjs +65 -0
package/src/tool/git-auto.mjs +526 -526
package/src/tool/git-full-auto.mjs +487 -478
package/src/tool/mutation-guard.mjs +54 -0
package/src/tool/prompt/edit.txt +3 -3
package/src/tool/prompt/multiedit.txt +1 -0
package/src/tool/prompt/notebookedit.txt +2 -1
package/src/tool/prompt/patch.txt +25 -24
package/src/tool/prompt/read.txt +3 -3
package/src/tool/prompt/sysinfo.txt +29 -0
package/src/tool/prompt/task.txt +66 -4
package/src/tool/prompt/write.txt +2 -2
package/src/tool/question-prompt.mjs +99 -93
package/src/tool/registry.mjs +1701 -1343
package/src/tool/task-tool.mjs +14 -6
package/src/ui/activity-renderer.mjs +667 -664
package/src/ui/repl-background-panel.mjs +7 -0
package/src/ui/repl-capability-panel.mjs +9 -0
package/src/ui/repl-dashboard.mjs +54 -4
package/src/ui/repl-help.mjs +110 -0
package/src/ui/repl-operator-panel.mjs +12 -0
package/src/ui/repl-route-feedback.mjs +35 -0
package/src/ui/repl-status-view.mjs +76 -0
package/src/ui/repl-task-panel.mjs +5 -0
package/src/ui/repl-transcript-panel.mjs +56 -0
package/src/ui/repl-turn-summary.mjs +135 -0
package/src/usage/pricing.mjs +122 -121
package/src/usage/usage-meter.mjs +1 -0
package/src/util/git.mjs +562 -519
package/src/util/template.mjs +6 -1

package/src/session/system-prompt.mjs CHANGED Viewed

@@ -1,273 +1,308 @@
-import { readFile, access } from "node:fs/promises"
-import { execSync } from "node:child_process"
-import path from "node:path"
-import { fileURLToPath } from "node:url"
-import { createHash } from "node:crypto"
-import { loadSessionPrompt } from "./prompt-loader.mjs"
-import { getAgentPrompt, listAgents } from "../agent/agent.mjs"
-import { loadAutoMemory } from "./memory-loader.mjs"
-const __dirname = path.dirname(fileURLToPath(import.meta.url))
-const TOOL_PROMPT_DIR = path.join(__dirname, "..", "tool", "prompt")
-const toolPromptCache = new Map()
-// Session-level block cache: avoids rebuilding identical blocks across turns
-// Key = hash of inputs, Value = { blocks, text, timestamp }
-let blockCache = { key: null, result: null }
-function hashInputs(obj) {
-  return createHash("md5").update(JSON.stringify(obj)).digest("hex")
-}
-async function loadToolPrompt(name) {
-  if (!toolPromptCache.has(name)) {
-    try {
-      const file = path.join(TOOL_PROMPT_DIR, `${name}.txt`)
-      const text = (await readFile(file, "utf8")).trim()
-      toolPromptCache.set(name, text)
-    } catch {
-      toolPromptCache.set(name, "")
-    }
-  }
-  return toolPromptCache.get(name)
-}
-// Detect if cwd is a git repo
-function detectGitRepo(cwd) {
-  try {
-    execSync("git rev-parse --is-inside-work-tree", { cwd, stdio: "pipe", timeout: 3000 })
-    return true
-  } catch {
-    return false
-  }
-}
-// Detect the user's default shell
-function detectShell() {
-  if (process.platform === "win32") {
-    // On Windows, kkcode uses bash (git bash / WSL) internally
-    return "bash (use Unix shell syntax, not Windows — e.g., /dev/null not NUL, forward slashes in paths)"
-  }
-  const shell = process.env.SHELL || "/bin/bash"
-  return path.basename(shell)
-}
-// Layer 1: Environment information (dynamic per turn — changes with cwd/date)
-export function environmentPrompt({ model, cwd }) {
-  const isGit = detectGitRepo(cwd)
-  const shell = detectShell()
-  const today = new Date().toISOString().slice(0, 10)
-  const lines = [
-    `<env>`,
-    `  model: ${model}`,
-    `  cwd: ${cwd}`,
-    `  platform: ${process.platform}`,
-    `  shell: ${shell}`,
-    `  node: ${process.version}`,
-    `  date: ${today}`,
-    `  git_repo: ${isGit}`,
-    `</env>`,
-    ``,
-    `Knowledge cutoff: early 2025. Current date: ${today}.`,
-    `When searching for recent information, use the current year (${today.slice(0, 4)}) in queries.`
-  ]
-  return lines.join("\n")
-}
-// Layer 2: System prompt (model-specific — stable across session)
-export async function providerPromptByModel(model) {
-  const m = String(model).toLowerCase()
-  if (m.includes("claude")) return loadSessionPrompt("anthropic.txt")
-  if (m.includes("gpt-5") || m.includes("codex")) return loadSessionPrompt("beast.txt")
-  if (m.includes("gpt") || m.includes("o1") || m.includes("o3")) return loadSessionPrompt("beast.txt")
-  if (m.includes("gemini")) return loadSessionPrompt("qwen.txt")
-  if (m.includes("deepseek")) return loadSessionPrompt("qwen.txt")
-  if (m.includes("qwen")) return loadSessionPrompt("qwen.txt")
-  return loadSessionPrompt("qwen.txt")
-}
-// Layer 3: Agent-specific prompt (stable across session)
-export async function agentPrompt(agent) {
-  if (!agent) return ""
-  return getAgentPrompt(agent.name)
-}
-// Layer 4: Mode reminder (stable within mode)
-export async function modeReminder(mode) {
-  if (mode === "plan") return loadSessionPrompt("plan.txt")
-  if (mode === "agent") return loadSessionPrompt("agent.txt")
-  return ""
-}
-// Layer 5: Tool descriptions (stable across session — ideal cache target)
-export async function toolDescriptions(tools) {
-  if (!tools || !tools.length) return ""
-  const descriptions = []
-  for (const tool of tools) {
-    const prompt = await loadToolPrompt(tool.name)
-    if (prompt) {
-      descriptions.push(`## ${tool.name}\n${prompt}`)
-    }
-  }
-  if (!descriptions.length) return ""
-  return `# Available Tools\n\n${descriptions.join("\n\n")}`
-}
-// Layer 6: User custom instructions (loaded externally via instruction-loader.mjs and rules)
-// Assembled in loop.mjs from loadInstructions() and renderRulesPrompt()
-/**
- * Build system prompt as structured blocks for provider-level cache optimization.
- *
- * Returns { text, blocks } where:
- * - text: single concatenated string (for providers that don't support block-level caching)
- * - blocks: array of { label, text, cacheable } objects
- *
- * Cache strategy:
- * - Blocks marked cacheable=true are stable across turns (provider/agent/tools/skills)
- * - Blocks marked cacheable=false are dynamic per turn (env/user instructions)
- * - Providers use this to place cache_control breakpoints optimally
- *
- * Anthropic: up to 4 cache breakpoints — place on stable blocks
- * OpenAI: automatic prefix caching — stable blocks should come first
- */
-export async function buildSystemPromptBlocks({ mode, model, cwd, agent = null, tools = [], skills = [], userInstructions = "", projectContext = "", language = "en" }) {
-  // Cache key: hash of all inputs that affect block content
-  const cacheKey = hashInputs({
-    mode, model, cwd, language,
-    agent: agent?.name || null,
-    tools: tools.map(t => t.name).sort(),
-    skills: skills.map(s => s.name).sort(),
-    userInstructions: userInstructions.slice(0, 200) // first 200 chars as fingerprint
-  })
-  if (blockCache.key === cacheKey && blockCache.result) {
-    // Only env block changes per turn — rebuild just that
-    const cached = blockCache.result
-    const envIdx = cached.blocks.findIndex(b => b.label === "env")
-    if (envIdx >= 0) {
-      const freshEnv = environmentPrompt({ model, cwd })
-      if (cached.blocks[envIdx].text === freshEnv) {
-        return cached // fully identical
-      }
-      // Clone and update only the env block
-      const updatedBlocks = cached.blocks.map((b, i) =>
-        i === envIdx ? { ...b, text: freshEnv } : b
-      )
-      const text = updatedBlocks.map(b => b.text).join("\n\n")
-      const result = { text, blocks: updatedBlocks }
-      blockCache = { key: cacheKey, result }
-      return result
-    }
-  }
-  const blocks = []
-  // Block 0: Provider prompt (stable — loaded once per model)
-  const providerText = await providerPromptByModel(model)
-  if (providerText) {
-    blocks.push({ label: "provider", text: providerText, cacheable: true })
-  }
-  // Block 1: Agent prompt (stable — loaded once per agent)
-  const agentText = agent ? await getAgentPrompt(agent.name) : ""
-  if (agentText) {
-    blocks.push({ label: "agent", text: agentText, cacheable: true })
-  }
-  // Block 2: Mode reminder (stable within mode)
-  const modeText = await modeReminder(mode)
-  if (modeText) {
-    blocks.push({ label: "mode", text: modeText, cacheable: true })
-  }
-  // Block 3: Tool descriptions (stable — changes only when tools change)
-  const toolText = await toolDescriptions(tools)
-  if (toolText) {
-    blocks.push({ label: "tools", text: toolText, cacheable: true })
-  }
-  // Block 3.5: Large output strategy (stable — always included)
-  const outputStrategyLines = [
-    "# Large Output Strategy",
-    "",
-    "When generating large amounts of content:",
-    "- For large file creation, write no more than 200 lines per tool call; use append mode for subsequent chunks",
-    "- For partial file edits, use patch with line ranges instead of rewriting the whole file",
-    "- If a task requires more than 300 lines of code, proactively split into multiple sequential tool calls",
-    "- Never attempt to write an entire large file in a single tool call"
-  ]
-  blocks.push({ label: "output_strategy", text: outputStrategyLines.join("\n"), cacheable: true })
-  // Block 4: Skills descriptions (stable — changes only when skills change)
-  if (skills.length) {
-    const skillLines = skills.map((s) => `- /${s.name}: ${s.description || s.name}`).join("\n")
-    const skillText = `# Available Skills\n\nInvoke with /<skill-name> [arguments].\n\n${skillLines}`
-    blocks.push({ label: "skills", text: skillText, cacheable: true })
-  }
-  // Block 4.5: Available sub-agents (stable — changes only when custom agents change)
-  const allAgents = listAgents({ includeHidden: false })
-  const customSubagents = allAgents.filter((a) => a.mode === "subagent" && a._customAgent)
-  if (customSubagents.length) {
-    const agentLines = customSubagents.map((a) => {
-      const perms = a.permission === "readonly" ? " (read-only)" : a.permission === "full" ? " (full access)" : ""
-      return `- ${a.name}: ${a.description}${perms}`
-    })
-    const subagentText = [
-      "# Available Sub-agents",
-      "",
-      "Delegate specialized work to these sub-agents using the `task` tool with `subagent_type` parameter.",
-      "Use sub-agents when a task is self-contained and would benefit from a specialist, or to save context window space.",
-      "",
-      ...agentLines
-    ].join("\n")
-    blocks.push({ label: "subagents", text: subagentText, cacheable: true })
-  }
-  // Block 4.7: Project context (semi-stable — changes when cwd changes)
-  if (projectContext) {
-    blocks.push({ label: "project", text: projectContext, cacheable: false })
-  }
-  // Block 4.9: Language constraint (stable — changes only when config changes)
-  if (language && language !== "en") {
-    const langMap = {
-      zh: "Always respond in Chinese (中文). Use Chinese for all explanations, comments, and communications. Technical terms, code identifiers, and code content should remain in their original form (typically English)."
-    }
-    const langText = langMap[language]
-    if (langText) {
-      blocks.push({ label: "language", text: `# Language\n\n${langText}`, cacheable: true })
-    }
-  }
-  // Block 4.95: Auto Memory (semi-stable — changes when user updates memory files)
-  const memoryText = await loadAutoMemory(cwd)
-  if (memoryText) {
-    blocks.push({ label: "memory", text: memoryText, cacheable: false })
-  }
-  // Block 5: Environment (dynamic per turn)
-  const envText = environmentPrompt({ model, cwd })
-  blocks.push({ label: "env", text: envText, cacheable: false })
-  // Block 6: User instructions + rules (semi-stable — cacheable if unchanged between turns)
-  if (userInstructions) {
-    blocks.push({ label: "user", text: userInstructions, cacheable: false })
-  }
-  const text = blocks.map((b) => b.text).join("\n\n")
-  const result = { text, blocks }
-  blockCache = { key: cacheKey, result }
-  return result
-}
-// Legacy flat assembly (kept for backward compatibility)
-export async function buildSystemPromptLayers({ mode, model, cwd, agent = null }) {
-  const layer1 = environmentPrompt({ model, cwd })
-  const layer2 = await providerPromptByModel(model)
-  const layer3 = await agentPrompt(agent)
-  const layer4 = await modeReminder(mode)
-  return { layer1, layer2, layer3, layer4 }
-}
+import { readFile, access } from "node:fs/promises"
+import { execSync } from "node:child_process"
+import path from "node:path"
+import { fileURLToPath } from "node:url"
+import { createHash } from "node:crypto"
+import { loadSessionPrompt } from "./prompt-loader.mjs"
+import { renderPublicModeContract } from "./engine.mjs"
+import { getAgentPrompt, listAgents } from "../agent/agent.mjs"
+import { loadAutoMemory } from "./memory-loader.mjs"
+const __dirname = path.dirname(fileURLToPath(import.meta.url))
+const TOOL_PROMPT_DIR = path.join(__dirname, "..", "tool", "prompt")
+const toolPromptCache = new Map()
+// Session-level block cache: avoids rebuilding identical blocks across turns
+// Key = hash of inputs, Value = { blocks, text, timestamp }
+let blockCache = { key: null, result: null }
+function hashInputs(obj) {
+  return createHash("md5").update(JSON.stringify(obj)).digest("hex")
+}
+async function loadToolPrompt(name) {
+  if (!toolPromptCache.has(name)) {
+    try {
+      const file = path.join(TOOL_PROMPT_DIR, `${name}.txt`)
+      const text = (await readFile(file, "utf8")).trim()
+      toolPromptCache.set(name, text)
+    } catch {
+      toolPromptCache.set(name, "")
+    }
+  }
+  return toolPromptCache.get(name)
+}
+// Detect if cwd is a git repo
+function detectGitRepo(cwd) {
+  try {
+    execSync("git rev-parse --is-inside-work-tree", { cwd, stdio: "pipe", timeout: 3000 })
+    return true
+  } catch {
+    return false
+  }
+}
+// Detect the user's default shell
+function detectShell() {
+  if (process.platform === "win32") {
+    // On Windows, kkcode uses bash (git bash / WSL) internally
+    return "bash (use Unix shell syntax, not Windows — e.g., /dev/null not NUL, forward slashes in paths)"
+  }
+  const shell = process.env.SHELL || "/bin/bash"
+  return path.basename(shell)
+}
+// Layer 1: Environment information (dynamic per turn — changes with cwd/date)
+export function environmentPrompt({ model, cwd }) {
+  const isGit = detectGitRepo(cwd)
+  const shell = detectShell()
+  const today = new Date().toISOString().slice(0, 10)
+  const lines = [
+    `<env>`,
+    `  model: ${model}`,
+    `  cwd: ${cwd}`,
+    `  platform: ${process.platform}`,
+    `  shell: ${shell}`,
+    `  node: ${process.version}`,
+    `  date: ${today}`,
+    `  git_repo: ${isGit}`,
+    `</env>`,
+    ``,
+    `Knowledge cutoff: early 2025. Current date: ${today}.`,
+    `When searching for recent information, use the current year (${today.slice(0, 4)}) in queries.`
+  ]
+  return lines.join("\n")
+}
+// Layer 2: System prompt (model-specific — stable across session)
+export async function providerPromptByModel(model) {
+  const m = String(model).toLowerCase()
+  if (m.includes("claude")) return loadSessionPrompt("anthropic.txt")
+  if (m.includes("gpt-5") || m.includes("codex")) return loadSessionPrompt("beast.txt")
+  if (m.includes("gpt") || m.includes("o1") || m.includes("o3")) return loadSessionPrompt("beast.txt")
+  if (m.includes("gemini")) return loadSessionPrompt("qwen.txt")
+  if (m.includes("deepseek")) return loadSessionPrompt("qwen.txt")
+  if (m.includes("qwen")) return loadSessionPrompt("qwen.txt")
+  return loadSessionPrompt("qwen.txt")
+}
+// Layer 3: Agent-specific prompt (stable across session)
+export async function agentPrompt(agent) {
+  if (!agent) return ""
+  return getAgentPrompt(agent.name)
+}
+// Layer 4: Mode reminder (stable within mode)
+export async function modeReminder(mode) {
+  const contractBlock = renderPublicModeContract()
+  if (mode === "assistant") return `${contractBlock}\n\nAssistant mode active. Treat this as the default CLI personal assistant lane for bounded terminal-native work: local files, logs, system checks, web lookup, Git/GitHub assistance, notes, task organization, and lightweight automation. Escalate to agent/code for explicit coding mutations and to longagent for staged multi-file delivery.`
+  if (mode === "plan") return `${contractBlock}\n\n${await loadSessionPrompt("plan.txt")}`
+  if (mode === "agent") return `${contractBlock}\n\n${await loadSessionPrompt("agent.txt")}\n\nCoding lane active. Focus on inspect/patch/verify coding work, keep diffs small, and validate with the narrowest useful tests.`
+  if (mode === "longagent") {
+    return `${contractBlock}\n\nLongAgent mode active. Treat this as the heavyweight staged delivery lane for multi-file or system-level work. Keep explicit gates, ownership, and recovery behavior intact.`
+  }
+  return contractBlock
+}
+// Layer 5: Tool descriptions (stable across session — ideal cache target)
+export async function toolDescriptions(tools) {
+  if (!tools || !tools.length) return ""
+  const descriptions = []
+  for (const tool of tools) {
+    const prompt = await loadToolPrompt(tool.name)
+    if (prompt) {
+      descriptions.push(`## ${tool.name}\n${prompt}`)
+    }
+  }
+  if (!descriptions.length) return ""
+  return `# Available Tools\n\n${descriptions.join("\n\n")}`
+}
+// Layer 6: User custom instructions (loaded externally via instruction-loader.mjs and rules)
+// Assembled in loop.mjs from loadInstructions() and renderRulesPrompt()
+/**
+ * Build system prompt as structured blocks for provider-level cache optimization.
+ *
+ * Returns { text, blocks } where:
+ * - text: single concatenated string (for providers that don't support block-level caching)
+ * - blocks: array of { label, text, cacheable } objects
+ *
+ * Cache strategy:
+ * - Blocks marked cacheable=true are stable across turns (provider/agent/tools/skills)
+ * - Blocks marked cacheable=false are dynamic per turn (env/user instructions)
+ * - Providers use this to place cache_control breakpoints optimally
+ *
+ * Anthropic: up to 4 cache breakpoints — place on stable blocks
+ * OpenAI: automatic prefix caching — stable blocks should come first
+ */
+export async function buildSystemPromptBlocks({ mode, model, cwd, agent = null, tools = [], skills = [], userInstructions = "", projectContext = "", language = "en" }) {
+  // Cache key: hash of all inputs that affect block content
+  const cacheKey = hashInputs({
+    mode, model, cwd, language,
+    agent: agent?.name || null,
+    tools: tools.map(t => t.name).sort(),
+    skills: skills.map(s => s.name).sort(),
+    userInstructions: hashInputs({ ui: userInstructions }) // hash full string to avoid collisions
+  })
+  if (blockCache.key === cacheKey && blockCache.result) {
+    // Only env block changes per turn — rebuild just that
+    const cached = blockCache.result
+    const envIdx = cached.blocks.findIndex(b => b.label === "env")
+    if (envIdx >= 0) {
+      const freshEnv = environmentPrompt({ model, cwd })
+      if (cached.blocks[envIdx].text === freshEnv) {
+        return cached // fully identical
+      }
+      // Clone and update only the env block
+      const updatedBlocks = cached.blocks.map((b, i) =>
+        i === envIdx ? { ...b, text: freshEnv } : b
+      )
+      const text = updatedBlocks.map(b => b.text).join("\n\n")
+      const result = { text, blocks: updatedBlocks }
+      blockCache = { key: cacheKey, result }
+      return result
+    }
+  }
+  const blocks = []
+  // Block 0: Provider prompt (stable — loaded once per model)
+  const providerText = await providerPromptByModel(model)
+  if (providerText) {
+    blocks.push({ label: "provider", text: providerText, cacheable: true })
+  }
+  // Block 1: Agent prompt (stable — loaded once per agent)
+  const agentText = agent ? await getAgentPrompt(agent.name) : ""
+  if (agentText) {
+    blocks.push({ label: "agent", text: agentText, cacheable: true })
+  }
+  // Block 2: Mode reminder (stable within mode)
+  const modeText = await modeReminder(mode)
+  if (modeText) {
+    blocks.push({ label: "mode", text: modeText, cacheable: true })
+  }
+  // Block 3: Tool descriptions (stable — changes only when tools change)
+  const toolText = await toolDescriptions(tools)
+  if (toolText) {
+    blocks.push({ label: "tools", text: toolText, cacheable: true })
+  }
+  // Block 3.5: Large output strategy (stable — always included)
+  const outputStrategyLines = [
+    "# Large Output Strategy",
+    "",
+    "When generating large amounts of content:",
+    "- For large file creation, write no more than 200 lines per tool call; use append mode for subsequent chunks",
+    "- For partial file edits, use patch with line ranges instead of rewriting the whole file",
+    "- If a task requires more than 300 lines of code, proactively split into multiple sequential tool calls",
+    "- Never attempt to write an entire large file in a single tool call"
+  ]
+  blocks.push({ label: "output_strategy", text: outputStrategyLines.join("\n"), cacheable: true })
+  // Block 4: CLI assistant contract (stable — release-facing behavior boundary)
+  const assistantContractLines = [
+    "# CLI Assistant Contract",
+    "",
+    "Operate as a CLI-first personal assistant, not an IDE shell or GUI automation product.",
+    "",
+    "Prefer the lightest path that completes the next step well:",
+    "- answer directly for short questions",
+    "- treat assistant as the default lane for bounded terminal-native personal assistant work",
+    "- treat agent/code/coding as the dedicated lane for coding mutation, debugging, refactoring, and test repair",
+    "- handle small local inspect/run/summarize tasks without over-upgrading to heavyweight execution",
+    "- continue an interrupted local transaction when the follow-up still fits the same bounded scope",
+    "- reserve longagent-style behavior for structured multi-file or system-level delivery with explicit heavy evidence",
+    "",
+    "Current safe capability boundary:",
+    "- coding and patching",
+    "- local filesystem, config, and log inspection",
+    "- shell/task execution",
+    "- repo/release assistance",
+    "- web lookup/fetch",
+    "- bounded delegated sidecar work",
+    "",
+    "Do not imply unsupported product surfaces such as GUI desktop automation, IDE integration, marketplace installs, or remote bridge platforms."
+  ]
+  blocks.push({ label: "assistant_contract", text: assistantContractLines.join("\n"), cacheable: true })
+  // Block 4.5: Public mode contract (stable — keeps assistant/plan/agent/longagent aligned)
+  blocks.push({ label: "mode_contract", text: renderPublicModeContract(), cacheable: true })
+  // Block 5: Skills descriptions (stable — changes only when skills change)
+  if (skills.length) {
+    const skillLines = skills.map((s) => `- /${s.name}: ${s.description || s.name}`).join("\n")
+    const skillText = `# Available Skills\n\nInvoke with /<skill-name> [arguments].\n\n${skillLines}`
+    blocks.push({ label: "skills", text: skillText, cacheable: true })
+  }
+  // Block 5.5: Available sub-agents (stable — changes only when custom agents change)
+  const allAgents = listAgents({ includeHidden: false })
+  const customSubagents = allAgents.filter((a) => a.mode === "subagent" && a._customAgent)
+  if (customSubagents.length) {
+    const agentLines = customSubagents.map((a) => {
+      const perms = a.permission === "readonly" ? " (read-only)" : a.permission === "full" ? " (full access)" : ""
+      return `- ${a.name}: ${a.description}${perms}`
+    })
+    const subagentText = [
+      "# Available Sub-agents",
+      "",
+      "Delegate specialized work to these sub-agents using the `task` tool with `subagent_type` parameter.",
+      "Use sub-agents when a task is self-contained and would benefit from a specialist, or to save context window space.",
+      "",
+      ...agentLines
+    ].join("\n")
+    blocks.push({ label: "subagents", text: subagentText, cacheable: true })
+  }
+  // Block 5.7: Project context (semi-stable — changes when cwd changes)
+  if (projectContext) {
+    blocks.push({ label: "project", text: projectContext, cacheable: false })
+  }
+  // Block 5.9: Language constraint (stable — changes only when config changes)
+  if (language && language !== "en") {
+    const langMap = {
+      zh: "Always respond in Chinese (中文). Use Chinese for all explanations, comments, and communications. Technical terms, code identifiers, and code content should remain in their original form (typically English)."
+    }
+    const langText = langMap[language]
+    if (langText) {
+      blocks.push({ label: "language", text: `# Language\n\n${langText}`, cacheable: true })
+    }
+  }
+  // Block 5.95: Auto Memory (semi-stable — changes when user updates memory files)
+  const memoryText = await loadAutoMemory(cwd)
+  if (memoryText) {
+    blocks.push({ label: "memory", text: memoryText, cacheable: false })
+  }
+  // Block 5: Environment (dynamic per turn)
+  const envText = environmentPrompt({ model, cwd })
+  blocks.push({ label: "env", text: envText, cacheable: false })
+  // Block 6: User instructions + rules (semi-stable — cacheable if unchanged between turns)
+  if (userInstructions) {
+    blocks.push({ label: "user", text: userInstructions, cacheable: false })
+  }
+  const text = blocks.map((b) => b.text).join("\n\n")
+  const result = { text, blocks }
+  blockCache = { key: cacheKey, result }
+  return result
+}
+// Legacy flat assembly (kept for backward compatibility)
+export async function buildSystemPromptLayers({ mode, model, cwd, agent = null }) {
+  const layer1 = environmentPrompt({ model, cwd })
+  const layer2 = await providerPromptByModel(model)
+  const layer3 = await agentPrompt(agent)
+  const layer4 = await modeReminder(mode)
+  return { layer1, layer2, layer3, layer4 }
+}