npm - jeo-code - Versions diffs - 0.1.0 → 0.4.5 - Mend

jeo-code 0.1.0 → 0.4.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (177) hide show

package/README.ja.md +160 -0
package/README.ko.md +160 -0
package/README.md +115 -297
package/README.zh.md +160 -0
package/package.json +11 -6
package/scripts/install.sh +28 -28
package/scripts/uninstall.sh +17 -15
package/src/AGENTS.md +50 -0
package/src/agent/AGENTS.md +49 -0
package/src/agent/bash-fixups.ts +103 -0
package/src/agent/compaction.ts +410 -19
package/src/agent/config-schema.ts +119 -5
package/src/agent/context-files.ts +314 -17
package/src/agent/dev/AGENTS.md +36 -0
package/src/agent/dev/advanced-analyzer.ts +12 -0
package/src/agent/dev/evolution-bridge.ts +82 -0
package/src/agent/dev/evolution-logger.ts +41 -0
package/src/agent/dev/self-analysis.ts +64 -0
package/src/agent/dev/self-improve.ts +24 -0
package/src/agent/dev/spec-automation.ts +49 -0
package/src/agent/engine.ts +808 -54
package/src/agent/hooks.ts +273 -0
package/src/agent/loop.ts +21 -1
package/src/agent/memory.ts +201 -0
package/src/agent/model-recency.ts +32 -0
package/src/agent/output-minimizer.ts +108 -0
package/src/agent/output-util.ts +64 -0
package/src/agent/plan.ts +187 -0
package/src/agent/seed.ts +52 -0
package/src/agent/session.ts +235 -21
package/src/agent/state.ts +286 -39
package/src/agent/step-budget.ts +232 -0
package/src/agent/subagents.ts +223 -26
package/src/agent/task-tool.ts +272 -0
package/src/agent/todo-tool.ts +87 -0
package/src/agent/tokenizer.ts +117 -0
package/src/agent/tool-registry.ts +54 -0
package/src/agent/tools.ts +624 -103
package/src/agent/web-search.ts +538 -0
package/src/ai/AGENTS.md +44 -0
package/src/ai/index.ts +1 -0
package/src/ai/model-catalog-compat.ts +3 -1
package/src/ai/model-catalog.ts +74 -9
package/src/ai/model-discovery.ts +215 -17
package/src/ai/model-manager.ts +346 -32
package/src/ai/model-picker.ts +1 -1
package/src/ai/model-registry.ts +4 -2
package/src/ai/pricing.ts +84 -0
package/src/ai/provider-registry.ts +23 -0
package/src/ai/provider-status.ts +60 -16
package/src/ai/providers/AGENTS.md +42 -0
package/src/ai/providers/anthropic.ts +250 -31
package/src/ai/providers/antigravity.ts +219 -0
package/src/ai/providers/errors.ts +15 -1
package/src/ai/providers/gemini.ts +196 -13
package/src/ai/providers/ollama.ts +37 -7
package/src/ai/providers/openai-responses.ts +173 -0
package/src/ai/providers/openai.ts +64 -12
package/src/ai/sse.ts +4 -1
package/src/ai/types.ts +18 -1
package/src/auth/AGENTS.md +41 -0
package/src/auth/callback-server.ts +6 -1
package/src/auth/flows/AGENTS.md +32 -0
package/src/auth/flows/antigravity.ts +151 -0
package/src/auth/flows/google-project.ts +190 -0
package/src/auth/flows/google.ts +39 -18
package/src/auth/flows/index.ts +15 -5
package/src/auth/flows/openai.ts +2 -2
package/src/auth/oauth.ts +8 -0
package/src/auth/refresh.ts +44 -27
package/src/auth/storage.ts +149 -26
package/src/auth/types.ts +1 -1
package/src/autopilot.ts +362 -0
package/src/bun-imports.d.ts +4 -0
package/src/cli/AGENTS.md +39 -0
package/src/cli/runner.ts +148 -14
package/src/cli.ts +13 -4
package/src/commands/AGENTS.md +40 -0
package/src/commands/approve.ts +62 -3
package/src/commands/auth.ts +167 -25
package/src/commands/chat.ts +37 -8
package/src/commands/deep-interview.ts +633 -175
package/src/commands/doctor.ts +84 -37
package/src/commands/evolve-core.ts +18 -0
package/src/commands/evolve.ts +2 -1
package/src/commands/export.ts +176 -0
package/src/commands/gjc.ts +52 -0
package/src/commands/launch.ts +3549 -240
package/src/commands/mcp.ts +3 -3
package/src/commands/ooo-seed.ts +19 -0
package/src/commands/ralplan.ts +253 -35
package/src/commands/resume.ts +1 -1
package/src/commands/session.ts +183 -0
package/src/commands/setup-helpers.ts +10 -3
package/src/commands/setup.ts +57 -16
package/src/commands/skills.ts +78 -18
package/src/commands/state.ts +198 -0
package/src/commands/status.ts +84 -0
package/src/commands/team.ts +340 -212
package/src/commands/ultragoal.ts +122 -61
package/src/commands/update.ts +244 -0
package/src/ledger.ts +270 -0
package/src/mcp/AGENTS.md +38 -0
package/src/mcp/server.ts +115 -14
package/src/mcp/tools.ts +42 -22
package/src/md-modules.d.ts +4 -0
package/src/prompts/AGENTS.md +41 -0
package/src/prompts/agents/AGENTS.md +35 -0
package/src/prompts/agents/architect.md +35 -0
package/src/prompts/agents/critic.md +37 -0
package/src/prompts/agents/executor.md +36 -0
package/src/prompts/agents/planner.md +37 -0
package/src/prompts/skills/AGENTS.md +36 -0
package/src/prompts/skills/deep-dive/AGENTS.md +31 -0
package/src/prompts/skills/deep-dive/SKILL.md +13 -0
package/src/prompts/skills/deep-interview/AGENTS.md +31 -0
package/src/prompts/skills/deep-interview/SKILL.md +12 -0
package/src/prompts/skills/gjc/AGENTS.md +31 -0
package/src/prompts/skills/gjc/SKILL.md +15 -0
package/src/prompts/skills/ralplan/AGENTS.md +31 -0
package/src/prompts/skills/ralplan/SKILL.md +11 -0
package/src/prompts/skills/team/AGENTS.md +31 -0
package/src/prompts/skills/team/SKILL.md +11 -0
package/src/prompts/skills/ultragoal/AGENTS.md +31 -0
package/src/prompts/skills/ultragoal/SKILL.md +11 -0
package/src/skills/AGENTS.md +38 -0
package/src/skills/catalog.ts +565 -31
package/src/tui/AGENTS.md +43 -0
package/src/tui/app.ts +1181 -92
package/src/tui/components/AGENTS.md +42 -0
package/src/tui/components/ascii-art.ts +257 -15
package/src/tui/components/autocomplete.ts +98 -16
package/src/tui/components/autopilot-status.ts +65 -0
package/src/tui/components/category-index.ts +49 -0
package/src/tui/components/code-view.ts +54 -11
package/src/tui/components/color.ts +171 -2
package/src/tui/components/config-panel.ts +82 -15
package/src/tui/components/duration.ts +38 -0
package/src/tui/components/evolution.ts +3 -3
package/src/tui/components/footer.ts +91 -42
package/src/tui/components/forge.ts +426 -31
package/src/tui/components/hints.ts +54 -0
package/src/tui/components/hud.ts +73 -0
package/src/tui/components/index.ts +4 -0
package/src/tui/components/input-box.ts +150 -0
package/src/tui/components/layout.ts +11 -3
package/src/tui/components/live-model-picker.ts +108 -0
package/src/tui/components/markdown-table.ts +140 -0
package/src/tui/components/markdown-text.ts +97 -0
package/src/tui/components/meter.ts +4 -1
package/src/tui/components/model-picker.ts +3 -2
package/src/tui/components/provider-picker.ts +3 -2
package/src/tui/components/section.ts +70 -0
package/src/tui/components/select-list.ts +40 -10
package/src/tui/components/skill-picker.ts +25 -0
package/src/tui/components/slash.ts +244 -21
package/src/tui/components/status.ts +272 -11
package/src/tui/components/step-timeline.ts +218 -0
package/src/tui/components/stream.ts +26 -9
package/src/tui/components/themes.ts +212 -6
package/src/tui/components/todo-card.ts +47 -0
package/src/tui/components/tool-list.ts +58 -12
package/src/tui/components/transcript.ts +120 -0
package/src/tui/components/update-box.ts +31 -0
package/src/tui/components/welcome.ts +162 -0
package/src/tui/components/width.ts +163 -0
package/src/tui/monitoring/AGENTS.md +31 -0
package/src/tui/monitoring/hud-view.ts +55 -0
package/src/tui/renderer.ts +112 -3
package/src/tui/terminal.ts +40 -33
package/src/util/AGENTS.md +39 -0
package/src/util/clipboard-image.ts +118 -0
package/src/util/env.ts +12 -0
package/src/util/provider-error.ts +78 -0
package/src/util/retry.ts +91 -6
package/src/util/update-check.ts +64 -0
package/src/commands/models.ts +0 -104

package/src/agent/compaction.ts CHANGED Viewed

@@ -1,17 +1,296 @@
 import { callLlm, type Message } from "./loop";
+import { countTokensAccurate, encodingFamilyForModel } from "./tokenizer";
+/** Tuning options for `maybeCompact`; every field is optional. */
 export interface CompactionOptions {
+  /** Compaction triggers once the non-system message count exceeds this (default 40, or 1 when `force` is set). */
   maxMessages?: number;
+  /** Compact even a short history when pasted/tool content exceeds this many tokens. */
+  maxTokens?: number;
+  /** Legacy char-based budget: used only when neither `contextTokens` nor `maxTokens` is given,
+   *  converted as chars/4 with a floor of 60 tokens. */
+  maxChars?: number;
+  /** Context window size in tokens. When truthy, 70% of it becomes the compaction budget
+   *  (taking precedence over `maxTokens`/`maxChars`) and it is the limit used for the
+   *  "still exceeded after compaction" error. */
+  contextTokens?: number;
+  /** Number of most-recent messages kept out of the summarized span (default 12, or 4 when `force` is set). */
   keepRecent?: number;
+  /** Model id forwarded to the summary `callLlm` call and to accurate token counting. */
   model?: string;
+  /** Cap the summarizer prompt so compaction itself cannot balloon context. */
+  maxSummaryInputTokens?: number;
+  /** Legacy char-based form of `maxSummaryInputTokens` (chars/4); used only when that field is unset. */
+  maxSummaryInputChars?: number;
   /** User-initiated `/compact`: lower the trigger floor so it actually compacts a small history. */
   force?: boolean;
+  /** When set, the summary `callLlm` is aborted/short-circuited and retries stop. */
+  signal?: AbortSignal;
 }
+/** Outcome reported by `maybeCompact`. */
 export interface CompactionResult {
+  /** True when `history` was rewritten in place by this call. */
   compacted: boolean;
+  /** Number of older messages that were replaced or dropped (0 when nothing changed). */
   removed: number;
+  /** Summary text as returned by the LLM; unset when no summary was produced. */
   summary?: string;
+  /** True when the LLM summary persistently failed; recent messages were kept
+   *  (token-bounded) and older ones dropped (no summary message). Signals degraded compaction. */
+  summaryFailed?: boolean;
+  /** Clear error context when limits are exceeded even after compaction. */
+  error?: string;
+  /** The 0-based index of the last message in history replaced by this compaction. */
+  replacesThrough?: number;
+  /** Files mutated in the span this compaction dropped — surfaced so callers
+   *  (engine/session) can keep file context even when the LLM summary omits it. */
+  touchedFiles?: string[];
+}
+/** Token budget `maybeCompact` falls back to when no `contextTokens`, `maxTokens`, or `maxChars` is supplied. */
+export const DEFAULT_MAX_TOKENS = 30_000;
+/** Summarizer-input cap `maybeCompact` falls back to when neither `maxSummaryInputTokens`
+ *  nor `maxSummaryInputChars` is supplied. */
+export const DEFAULT_SUMMARY_INPUT_TOKENS = 20_000;
+/**
+ * Cheap heuristic token estimate for `text`.
+ *
+ * Each ASCII code unit (<= 127) counts as 0.25 token. Every other UTF-16 code
+ * unit — Hangul syllables and jamo, CJK ideographs, hiragana, katakana,
+ * full-width forms, and any remaining non-ASCII character alike — counts as
+ * 1/1.5 token. The result is fractional; callers round if they need an integer.
+ *
+ * @param text String to measure.
+ * @returns Estimated token count (0 for an empty string).
+ */
+export function estimateTokens(text: string): number {
+  const asciiWeight = 0.25;
+  const wideWeight = 1 / 1.5;
+  let total = 0;
+  let idx = 0;
+  while (idx < text.length) {
+    total += text.charCodeAt(idx) <= 127 ? asciiWeight : wideWeight;
+    idx += 1;
+  }
+  return total;
+}
+/** Flat token charge applied per attached image (a rough vision-token estimate), so
+ *  the context meter and the compaction trigger account for image attachments. */
+const IMAGE_TOKEN_ESTIMATE = 1100;
+/** Heuristic token estimates cached per message OBJECT. The cache relies on the
+ *  convention that engine/compaction code replaces messages with new objects
+ *  instead of mutating `content`, so an entry never goes stale. Being a WeakMap,
+ *  it keeps no message alive after it leaves the history, and repeated
+ *  `historyTokens(history)` calls only pay for messages not seen before. */
+const messageTokenCache = new WeakMap<Message, number>();
+/**
+ * Heuristic token estimate for one message: role + content via `estimateTokens`,
+ * plus `IMAGE_TOKEN_ESTIMATE` per attached image, plus 1 for per-message overhead.
+ * The value is memoized by message identity.
+ */
+export function estimateMessageTokens(msg: Message): number {
+  const cached = messageTokenCache.get(msg);
+  if (cached !== undefined) {
+    return cached;
+  }
+  const imageCount = msg.images?.length ?? 0;
+  const roleTokens = estimateTokens(msg.role);
+  const contentTokens = estimateTokens(msg.content);
+  const total = roleTokens + contentTokens + imageCount * IMAGE_TOKEN_ESTIMATE + 1;
+  messageTokenCache.set(msg, total);
+  return total;
+}
+/** Heuristic token total for a history: the sum of `estimateMessageTokens` over
+ *  every message (0 for an empty list). */
+export function historyTokens(history: Message[]): number {
+  let total = 0;
+  for (const message of history) {
+    total += estimateMessageTokens(message);
+  }
+  return total;
+}
+/** Header that prefixes engine tool-feedback messages (`Tool [name] result (ok|fail):`). */
+const TOOL_RESULT_RE = /^Tool \[[^\]]+\] result \((ok|fail)\):/;
+/**
+ * Deterministic mid-turn context trim. When the heuristic size of `history`
+ * exceeds `opts.budgetTokens`, the BODIES of the oldest tool-result feedback
+ * messages are swapped for a short stub, oldest first, until the estimate fits
+ * or no candidates remain. Turn-boundary compaction (`maybeCompact`) does not
+ * run mid-turn, so this is the guard against a long multi-step turn growing
+ * its prompt without bound.
+ *
+ *  - No LLM calls are made, so it can run between any two steps.
+ *  - Only `user` messages whose content starts with a tool-result header are
+ *    candidates; system, ordinary user, and assistant messages are untouched.
+ *  - The newest `opts.keepRecent` tool results (default 8) are never elided.
+ *  - Elided messages are REPLACED by new objects (never mutated), keeping the
+ *    identity-keyed token caches truthful.
+ *
+ * @param history Message list; entries are replaced in place.
+ * @param opts `budgetTokens` is the target size; `keepRecent` the protected tail count.
+ * @returns How many messages were elided and the resulting token estimate.
+ */
+export function trimToolResultsInPlace(
+  history: Message[],
+  opts: { budgetTokens: number; keepRecent?: number },
+): { trimmed: number; tokens: number } {
+  const protectedCount = Math.max(0, opts.keepRecent ?? 8);
+  let tokens = historyTokens(history);
+  if (tokens <= opts.budgetTokens) return { trimmed: 0, tokens };
+  // Positions of every tool-result message, in history (oldest-first) order.
+  const toolResultIndices = history.flatMap((entry, position) =>
+    entry.role === "user" && TOOL_RESULT_RE.test(entry.content) ? [position] : [],
+  );
+  // Everything except the newest `protectedCount` of them may be elided.
+  const eligible = toolResultIndices.slice(0, Math.max(0, toolResultIndices.length - protectedCount));
+  let trimmed = 0;
+  for (const position of eligible) {
+    if (tokens <= opts.budgetTokens) break;
+    const current = history[position]!;
+    const headerMatch = current.content.match(TOOL_RESULT_RE);
+    const header = headerMatch?.[0] ?? "Tool result:";
+    const stub = `${header} [elided mid-turn to free context — re-run the tool if this result is needed again]`;
+    // A message no longer than its stub would not shrink — leave it alone.
+    if (current.content.length > stub.length) {
+      const replacement: Message = { ...current, content: stub };
+      tokens -= estimateMessageTokens(current);
+      history[position] = replacement;
+      tokens += estimateMessageTokens(replacement);
+      trimmed += 1;
+    }
+  }
+  return { trimmed, tokens };
+}
+/**
+ * Accurate (BPE) token counting, built on `countTokensAccurate`. Intended ONLY
+ * for the compaction decision boundary and summary-budget points — never the
+ * per-render footer path, which must stay on the cheap `historyTokens` heuristic.
+ *
+ * This cache stores accurate counts per message IDENTITY (messages are
+ * replaced, never mutated in place), with one inner entry per tokenizer family.
+ * Being a WeakMap, it holds no reference once a message leaves history.
+ */
+const accurateMessageTokenCache = new WeakMap<Message, Map<string, number>>();
+/**
+ * Accurate token count for ONE message: role + content via `countTokensAccurate`,
+ * plus `IMAGE_TOKEN_ESTIMATE` per attached image, plus 1 for per-message overhead.
+ * Results are cached per message and per tokenizer family, so switching models
+ * mid-session cannot serve a count produced by a different encoder.
+ *
+ * @param msg Message to measure.
+ * @param model Optional model id used to pick the tokenizer family.
+ */
+export function accurateMessageTokens(msg: Message, model?: string): number {
+  const family = encodingFamilyForModel(model);
+  const familyCounts = accurateMessageTokenCache.get(msg) ?? new Map<string, number>();
+  const cached = familyCounts.get(family);
+  if (cached !== undefined) return cached;
+  const roleTokens = countTokensAccurate(msg.role, model);
+  const contentTokens = countTokensAccurate(msg.content, model);
+  const imageTokens = (msg.images?.length ?? 0) * IMAGE_TOKEN_ESTIMATE;
+  const total = roleTokens + contentTokens + imageTokens + 1;
+  familyCounts.set(family, total);
+  // Registers a newly created per-family map; a no-op re-set for an existing one.
+  accurateMessageTokenCache.set(msg, familyCounts);
+  return total;
+}
+/** Accurate token total for a history: the sum of `accurateMessageTokens` over
+ *  every message (each of which already includes +1 per-message overhead). */
+export function accurateHistoryTokens(history: Message[], model?: string): number {
+  let total = 0;
+  for (const message of history) {
+    total += accurateMessageTokens(message, model);
+  }
+  return total;
+}
+/**
+ * Render `messages` as `[role] content` lines for the summarizer prompt, capped
+ * at roughly `maxTokens` (heuristic estimate, +1 per line).
+ *
+ * Messages are taken in order. The first message that does not fit is included
+ * in truncated form when more than 20 tokens of budget remain; any message that
+ * cannot be included at all is counted, and a trailing note reports that count.
+ * A truncated message is NOT counted as omitted — it already carries its own
+ * truncation marker.
+ *
+ * @param messages Messages to format (the span being summarized).
+ * @param maxTokens Approximate token cap for the returned text.
+ * @returns Newline-joined lines, plus an omission note when messages were dropped.
+ */
+function formatMessagesForSummaryByTokens(messages: Message[], maxTokens: number): string {
+  const out: string[] = [];
+  let used = 0;
+  let omitted = 0;
+  for (const msg of messages) {
+    const line = `[${msg.role}] ${msg.content}`;
+    const needed = estimateTokens(line) + 1;
+    if (used + needed <= maxTokens) {
+      out.push(line);
+      used += needed;
+      continue;
+    }
+    const remaining = Math.max(0, maxTokens - used);
+    if (remaining > 20) {
+      // Enough room for a useful excerpt: include a truncated copy and spend the rest of the budget.
+      out.push(truncateRecentContentByTokens(line, remaining - 1) + "…");
+      used = maxTokens;
+    } else {
+      // Nothing from this message made it into the prompt.
+      omitted++;
+    }
+  }
+  if (omitted > 0) out.push(`…(${omitted} older message(s) omitted from summary input to cap compaction context)`);
+  return out.join("\n");
+}
+/**
+ * Shorten `content` so its heuristic estimate (`estimateTokens`) fits `maxTokens`.
+ *
+ * Content that already fits is returned unchanged. Otherwise the longest fitting
+ * prefix is kept and a truncation marker is appended; when the budget is too
+ * small to hold the marker, the bare prefix is returned instead. The cut never
+ * lands inside a UTF-16 surrogate pair, so the result contains no lone
+ * surrogate from truncation.
+ *
+ * @param content Text to bound.
+ * @param maxTokens Token budget; values <= 0 yield an empty string.
+ * @returns The original text, or a truncated prefix (with marker when it fits).
+ */
+export function truncateRecentContentByTokens(content: string, maxTokens: number): string {
+  if (maxTokens <= 0) return "";
+  if (estimateTokens(content) <= maxTokens) return content;
+  const marker = "\n…(recent message truncated to bound context)";
+  const targetTokens = maxTokens - estimateTokens(marker);
+  // Reserve room for the marker only when the budget can actually hold it.
+  const withMarker = targetTokens > 0;
+  const limit = withMarker ? targetTokens : maxTokens;
+  let used = 0;
+  let end = 0;
+  for (; end < content.length; end++) {
+    // Same per-code-unit weights as `estimateTokens`.
+    const weight = content.charCodeAt(end) <= 127 ? 0.25 : 1 / 1.5;
+    if (used + weight > limit) break;
+    used += weight;
+  }
+  if (end > 0 && end < content.length) {
+    const last = content.charCodeAt(end - 1);
+    const next = content.charCodeAt(end);
+    const splitsPair = last >= 0xd800 && last <= 0xdbff && next >= 0xdc00 && next <= 0xdfff;
+    // Back off one unit rather than keep a high surrogate without its partner.
+    if (splitsPair) end--;
+  }
+  const head = content.slice(0, end);
+  return withMarker ? head + marker : head;
+}
+/**
+ * Bound an LLM summary to `maxTokens`, reserving room for the `SUMMARY_PREFIX`
+ * header that is prepended to the summary message. Uses the shared constant
+ * rather than a private copy of the literal so the reservation cannot drift
+ * from the prefix actually emitted.
+ *
+ * @param summary Raw summary text.
+ * @param maxTokens Budget for prefix + summary.
+ * @returns The summary, truncated when it exceeds the remaining budget.
+ */
+function truncateSummaryByTokens(summary: string, maxTokens: number): string {
+  const prefixTokens = estimateTokens(SUMMARY_PREFIX);
+  return truncateRecentContentByTokens(summary, Math.max(0, maxTokens - prefixTokens));
+}
+/**
+ * Bound the content of `messages` so that, together with per-message overhead
+ * (role estimate + 1), their heuristic size stays within `budgetTokens`.
+ *
+ * When everything already fits, the input is returned untouched — nothing is
+ * truncated and no message object is rebuilt, so identity-keyed token caches
+ * stay warm. Otherwise the content budget is shared fairly: messages smaller
+ * than an equal share keep their full text and the budget they leave unused is
+ * handed to the larger ones, which are truncated to their share. No message
+ * ends up with less than the flat `budget / count` split would have given it.
+ *
+ * @param messages Recent messages to keep.
+ * @param budgetTokens Total token budget for these messages.
+ * @returns The same array when it fits, else a new array with oversized messages replaced by truncated copies.
+ */
+function clampRecentMessagesByTokens(messages: Message[], budgetTokens: number): Message[] {
+  if (messages.length === 0) return messages;
+  const overhead = messages.reduce((sum, msg) => sum + estimateTokens(msg.role) + 1, 0);
+  const contentBudget = Math.max(0, budgetTokens - overhead);
+  const sizes = messages.map(msg => estimateTokens(msg.content));
+  const totalContent = sizes.reduce((sum, size) => sum + size, 0);
+  if (totalContent <= contentBudget) return messages;
+  // Visit messages smallest-first so budget unused by short messages flows to long ones.
+  const bySize = sizes.map((_, index) => index).sort((a, b) => sizes[a]! - sizes[b]!);
+  const caps = new Array<number>(messages.length).fill(0);
+  let remaining = contentBudget;
+  bySize.forEach((index, rank) => {
+    const share = Math.floor(remaining / (messages.length - rank));
+    const grant = Math.min(sizes[index]!, share);
+    caps[index] = grant;
+    remaining -= grant;
+  });
+  return messages.map((msg, index) =>
+    sizes[index]! <= caps[index]!
+      ? msg
+      : { ...msg, content: truncateRecentContentByTokens(msg.content, caps[index]!) },
+  );
+}
+/** Header that opens the summary message written by a successful compaction. */
+const SUMMARY_PREFIX = "[Earlier conversation summary]\n";
+/** Opening of an "omitted" placeholder message; recognized here as a compaction marker. */
+const FALLBACK_SUMMARY_PREFIX = "[Earlier conversation omitted:";
+/**
+ * Tell whether `body` (history without the system message) already begins with
+ * a compaction marker: a `user` message whose content starts with either prefix.
+ */
+function alreadyCompacted(body: Message[]): boolean {
+  const [head] = body;
+  if (head === undefined || head.role !== "user") return false;
+  return [SUMMARY_PREFIX, FALLBACK_SUMMARY_PREFIX].some(prefix => head.content.startsWith(prefix));
+}
+/** Header of a bash tool-result feedback message (`Tool [bash] result (ok|fail):`). */
+const BASH_RESULT_RE = /^Tool \[bash\] result \((?:ok|fail)\):/;
+/**
+ * File paths the agent mutated in `messages`, parsed mechanically (deduplicated,
+ * in first-seen order, capped at `max`) from two sources:
+ *   1. write/edit tool-call JSON in assistant messages
+ *      (`"tool":"write"…"filePath":…`);
+ *   2. conservative mutation mentions in `Tool [bash] result` feedback
+ *      (`created/wrote/written to/deleted/removed <path>`), kept only when the
+ *      token is path-shaped so prose such as "wrote 123 bytes" is ignored.
+ *
+ * @param messages Messages to scan.
+ * @param max Maximum number of paths to return (default 20); a value <= 0 yields an empty list.
+ * @returns Unique paths in the order they were first seen.
+ */
+export function extractTouchedFiles(messages: Message[], max = 20): string[] {
+  // A non-positive cap means "collect nothing" — never return more than was asked for.
+  if (max <= 0) return [];
+  const seen = new Set<string>();
+  const writeRe = /"tool"\s*:\s*"(?:write|edit)"[^}]*?"filePath"\s*:\s*"((?:[^"\\]|\\.){1,300})"/g;
+  const bashRe = /(?:created|wrote|written to|deleted|removed)\s+(['"`]?)([\w./@+-]{1,200})\1/gi;
+  const looksLikePath = (p: string) => /\//.test(p) || /[\w-]\.[A-Za-z0-9]{1,8}$/.test(p);
+  for (const msg of messages) {
+    if (msg.role === "assistant") {
+      // `matchAll` iterates over a private copy of the regex, so no `lastIndex` bookkeeping is needed.
+      for (const match of msg.content.matchAll(writeRe)) {
+        let decoded: unknown;
+        try {
+          // The capture is the raw JSON string body; re-quote it to decode escapes.
+          decoded = JSON.parse(`"${match[1]}"`);
+        } catch {
+          continue; // malformed escape — skip this path
+        }
+        if (typeof decoded === "string" && decoded) seen.add(decoded);
+        if (seen.size >= max) return [...seen];
+      }
+    }
+    if (BASH_RESULT_RE.test(msg.content)) {
+      for (const match of msg.content.matchAll(bashRe)) {
+        const candidate = match[2] ?? "";
+        if (!looksLikePath(candidate)) continue;
+        seen.add(candidate);
+        if (seen.size >= max) return [...seen];
+      }
+    }
+  }
+  return [...seen];
 }
 export async function maybeCompact(
@@ -19,17 +298,48 @@ export async function maybeCompact(
   opts: CompactionOptions = {}
 ): Promise<CompactionResult> {
   const maxMessages = opts.maxMessages ?? (opts.force ? 1 : 40);
+  // When opts.contextTokens is provided, 70% of it is used as the budget; otherwise opts.maxTokens is used, falling back to DEFAULT_MAX_TOKENS.
+  // A fallback for legacy callers that still pass maxChars is supported as well.
+  const budgetTokens = opts.contextTokens
+    ? opts.contextTokens * 0.7
+    : (opts.maxTokens ?? (opts.maxChars ? Math.max(opts.maxChars / 4, 60) : DEFAULT_MAX_TOKENS));
   const keepRecent = opts.keepRecent ?? (opts.force ? 4 : 12);
+  const maxSummaryInputTokens = opts.maxSummaryInputTokens ??
+    (opts.maxSummaryInputChars ? opts.maxSummaryInputChars / 4 : DEFAULT_SUMMARY_INPUT_TOKENS);
   const hasSystem = history.length > 0 && history[0].role === "system";
   const systemCount = hasSystem ? 1 : 0;
   const body = history.slice(systemCount);
+  const overMessages = opts.force || body.length > maxMessages;
+  // Decision boundary: use accurate BPE counts against a real TOKEN budget so we neither
+  // compact prematurely nor blow past the window on heuristic error. But when the budget
+  // is CHAR-derived (legacy `maxChars` → chars/4), measure with the matching char heuristic
+  // so the basis is consistent (accurate BPE under-counts repeated-char runs vs the heuristic).
+  const budgetFromChars = !opts.contextTokens && opts.maxTokens === undefined && opts.maxChars !== undefined;
+  const measuredTokens = budgetFromChars ? historyTokens(history) : accurateHistoryTokens(history, opts.model);
+  const overTokens = measuredTokens > budgetTokens;
-  if (body.length <= maxMessages) {
+  if (!overMessages && !overTokens) {
     return { compacted: false, removed: 0 };
   }
-  const olderCount = body.length - keepRecent;
+  // Idempotence guard: once the body is `[summary|omitted] + recent`, another
+  // compaction pass can only summarize the summary and lose information. If a
+  // hard context window is still exceeded, report it; otherwise leave history
+  // unchanged so repeated auto-/manual compaction converges.
+  if (alreadyCompacted(body) && body.length <= keepRecent + 1) {
+    const finalTokens = accurateHistoryTokens(history, opts.model);
+    const error = opts.contextTokens && finalTokens > opts.contextTokens
+      ? `Context window limit exceeded even after compaction. Remaining content size: ${Math.round(finalTokens)} tokens, Window limit: ${opts.contextTokens} tokens.`
+      : undefined;
+    return { compacted: false, removed: 0, error };
+  }
+  const recentCount = Math.min(keepRecent, Math.max(0, body.length - 1));
+  const olderCount = body.length - recentCount;
   if (olderCount <= 0) {
     return { compacted: false, removed: 0 };
   }
@@ -37,39 +347,120 @@ export async function maybeCompact(
   const older = body.slice(0, olderCount);
   const recent = body.slice(olderCount);
-  const olderFormatted = older
-    .map(msg => `[${msg.role}] ${msg.content}`)
-    .join("\n");
+  const olderFormatted = formatMessagesForSummaryByTokens(older, maxSummaryInputTokens);
+  // gjc-style file-operation preservation (plan/gjc-inheritance.md B8, gjc
+  // CompactionDetails 계승): the summary model may drop WHICH files were touched —
+  // extract them mechanically from the to-be-summarized messages and pin them
+  // into the prompt so post-compaction turns keep their file context.
+  const touched = extractTouchedFiles(older);
+  const touchedNote = touched.length
+    ? `\nFiles touched in the summarized span (PRESERVE this list verbatim in the summary): ${touched.join(", ")}`
+    : "";
   const systemPrompt =
-    "Summarize the following coding-agent conversation so work can continue. Capture decisions, files changed, current task state, and open TODOs. Be concise.";
-  try {
-    const summary = await callLlm(
-      [
-        { role: "user", content: olderFormatted }
-      ],
-      {
-        model: opts.model,
-        systemPrompt,
+    "Summarize the following coding-agent conversation so work can continue. Capture decisions, files changed, current task state, and open TODOs. Be concise." +
+    touchedNote;
+  // Degradation ladder: (1) RETRY the summary a few times with short, abort-aware
+  // backoff; (2) on persistent failure KEEP the recent messages verbatim and drop the
+  // older ones — no misleading placeholder — and surface summaryFailed.
+  const maxSummaryAttempts = 3; // initial attempt + up to 2 retries
+  const summaryBackoffMs = 200;
+  let summary: string | undefined;
+  let summaryError: unknown;
+  for (let attempt = 1; attempt <= maxSummaryAttempts; attempt++) {
+    if (opts.signal?.aborted) {
+      summaryError = new Error("aborted");
+      break;
+    }
+    try {
+      summary = await callLlm(
+        [
+          { role: "user", content: olderFormatted }
+        ],
+        {
+          model: opts.model,
+          systemPrompt,
+          signal: opts.signal,
+        }
+      );
+      summaryError = undefined;
+      break;
+    } catch (err) {
+      summaryError = err;
+      if (attempt < maxSummaryAttempts && !opts.signal?.aborted) {
+        await new Promise<void>(resolve => setTimeout(resolve, summaryBackoffMs * attempt));
       }
-    );
+    }
+  }
+  if (summary !== undefined) {
+    // Rung 1 success: behave exactly as before — summary message + bounded recent.
     const systemMessages = hasSystem ? [history[0]] : [];
+    const boundedSummary = truncateSummaryByTokens(summary, Math.min(budgetTokens, maxSummaryInputTokens));
+    // Force a mechanical "Files touched:" header at the FRONT of the summary so
+    // the file list survives even if the LLM dropped it from its prose (cycle 11).
+    const filesHeader = touched.length ? `Files touched: ${touched.join(", ")}\n\n` : "";
+    const summaryMessage: Message = { role: "user", content: SUMMARY_PREFIX + filesHeader + boundedSummary };
+    const systemTokens = historyTokens(systemMessages);
+    const summaryMessageTokens = historyTokens([summaryMessage]);
+    const boundedRecent = clampRecentMessagesByTokens(recent, Math.max(0, budgetTokens - summaryMessageTokens - systemTokens));
     const next: Message[] = [
       ...systemMessages,
-      { role: "user", content: "[Earlier conversation summary]\n" + summary },
-      ...recent
+      summaryMessage,
+      ...boundedRecent,
     ];
     history.splice(0, history.length, ...next);
+    const finalTokens = accurateHistoryTokens(history, opts.model);
+    let error: string | undefined;
+    if (opts.contextTokens && finalTokens > opts.contextTokens) {
+      error = `Context window limit exceeded even after compaction. Remaining content size: ${Math.round(finalTokens)} tokens, Window limit: ${opts.contextTokens} tokens.`;
+    }
     return {
       compacted: true,
       removed: older.length,
       summary,
+      error,
+      replacesThrough: systemCount + older.length - 1,
+      touchedFiles: touched.length ? touched : undefined,
     };
-  } catch {
+  }
+  // Aborted (user cancelled the turn): do NOT mutate history as a side effect of a
+  // cancelled compaction — leave it untouched and report no compaction.
+  if (opts.signal?.aborted) {
     return { compacted: false, removed: 0 };
   }
+  // Rung 2: KEEP-RECENT fallback. The summarizer persistently failed, so rather than inject
+  // a placeholder the model could mistake for real conversation, keep the N most-recent
+  // messages (token-bounded, like the success path) and drop the older ones (system kept).
+  const systemMessages = hasSystem ? [history[0]] : [];
+  const systemTokens = historyTokens(systemMessages);
+  const boundedRecent = clampRecentMessagesByTokens(recent, Math.max(0, budgetTokens - systemTokens));
+  const next: Message[] = [
+    ...systemMessages,
+    ...boundedRecent,
+  ];
+  history.splice(0, history.length, ...next);
+  process.stderr.write(`[jeo] compaction summary failed (${(summaryError as Error)?.message ?? "error"}); kept ${boundedRecent.length} recent messages (token-bounded) and dropped ${older.length} older messages.\n`);
+  const finalTokens = accurateHistoryTokens(history, opts.model);
+  let error: string | undefined;
+  if (opts.contextTokens && finalTokens > opts.contextTokens) {
+    error = `Context window limit exceeded even after compaction. Remaining content size: ${Math.round(finalTokens)} tokens, Window limit: ${opts.contextTokens} tokens.`;
+  }
+  return {
+    compacted: true,
+    removed: older.length,
+    summaryFailed: true,
+    error,
+    replacesThrough: systemCount + older.length - 1,
+    touchedFiles: touched.length ? touched : undefined,
+  };
 }

package/src/agent/config-schema.ts CHANGED Viewed

@@ -1,7 +1,9 @@
+import { findCatalogEntry } from "../ai/model-catalog-compat";
+import { CODEX_MODELS } from "../ai/model-catalog";
 import { z } from "zod";
 /**
- * Runtime validation for `~/.joc/config.json`. Previously the file was
+ * Runtime validation for `~/.jeo/config.json`. Previously the file was
  * `JSON.parse`d and cast straight to `Config` — a wrong-typed field (e.g. a
  * numeric `defaultModel`) slipped through untyped and surfaced as a confusing
  * downstream failure. `parseConfig` turns that into a clear, actionable signal.
@@ -16,6 +18,24 @@ const StoredOAuthSchema = z.object({
 });
 const OAuthEntry = z.union([z.string(), StoredOAuthSchema]);
+/** Optional `match` filter of a hook entry; currently a single optional `tool` string. */
+const HookMatchSchema = z.object({
+  tool: z.string().optional(),
+});
+/** One hook entry: the event it is bound to, an optional match filter, the `run`
+ *  string, and an optional positive-integer timeout in milliseconds. */
+const HookEntrySchema = z.object({
+  event: z.enum(["pre-tool", "post-turn", "post-implementation"]),
+  match: HookMatchSchema.optional(),
+  run: z.string(),
+  timeoutMs: z.number().int().min(1).optional(),
+});
+/** Shape of the top-level `hooks` config section: an optional `enabled` flag and
+ *  an optional list of hook entries. */
+const HookConfigSchema = z.object({
+  enabled: z.boolean().optional(),
+  hooks: z.array(HookEntrySchema).optional(),
+});
 export const ConfigSchema = z
   .object({
@@ -24,6 +44,7 @@ export const ConfigSchema = z
         anthropic: z.string().optional(),
         openai: z.string().optional(),
         gemini: z.string().optional(),
+        antigravity: z.string().optional(),
       })
       .default({}),
     oauth: z
@@ -31,17 +52,21 @@ export const ConfigSchema = z
         anthropic: OAuthEntry.optional(),
         openai: OAuthEntry.optional(),
         gemini: OAuthEntry.optional(),
+        antigravity: OAuthEntry.optional(),
       })
       .optional(),
     ollamaBaseUrl: z.string().optional(),
     openaiBaseUrl: z.string().optional(),
     defaultModel: z.string().min(1),
+    theme: z.string().optional(),
     thinkingLevel: z.enum(["minimal", "low", "medium", "high", "xhigh"]).optional(),
     modelAliases: z.record(z.string()).optional(),
+    /** Most-recently-selected models, newest first (drives the default + pickers). */
+    recentModels: z.array(z.string()).optional(),
     /**
-     * Provider retry budgets (gjc parity). `requestMaxRetries` counts retries
-     * (not the initial request) for a provider request; `maxDelayMs` caps backoff.
-     * `maxRetries`/`streamMaxRetries` are accepted for gjc-config compatibility.
+     * Provider retry budgets (gjc parity). `requestMaxRetries` is used for non-stream
+     * calls and stream initial connections; `streamMaxRetries` is used for stream retries.
+     * `maxRetries` is the fallback budget when either is unset; `maxDelayMs` caps backoff.
      */
     retry: z
       .object({
@@ -49,6 +74,8 @@ export const ConfigSchema = z
         streamMaxRetries: z.number().int().min(0).optional(),
         maxRetries: z.number().int().min(0).optional(),
         maxDelayMs: z.number().int().min(0).optional(),
+        rateLimitRetries: z.number().int().min(0).optional(),
+        rateLimitMinDelayMs: z.number().int().min(0).optional(),
       })
       .optional(),
     /**
@@ -60,7 +87,22 @@ export const ConfigSchema = z
       .record(
         z.object({
           model: z.string().optional(),
+          // Tolerated, informational provider tag (model ids are persisted provider-qualified)
+          provider: z.enum(["anthropic", "openai", "gemini", "antigravity", "ollama"]).optional(),
           maxSteps: z.number().int().min(1).optional(),
+          /** Per-role reasoning budget; absent = inherit the global thinkingLevel. */
+          thinking: z.enum(["minimal", "low", "medium", "high", "xhigh"]).optional(),
+          // ─── Custom-role declaration (SYSTEM-driven registry) ───
+          // An entry under a NON-bundled id that sets any of these becomes a
+          // first-class subagent role at runtime — no code change required.
+          /** Human title shown in /agents listings. */
+          title: z.string().optional(),
+          /** One-line purpose (also fed into the default prompt template). */
+          description: z.string().optional(),
+          /** Role prompt template ({{TOOL_PROTOCOL}}/{{ROLE_TITLE}}/{{ROLE_DESCRIPTION}} supported). */
+          prompt: z.string().optional(),
+          /** Custom roles default to READ-ONLY; set false to allow edits. */
+          readOnly: z.boolean().optional(),
         }),
       )
       .optional(),
@@ -72,15 +114,87 @@ export const ConfigSchema = z
         plan: z.string().optional(),
       })
       .optional(),
+    hooks: HookConfigSchema.optional(),
   })
   .passthrough();
 export type ValidatedConfig = z.infer<typeof ConfigSchema>;
 /** Validate parsed JSON against the config schema. Returns a tagged result, never throws. */
+/** Alias names that are accepted as-is even when absent from the user's `modelAliases`. */
+const BUILTIN_ALIASES = new Set(["fast", "local", "sonnet", "opus", "haiku", "gpt", "flash"]);
+/**
+ * Normalize a configured model id. The trimmed id is returned unchanged when it
+ *   1. already carries a provider prefix (ollama/, openai/, anthropic/, google/,
+ *      antigravity/ — compared case-insensitively),
+ *   2. resolves through `findCatalogEntry`,
+ *   3. is listed in `CODEX_MODELS`, or
+ *   4. is a user-defined or built-in alias.
+ * Otherwise, an id containing a `:tag` gets an `ollama/` prefix; anything else
+ * is returned trimmed.
+ *
+ * @param id Raw id from config; empty or undefined input is returned unchanged.
+ * @param aliases The user's `modelAliases` map.
+ */
+function normalizeModelId(id: string | undefined, aliases: Record<string, string>): string | undefined {
+  if (!id) return id;
+  const trimmed = id.trim();
+  const lowered = trimmed.toLowerCase();
+  const providerPrefixes = ["ollama/", "openai/", "anthropic/", "google/", "antigravity/"];
+  // Checks run in the order listed above and stop at the first hit.
+  const recognized =
+    providerPrefixes.some(prefix => lowered.startsWith(prefix)) ||
+    Boolean(findCatalogEntry(trimmed)) ||
+    CODEX_MODELS.includes(trimmed) ||
+    trimmed in aliases ||
+    BUILTIN_ALIASES.has(trimmed);
+  if (recognized || !trimmed.includes(":")) return trimmed;
+  // Unrecognized, unprefixed id with a `:tag` — qualify it with the ollama prefix.
+  return `ollama/${trimmed}`;
+}
 export function parseConfig(raw: unknown): { ok: true; config: ValidatedConfig } | { ok: false; message: string } {
   const result = ConfigSchema.safeParse(raw);
-  if (result.success) return { ok: true, config: result.data };
+  if (result.success) {
+    const config = result.data;
+    const aliases = config.modelAliases || {};
+    if (config.defaultModel) {
+      config.defaultModel = normalizeModelId(config.defaultModel, aliases) || config.defaultModel;
+    }
+    if (config.roles) {
+      if (config.roles.smol) {
+        config.roles.smol = normalizeModelId(config.roles.smol, aliases);
+      }
+      if (config.roles.slow) {
+        config.roles.slow = normalizeModelId(config.roles.slow, aliases);
+      }
+      if (config.roles.plan) {
+        config.roles.plan = normalizeModelId(config.roles.plan, aliases);
+      }
+    }
+    if (config.subagents) {
+      for (const key of Object.keys(config.subagents)) {
+        const sub = config.subagents[key];
+        if (sub && sub.model) {
+          sub.model = normalizeModelId(sub.model, aliases);
+        }
+      }
+    }
+    return { ok: true, config };
+  }
   const issue = result.error.issues[0];
   const where = issue?.path?.length ? issue.path.join(".") : "config";
   return { ok: false, message: `${where}: ${issue?.message ?? "invalid"}` };