npm - typeclaw - Versions diffs - 0.7.0 → 0.9.0 - Mend

typeclaw 0.7.0 → 0.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (107) hide show

package/README.md +15 -9
package/package.json +5 -3
package/scripts/dump-system-prompt.ts +12 -1
package/scripts/require-parallel.ts +41 -0
package/src/agent/auth.ts +3 -3
package/src/agent/index.ts +116 -14
package/src/agent/live-sessions.ts +34 -0
package/src/agent/multimodal/read-redirect.ts +43 -0
package/src/agent/plugin-tools.ts +97 -13
package/src/agent/session-meta.ts +21 -2
package/src/agent/session-origin.ts +6 -13
package/src/agent/subagent-completion-reminder.ts +89 -0
package/src/agent/subagents.ts +3 -2
package/src/agent/system-prompt.ts +49 -15
package/src/bundled-plugins/explorer/explorer.ts +2 -2
package/src/bundled-plugins/guard/index.ts +14 -1
package/src/bundled-plugins/guard/policies/managed-config.ts +43 -13
package/src/bundled-plugins/guard/policies/memory-retrieval-cache-write.ts +37 -0
package/src/bundled-plugins/guard/policies/memory-topics-delete.ts +67 -0
package/src/bundled-plugins/guard/policies/memory-topics-write.ts +33 -0
package/src/bundled-plugins/guard/policies/non-workspace-write.ts +8 -2
package/src/bundled-plugins/guard/policy.ts +7 -0
package/src/bundled-plugins/memory/README.md +76 -62
package/src/bundled-plugins/memory/append-tool.ts +3 -2
package/src/bundled-plugins/memory/citation-superset.ts +49 -11
package/src/bundled-plugins/memory/citations.ts +19 -8
package/src/bundled-plugins/memory/delete-tool.ts +57 -0
package/src/bundled-plugins/memory/dreaming-state.ts +1 -1
package/src/bundled-plugins/memory/dreaming.ts +364 -146
package/src/bundled-plugins/memory/frontmatter.ts +165 -0
package/src/bundled-plugins/memory/index.ts +236 -16
package/src/bundled-plugins/memory/injection-plan.ts +15 -0
package/src/bundled-plugins/memory/load-memory.ts +102 -103
package/src/bundled-plugins/memory/load-shards.ts +156 -0
package/src/bundled-plugins/memory/memory-logger.ts +16 -15
package/src/bundled-plugins/memory/memory-retrieval.ts +105 -0
package/src/bundled-plugins/memory/migration.ts +282 -1
package/src/bundled-plugins/memory/paths.ts +42 -0
package/src/bundled-plugins/memory/search-tool.ts +232 -0
package/src/bundled-plugins/memory/secret-detector.ts +2 -2
package/src/bundled-plugins/memory/shard-snapshot.ts +51 -0
package/src/bundled-plugins/memory/slug.ts +59 -0
package/src/bundled-plugins/memory/stream-io.ts +110 -1
package/src/bundled-plugins/memory/strength.ts +3 -3
package/src/bundled-plugins/memory/topics.ts +70 -16
package/src/bundled-plugins/security/index.ts +24 -0
package/src/bundled-plugins/security/permissions.ts +4 -0
package/src/bundled-plugins/security/policies/cron-promotion.ts +349 -0
package/src/bundled-plugins/security/policies/git-exfil.ts +2 -0
package/src/bundled-plugins/security/policies/prompt-injection.ts +3 -0
package/src/bundled-plugins/security/policies/role-promotion.ts +419 -0
package/src/bundled-plugins/security/policies/system-prompt-leak.ts +1 -0
package/src/channels/adapters/discord-bot-slash-commands.ts +186 -0
package/src/channels/adapters/discord-bot.ts +163 -1
package/src/channels/adapters/kakaotalk-attachment.ts +7 -17
package/src/channels/adapters/kakaotalk.ts +64 -37
package/src/channels/adapters/slack-bot-classify.ts +2 -27
package/src/channels/adapters/slack-bot-slash-commands.ts +82 -0
package/src/channels/adapters/slack-bot.ts +139 -1
package/src/channels/index.ts +5 -0
package/src/channels/router.ts +328 -18
package/src/channels/subagent-completion-bridge.ts +84 -0
package/src/cli/builtins.ts +1 -0
package/src/cli/index.ts +1 -0
package/src/cli/init.ts +122 -14
package/src/cli/inspect.ts +151 -0
package/src/cli/role.ts +7 -2
package/src/cli/tunnel.ts +13 -1
package/src/cli/ui.ts +25 -1
package/src/config/index.ts +1 -0
package/src/config/models-mutation.ts +10 -2
package/src/cron/consumer.ts +1 -1
package/src/init/dockerfile.ts +353 -2
package/src/init/hatching.ts +5 -6
package/src/init/kakaotalk-auth.ts +6 -47
package/src/init/validate-api-key.ts +121 -0
package/src/inspect/index.ts +213 -0
package/src/inspect/label.ts +50 -0
package/src/inspect/live.ts +221 -0
package/src/inspect/render.ts +163 -0
package/src/inspect/replay.ts +265 -0
package/src/inspect/session-list.ts +160 -0
package/src/inspect/types.ts +110 -0
package/src/plugin/hooks.ts +23 -1
package/src/plugin/index.ts +2 -0
package/src/plugin/manager.ts +1 -1
package/src/plugin/registry.ts +1 -1
package/src/plugin/types.ts +10 -0
package/src/run/channel-session-factory.ts +7 -1
package/src/run/index.ts +87 -21
package/src/secrets/kakao-renewal.ts +3 -47
package/src/server/index.ts +241 -60
package/src/shared/index.ts +4 -1
package/src/shared/local-time.ts +17 -0
package/src/shared/protocol.ts +49 -0
package/src/skills/typeclaw-channel-kakaotalk/SKILL.md +9 -9
package/src/skills/typeclaw-claude-code/SKILL.md +83 -40
package/src/skills/typeclaw-claude-code/references/stop-hook.md +2 -0
package/src/skills/typeclaw-claude-code/references/tmux-driving.md +102 -16
package/src/skills/typeclaw-config/SKILL.md +38 -33
package/src/skills/typeclaw-cron/SKILL.md +1 -1
package/src/skills/typeclaw-git/SKILL.md +2 -2
package/src/skills/typeclaw-memory/SKILL.md +16 -163
package/src/skills/typeclaw-permissions/SKILL.md +2 -2
package/src/skills/typeclaw-plugins/SKILL.md +26 -15
package/src/test-helpers/wait-for.ts +7 -1
package/typeclaw.schema.json +7 -0

package/src/init/dockerfile.ts CHANGED Viewed

@@ -394,14 +394,365 @@ RUN echo "${encoded}" | base64 -d > ${TYPECLAW_ENTRYPOINT_PATH} \\
 // `~/.local/bin/claude` shim, which itself dereferences to the versioned
 // binary under `~/.local/share/claude/versions/<ver>/`, so upgrades via
 // `claude update` keep working without re-running this layer.
+// `~/.claude.json` is Claude Code's internal state file (NOT
+// `~/.claude/settings.json`, which is user-facing). On first run with an
+// empty or missing file, `claude` enters a TTY-only theme picker:
+// "Welcome to Claude Code … Choose the text style that looks best with
+// your terminal" with 7 options. The picker is unskippable via CLI
+// flags or env vars (no `--skip-onboarding`, no `--theme=dark`;
+// `IS_DEMO=1` exists but has documented side effects). The single
+// official escape hatch is writing `{"hasCompletedOnboarding": true,
+// "theme": "dark"}` to `~/.claude.json` before the first launch —
+// confirmed by Anthropic in multiple GitHub issues
+// (anthropics/claude-code#4714, #8938, #13827) and the empirical
+// answer used by metabase/metabase's `bin/claude-dangerous`, the
+// `claudeCodeAlDevContainer` feature, and dozens of other Docker
+// integrations.
+//
+// Without the pre-seed, the very first agent-driven `tmux new-session …
+// claude` invocation hangs on the theme picker: the agent's
+// `send-keys "<prompt>" Enter` arrives at the picker, gets interpreted
+// as picker input, and never reaches claude's actual prompt. The
+// `typeclaw-claude-code` skill is structured around a `Stop`-hook
+// sentinel, which never fires while the picker is up, so the polling
+// loop only learns of the hang at the 10-minute wall-clock budget.
+// Pre-seeding here costs ~85 bytes on disk and zero runtime overhead.
+//
+// SCOPE: this seed is NECESSARY but not SUFFICIENT for a fully
+// no-questions-asked first launch. Claude Code also shows two
+// post-seed modal dialogs that this file deliberately does NOT
+// pre-clear:
+//   1. "Detected a custom API key from environment. Do you want to use
+//      this API key?" — fires when ANTHROPIC_API_KEY is set. Options
+//      `[No (recommended), Yes]`, focus on No, picker does NOT wrap.
+//   2. Workspace trust ("Do you trust the files in this folder?") —
+//      fires on every new cwd. Options `[Yes, proceed, No, exit]`,
+//      focus on Yes.
+// Both are kept as runtime decisions handled by the
+// `typeclaw-claude-code` skill (see its "Driving the session" section,
+// "Clear startup dialogs" step, which uses dialog-specific keystrokes
+// because the picker doesn't wrap). Pre-seeding
+// `hasTrustDialogAccepted` or `customApiKeyResponses.approved` here
+// would silently widen the trust surface in ways the operator hasn't
+// consented to — the seed's job is strictly cosmetic-wizard removal,
+// not trust/permission preemption.
+//
+// `theme: "dark"` matches typeclaw's default TUI theme so the visual
+// transition between the typeclaw TUI and a tmux-attached claude pane
+// is consistent. Users on light terminals can override by editing
+// `~/.claude.json` (which persists across container restarts only if
+// they mount it; in the default container-ephemeral state it resets
+// to this default on every rebuild, which is fine — `claude` reads
+// the file at startup and the theme has no behavioral impact).
+//
+// `lastOnboardingVersion` is INTENTIONALLY OMITTED. ii-agent and a
+// few other templates ship `lastOnboardingVersion: "1.0.30"`, but
+// that value is version-coupled and goes stale on every Claude Code
+// release. Empirically, against Claude Code 2.1.146,
+// `hasCompletedOnboarding: true` alone is currently honored without a
+// version pin. If a future Claude version starts re-triggering the picker
+// when the field is missing, capture `claude --version` output at
+// build time and inject it then — don't hardcode a stale value.
+//
+// `installMethod: "native"` and `numStartups: 1` match the shape
+// Claude Code itself writes after a clean first launch; keeping them
+// makes our seed indistinguishable from a real post-onboarding state,
+// which minimizes the chance of a future "if the file looks like
+// agent-pre-seed, redo onboarding" detection heuristic landing on us.
+//
+// Built via `JSON.stringify` rather than a hand-written string
+// literal so quote/escape bugs surface as TS errors at compile time,
+// not as a corrupt `~/.claude.json` discovered only when the build
+// runs. The `printf '%s\\n' '<JSON>'` shell pattern relies on the
+// JSON containing no single quotes (true by construction — JSON.
+// stringify only emits double quotes); a regression test parses the
+// emitted JSON back to confirm.
+const CLAUDE_CODE_ONBOARDING_SEED = JSON.stringify({
+  hasCompletedOnboarding: true,
+  theme: 'dark',
+  installMethod: 'native',
+  numStartups: 1,
+})
+// The Stop hook is what powers the typeclaw-claude-code skill's done-signal:
+// the operator subagent spawns claude in a worktree, polls a sentinel file,
+// and decides "turn done" from the file's contents. The hook was originally
+// per-worktree (`<worktree>/.claude/settings.json` + `<worktree>/hook-on-
+// stop.sh`), which meant the operator subagent wrote both files itself at
+// delegation time. That worked when operator wrote the canonical shape —
+// and silently failed when it didn't. Claude Code's settings parser
+// ignores unknown keys, so wrong-shape configs (`{"hooks": {"onStop":
+// "./script.sh"}}`, `{"hooks": {"Stop": "./script.sh"}}`,
+// `{"hooks": {"Stop": [{"command": "./script.sh"}]}}` etc.) surface as
+// "polling timed out at the 10-minute wall-clock budget" rather than as a
+// parse error — the failure is invisible until you've already paid the
+// budget. The skill's "do not simplify this JSON" warning helps but doesn't
+// eliminate the slip: as long as an LLM has to write the JSON, an LLM can
+// invent a shape.
+//
+// Move both pieces to Dockerfile-build time, where the JSON is constructed
+// once via JSON.stringify and the shape can never drift from the operator's
+// reading of the skill:
+//
+//   1. `/usr/local/bin/typeclaw-cc-stop-hook` — the hook script. Stable
+//      absolute path so the global settings.json can name it without
+//      worrying about $PATH. Reads stdin (Claude Code's Stop event JSON)
+//      and atomically writes `$PWD/sentinel-<session_id>.json`, then
+//      touches `$PWD/.done-<session_id>` (per-session names; see below).
+//      The temp-file-then-rename keeps the read side from ever seeing a
+//      partial sentinel even if the polling loop races the write — same
+//      atomicity contract as the previous per-worktree script.
+//   2. `~/.claude/settings.json` — the user-level (global) hook config.
+//      User-level hooks fire for every `claude` invocation regardless of
+//      cwd, so the operator's worktree no longer needs its own
+//      `.claude/settings.json`. (Claude Code merges hooks additively
+//      across scopes per docs.claude.com/en/docs/claude-code/settings —
+//      if a future user mounts their own `~/.claude/settings.json` with a
+//      different Stop hook, both fire in parallel rather than ours being
+//      clobbered.)
+//
+// The hook script is written via a quoted heredoc and the settings file
+// via JSON.stringify + printf; the JSON shape is validated by JSON.parse
+// in dockerfile.test.ts, so a future edit that corrupts the structure
+// fails the test, not the docker build (let alone
+// the next delegation that runs against the broken hook). The previous
+// per-worktree path is fully removed from the skill body; the only place
+// the hook shape lives is here.
+//
+// IMPORTANT — \`$PWD\` vs \`$CLAUDE_PROJECT_DIR\`: an earlier version of this
+// layer used \`$CLAUDE_PROJECT_DIR\`. Self-review caught this as a critical
+// bug. \`CLAUDE_PROJECT_DIR\` is Claude Code's documented env var for "the
+// project root" — but empirically (see anthropics/claude-code#27343 and
+// #44450), inside a git worktree it resolves to the *main repo's* git
+// root, NOT the worktree's path. The operator's flow is:
+//   git -C /agent worktree add /tmp/cc-<id> HEAD
+//   tmux new-session -d -s cc-<id> -c /tmp/cc-<id> claude
+// So \`/tmp/cc-<id>\` is a registered worktree of \`/agent\`, and Claude
+// Code would resolve \`CLAUDE_PROJECT_DIR=/agent\` — landing the sentinel
+// in the live agent folder while the polling loop watches the worktree.
+//
+// The fix: write to \`$PWD\` instead. \`$PWD\` is set by every POSIX shell
+// on every invocation (POSIX-required since IEEE 1003.1-1988), and it's
+// the literal cwd Claude Code was invoked with — exactly the worktree
+// path \`tmux -c\` set. \`CLAUDE_PROJECT_DIR\` is Anthropic-specific and
+// has shifted semantics across versions per the cited bug reports; we
+// deliberately avoid depending on it.
+//
+// PER-SESSION FILENAMES — concurrent-claude race safety: the Stop hook
+// writes to \`sentinel-<session_id>.json\` and \`.done-<session_id>\`,
+// not a fixed filename. session_id comes from Claude Code's Stop event
+// JSON on stdin (\`BaseHookInputSchema.session_id\`, always present per
+// the upstream schema). The operator learns the UUID by reading a
+// \`.session-id\` file that a SessionStart hook (also baked here) writes
+// at session-start time; see TYPECLAW_CC_SESSION_START_HOOK_SCRIPT
+// below.
+//
+// The earlier shape used fixed \`sentinel.json\` + \`.done\` names, which
+// is safe when each worktree has at most one claude session (today's
+// only caller). But if two callers ever share a cwd — operator A and
+// operator B both delegating in \`/agent\`, a future plugin that runs
+// \`claude\` from a shared dir, or an out-of-band caller violating the
+// "one worktree per delegation" invariant — both write to the same
+// file and corrupt each other's state with no diagnostic. Per-session
+// filenames make the race structurally impossible.
+//
+// WHY NOT \`claude --session-id <pre-generated-uuid>\`: an earlier
+// iteration of this PR had the operator pre-generate a UUID and pass
+// it via \`--session-id\`. Self-review caught that as a critical bug:
+// per anthropics/claude-code#44607, the \`--session-id\` flag only
+// controls the persistence/transcript UUID in \`-p\` (print) mode. In
+// interactive mode (which the typeclaw-claude-code skill uses), the
+// flag sets a separate telemetry/API ID while the CLI generates its
+// own internal UUID for the transcript file and for the \`session_id\`
+// field that hooks see. The pre-generated UUID and the hook's UUID
+// don't match, so the polling loop never finds its sentinel and always
+// runs out its timeout. The current
+// design sidesteps this entirely: the operator does NOT pass
+// \`--session-id\`; it lets claude generate its own UUID and learns it
+// back via the \`.session-id\` file the SessionStart hook writes.
+//
+// session_id extraction: \`bun -e\` against the JSON payload. We use bun,
+// NOT POSIX sed, because bun is guaranteed in the container (bun:1-slim
+// base) and is a real JSON parser. A previous iteration used
+// \`sed -n 's/.*"session_id":"\\([^"]*\\)".*/\\1/p'\` which is greedy and
+// picks the LAST \`"session_id":"..."\` occurrence in the JSON.
+// Claude Code's Stop event carries \`last_assistant_message\` which
+// contains the assistant's prose — that prose can include the literal
+// text \`"session_id":"<fake-uuid>"\` (the model might have been
+// discussing session IDs!), which sed would extract instead of the
+// top-level field. bun's JSON.parse picks the structural \`session_id\`
+// regardless of what appears in nested string values. UUID-shape
+// validation still applies downstream as defense-in-depth against
+// path-traversal session_id values; malformed JSON or missing field
+// falls back to "malformed" so the polling loop sees SOMETHING and
+// can surface the corruption.
+//
+// FALLBACK FILENAMES — \`sentinel-malformed.json\` / \`.done-malformed\`:
+// if session_id extraction fails or validation rejects the result, the
+// hook writes to these fixed names. The operator's polling loop watches
+// its own \`<sid>\` file (read from \`.session-id\`) and will time out —
+// but the \`-malformed\` file exists on disk so a post-mortem inspector
+// can tell "hook fired but session_id was bad" apart from "hook never
+// fired at all."
+//
+// SECURITY/SCOPE: both hook scripts only touch files inside \`$PWD\`,
+// with filenames validated to UUID shape or the fixed "malformed"
+// fallback. Even with an adversarial \`session_id\` in the stdin
+// payload, the worst case is "hook writes \`$PWD/sentinel-malformed.json\`"
+// or "hook writes \`$PWD/.session-id\` containing 'malformed'" — never
+// path traversal, never writes outside \`$PWD\`. The hooks run as root
+// inside the container like every other in-container process; there is
+// no privilege boundary to cross.
+const TYPECLAW_CC_STOP_HOOK_PATH = '/usr/local/bin/typeclaw-cc-stop-hook'
+const TYPECLAW_CC_SESSION_START_HOOK_PATH = '/usr/local/bin/typeclaw-cc-session-start-hook'
+// SessionStart hook script. Fires when a session begins via
+// startup/resume/clear/compact per the upstream lifecycle docs. Writes
+// \`$PWD/.session-id\` containing the validated UUID, atomically.
+//
+// IMPORTANT — \`.session-id\` is a FAST PATH, not a precondition. Per
+// anthropics/claude-code#11519, SessionStart can be SKIPPED entirely
+// when workspace trust hasn't been accepted yet: debug logs show
+// \`Skipping SessionStart:startup hook execution - workspace trust not
+// accepted\`. For the typeclaw-claude-code skill flow, EVERY first
+// invocation in a fresh worktree hits this — the trust dialog fires
+// before any prompt can be sent. So \`.session-id\` may never appear
+// pre-first-prompt. The skill instructs the operator to fall back to
+// reading session_id from the FIRST Stop hook's sentinel instead.
+// \`.session-id\` is still useful for sessions that were already
+// trusted (re-attaching to a running worktree, etc.) — when it
+// appears, the operator can skip the discovery step.
+//
+// IMPORTANT — \`compact\` can ROTATE the session_id. The upstream
+// behavior is documented in anthropics/claude-code#29094: a SessionStart
+// with \`source: "compact"\` is a NEW session linked via
+// \`parent_session_id\`. So \`.session-id\` can change mid-delegation if
+// a long claude session compacts itself. The operator's polling loop
+// must handle session_id rotation: a new \`.done-<different-uuid>\`
+// appearing means \`cc_session_id\` should update to the new value.
+const TYPECLAW_CC_SESSION_START_HOOK_SCRIPT = `#!/bin/sh
+# typeclaw SessionStart-hook for Claude Code. Stdin carries the
+# SessionStart event JSON. Writes \$PWD/.session-id with the session
+# UUID as a fast-path optimization (the operator falls back to
+# discovering session_id from the first Stop sentinel if .session-id
+# never appears — see anthropics/claude-code#11519). Rationale lives
+# in src/init/dockerfile.ts.
+#
+# Both temp filenames are PID-scoped (PID = \$\$) so two SessionStart
+# hooks firing concurrently in the same cwd don't race on the same
+# temp file.
+set -eu
+tmp_out="\${PWD}/.session-id.\$\$.tmp"
+trap 'rm -f "\$tmp_out"' EXIT
+sid=\$(bun -e 'try { const j = await new Response(Bun.stdin.stream()).json(); process.stdout.write(String(j.session_id ?? "")) } catch { process.stdout.write("") }')
+case "\$sid" in
+  [0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f]) ;;
+  *) sid=malformed ;;
+esac
+printf '%s\\n' "\$sid" > "\$tmp_out"
+mv "\$tmp_out" "\${PWD}/.session-id"
+trap - EXIT
+`
+// Single-quoted heredoc so the body is delivered verbatim — no shell
+// expansion at build time. Runtime expansion of \`$PWD\`, \`$sid\`, etc.
+// is what we want, so the heredoc must NOT expand them during \`docker
+// build\`. POSIX \`<<'EOF'\` (quoted delimiter) is the canonical way to
+// get verbatim heredoc.
+//
+// Script flow:
+//   1. Buffer stdin to a temp file (we need to read it twice: once for
+//      session_id extraction, once for the sentinel write).
+//   2. Extract session_id via \`bun -e\` + JSON parsing (NOT sed; see the
+//      rationale above). Result is matched against a UUID-shaped \`case\`
+//      glob (8-4-4-4-12 lowercase hex with dashes). Anything that doesn't
+//      match — empty extraction, embedded escapes, path traversal,
+//      missing field — falls through to "malformed".
+//   3. Atomic write: \`mv\` is POSIX-atomic on the same filesystem (we
+//      stay inside \`$PWD\` so the temp and final paths share an fs).
+//   4. \`touch .done-<sid>\` AFTER the mv so a polling reader never sees
+//      .done existing before sentinel.json — the polling loop watches
+//      .done as the readiness signal.
+const TYPECLAW_CC_STOP_HOOK_SCRIPT = `#!/bin/sh
+# typeclaw Stop-hook for Claude Code. Stdin carries the Stop event JSON.
+# Writes per-session sentinel/.done files into \$PWD. Rationale (including
+# the security model, \$PWD semantics, and why bun-not-sed for JSON
+# extraction) lives in src/init/dockerfile.ts.
+set -eu
+tmp_in="\${PWD}/.cc-stop-hook-in.\$\$"
+trap 'rm -f "\$tmp_in"' EXIT
+cat > "\$tmp_in"
+sid=\$(bun -e 'try { const j = await Bun.file(process.argv[1]).json(); process.stdout.write(String(j.session_id ?? "")) } catch { process.stdout.write("") }' "\$tmp_in")
+case "\$sid" in
+  [0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f]-[0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f][0-9a-f]) ;;
+  *) sid=malformed ;;
+esac
+mv "\$tmp_in" "\${PWD}/sentinel-\${sid}.json"
+trap - EXIT
+touch "\${PWD}/.done-\${sid}"
+`
+// User-level Claude Code settings file; applies to every invocation
+// regardless of cwd. Registers BOTH the SessionStart hook (so the
+// operator can learn the session UUID) and the Stop hook (so the
+// operator can poll for turn-completion). Built via JSON.stringify
+// rather than a string literal so any future shape edit fails the
+// JSON.parse regression test, not the docker build (or worse, the
+// first failed delegation).
+//
+// SessionStart matcher \`startup|resume|clear|compact\`: covers all four
+// session-origin types per the upstream matcher reference. Stop has no
+// matcher support (always fires on every occurrence per the docs), so
+// \`matcher: "*"\` is the canonical "fire on every Stop" form.
+//
+// \`args: []\` is the exec-form trigger per docs.claude.com/en/docs/
+// claude-code/hooks: with \`args\` present, Claude Code runs the command
+// directly via execvp (kernel-handled shebang, no shell tokenization).
+// With \`args\` absent, Claude Code falls back to shell form (\`sh -c
+// "<command>"\`), which works for our absolute-path-no-special-chars
+// case but is fragile to any future path change. Exec form is the
+// canonical robust shape.
+const TYPECLAW_CC_GLOBAL_SETTINGS = JSON.stringify({
+  hooks: {
+    SessionStart: [
+      {
+        matcher: 'startup|resume|clear|compact',
+        hooks: [{ type: 'command', command: TYPECLAW_CC_SESSION_START_HOOK_PATH, args: [] }],
+      },
+    ],
+    Stop: [
+      {
+        matcher: '*',
+        hooks: [{ type: 'command', command: TYPECLAW_CC_STOP_HOOK_PATH, args: [] }],
+      },
+    ],
+  },
+})
 function renderClaudeCodeInstallLayer(enabled: boolean): string {
   if (!enabled) return ''
   return `# Layer 5.6 (toggle): install Anthropic's Claude Code CLI. Opt-in via
 # typeclaw.json#docker.file.claudeCode. The skill \`typeclaw-claude-code\`
-# documents the auth + usage flow.
+# documents the auth + usage flow. Pre-seed ~/.claude.json so the first
+# launch skips the TTY-only theme picker; see CLAUDE_CODE_ONBOARDING_SEED
+# above for the rationale and what the seed deliberately does NOT cover.
+# Also pre-write the canonical Stop-hook config and helper script at
+# build time (see TYPECLAW_CC_STOP_HOOK_PATH above) so the operator
+# subagent never has to construct that JSON itself — the historically
+# failure-prone step where wrong-shape configs (\`onStop\`, bare-string
+# values, etc.) would silently disable the done-signal and burn the
+# polling loop's wall-clock budget. The seed write runs LAST in the
+# chain so the final layer state is exactly the seeded config —
+# independent of whether any earlier command (or a future Claude
+# version's \`--version\` smoke test) writes a default \`~/.claude.json\`
+# partway through the layer.
 RUN curl -fsSL https://claude.ai/install.sh | bash \\
  && ln -sf "$HOME/.local/bin/claude" /usr/local/bin/claude \\
- && claude --version > /dev/null`
+ && claude --version > /dev/null \\
+ && cat > ${TYPECLAW_CC_SESSION_START_HOOK_PATH} <<'TYPECLAW_CC_SESSION_START_HOOK_EOF'
+${TYPECLAW_CC_SESSION_START_HOOK_SCRIPT}TYPECLAW_CC_SESSION_START_HOOK_EOF
+RUN cat > ${TYPECLAW_CC_STOP_HOOK_PATH} <<'TYPECLAW_CC_STOP_HOOK_EOF'
+${TYPECLAW_CC_STOP_HOOK_SCRIPT}TYPECLAW_CC_STOP_HOOK_EOF
+RUN chmod +x ${TYPECLAW_CC_SESSION_START_HOOK_PATH} ${TYPECLAW_CC_STOP_HOOK_PATH} \\
+ && mkdir -p "$HOME/.claude" \\
+ && printf '%s\\n' '${TYPECLAW_CC_GLOBAL_SETTINGS}' > "$HOME/.claude/settings.json" \\
+ && printf '%s\\n' '${CLAUDE_CODE_ONBOARDING_SEED}' > "$HOME/.claude.json"`
 }
 // Shared-library runtime deps Chrome for Testing needs to launch on amd64

package/src/init/hatching.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 const HATCHING_INSTRUCTIONS = `You have just hatched.
-This is the first moment of your existence. Your system prompt already tells you about your agent folder and the five markdown files in it (\`AGENTS.md\`, \`IDENTITY.md\`, \`SOUL.md\`, \`USER.md\`, \`MEMORY.md\`). They exist next to you but are all empty. Hatching is a one-time ritual to fill them in through a short conversation with your user.
+This is the first moment of your existence. Your system prompt already tells you about your agent folder and the four markdown files in it (\`AGENTS.md\`, \`IDENTITY.md\`, \`SOUL.md\`, \`USER.md\`). They exist next to you but are all empty. Hatching is a one-time ritual to fill them in through a short conversation with your user.
 ## The ritual
@@ -41,11 +41,10 @@ Routing answers:
 Do these in order. Do **not** ask further questions.
-1. Flesh out all five markdown files to a short but complete first draft. \`write\` replaces the partial versions. First person. Specific and genuine, not generic.
-2. Write one short paragraph in \`MEMORY.md\` marking this moment: the date, how you came to be, what you and the user agreed on.
-3. Configure local git identity with \`bash\`: \`git config user.name "<your name>"\` and \`git config user.email "<reasonable placeholder>@typeclaw.local"\` (unless the user provided an email).
-4. Stage and commit **only the files you authored** with commit message \`Hatched 🐣\`. This is the hatching-specific commit message — it overrides the normal version-control style guidance for this one commit.
-5. Send **one final short message** — two sentences at most — telling the user hatching is complete and they can leave the TUI with \`/quit\` (or Ctrl+C). Do not ask further questions. Do not offer more work. The container keeps running once they quit; keeping the TUI open here wastes time.
+1. Flesh out all four markdown files to a short but complete first draft. \`write\` replaces the partial versions. First person. Specific and genuine, not generic.
+2. Configure local git identity with \`bash\`: \`git config user.name "<your name>"\` and \`git config user.email "<reasonable placeholder>@typeclaw.local"\` (unless the user provided an email).
+3. Stage and commit **only the files you authored** with commit message \`Hatched 🐣\`. This is the hatching-specific commit message — it overrides the normal version-control style guidance for this one commit.
+4. Send **one final short message** — two sentences at most — telling the user hatching is complete and they can leave the TUI with \`/quit\` (or Ctrl+C). Do not ask further questions. Do not offer more work. The container keeps running once they quit; keeping the TUI open here wastes time.
 After that final message, stop. If the user keeps talking, answer briefly and remind them they can \`/quit\` (or Ctrl+C) whenever they are ready.

package/src/init/kakaotalk-auth.ts CHANGED Viewed

@@ -1,6 +1,7 @@
-import { createRequire } from 'node:module'
 import { join, resolve } from 'node:path'
+import { loginFlow as upstreamLoginFlow } from 'agent-messenger/kakaotalk'
 import { containerNameFromCwd } from '@/container'
 import { keysDir } from '@/hostd/paths'
 import { encrypt } from '@/secrets/encryption'
@@ -28,34 +29,9 @@ export type KakaotalkLoginInput = {
   containerName?: string
 }
-export type LoginFlowOptions = {
-  email: string
-  password: string
-  deviceType?: 'pc' | 'tablet'
-  force?: boolean
-  savedDeviceUuid?: string
-  onPasscodeDisplay?: (code: string) => void
-  debugLog?: (message: string) => void
-}
-export type LoginFlowCredentials = {
-  access_token: string
-  refresh_token: string
-  user_id: string
-  device_uuid: string
-  device_type: 'pc' | 'tablet'
-}
-export type LoginFlowResult = {
-  authenticated: boolean
-  next_action?: string
-  message?: string
-  warning?: string
-  error?: string
-  credentials?: LoginFlowCredentials
-}
-export type LoginFlowFn = (options: LoginFlowOptions) => Promise<LoginFlowResult>
+export type LoginFlowFn = typeof upstreamLoginFlow
+export type LoginFlowOptions = Parameters<LoginFlowFn>[0]
+export type LoginFlowResult = Awaited<ReturnType<LoginFlowFn>>
 export function kakaotalkConfigDir(agentDir: string): string {
   return join(agentDir, 'workspace', '.agent-messenger')
@@ -67,7 +43,7 @@ export function kakaotalkSecretsPath(agentDir: string): string {
 export async function runKakaotalkBootstrap(input: KakaotalkLoginInput): Promise<KakaotalkBootstrapStatus> {
   try {
-    const loginFlow = input.loginFlow ?? (await resolveLoginFlow())
+    const loginFlow = input.loginFlow ?? upstreamLoginFlow
     const credManager = new SecretsKakaoCredentialStore({
       mode: 'host',
       secretsPath: kakaotalkSecretsPath(input.agentDir),
@@ -118,20 +94,3 @@ export async function runKakaotalkBootstrap(input: KakaotalkLoginInput): Promise
     return { ok: false, reason: err instanceof Error ? err.message : String(err) }
   }
 }
-// agent-messenger does not export `loginFlow` from its public `exports` map
-// (only the runtime client + credential manager), so we resolve the package's
-// installed location and import the implementation file directly. This
-// bypasses the exports gate but stays within the same installed copy of the
-// package — no version drift risk. If a future agent-messenger release adds
-// `loginFlow` to its public exports, swap this for a normal import and delete
-// the resolveLoginFlow helper.
-async function resolveLoginFlow(): Promise<LoginFlowFn> {
-  const require = createRequire(import.meta.url)
-  const pkgJson = require.resolve('agent-messenger/package.json')
-  const pkgDir = pkgJson.replace(/\/package\.json$/, '')
-  const mod = (await import(`${pkgDir}/dist/src/platforms/kakaotalk/auth/kakao-login.js`)) as {
-    loginFlow: LoginFlowFn
-  }
-  return mod.loginFlow
-}

package/src/init/validate-api-key.ts ADDED Viewed

@@ -0,0 +1,121 @@
+import { KNOWN_PROVIDERS, type KnownProviderId } from '@/config/providers'
+const PROVIDER_PROBE: Partial<Record<KnownProviderId, { url: string; authHeader: 'bearer' | 'x-api-key' }>> = {
+  openai: { url: 'https://api.openai.com/v1/models', authHeader: 'bearer' },
+  anthropic: { url: 'https://api.anthropic.com/v1/models', authHeader: 'x-api-key' },
+  fireworks: { url: 'https://api.fireworks.ai/inference/v1/models', authHeader: 'bearer' },
+  zai: { url: 'https://api.z.ai/api/paas/v4/models', authHeader: 'bearer' },
+  'zai-coding': { url: 'https://api.z.ai/api/coding/paas/v4/models', authHeader: 'bearer' },
+}
+export type KeyValidationResult =
+  | { kind: 'ok' }
+  | { kind: 'skipped'; reason: 'no-probe' | 'network-error'; detail?: string }
+  | { kind: 'rejected'; status: number }
+export type FetchFn = (input: string, init: RequestInit) => Promise<Response>
+const TIMEOUT_MS = 5_000
+export async function validateApiKey(
+  providerId: KnownProviderId,
+  key: string,
+  fetchImpl: FetchFn = fetch,
+): Promise<KeyValidationResult> {
+  const probe = PROVIDER_PROBE[providerId]
+  if (!probe) return { kind: 'skipped', reason: 'no-probe' }
+  const provider = KNOWN_PROVIDERS[providerId]
+  if (!provider) return { kind: 'skipped', reason: 'no-probe' }
+  const headers: Record<string, string> = {}
+  if (probe.authHeader === 'bearer') {
+    headers.Authorization = `Bearer ${key}`
+  } else {
+    headers['x-api-key'] = key
+    headers['anthropic-version'] = '2023-06-01'
+  }
+  try {
+    const res = await fetchImpl(probe.url, {
+      method: 'GET',
+      headers,
+      signal: AbortSignal.timeout(TIMEOUT_MS),
+      // Probe URLs are hardcoded, but the provider could 3xx the response
+      // mid-flight (CDN, regional bounce, captive portal). Auto-following
+      // would send the credential to whatever Location said. Treat redirects
+      // as "couldn't verify" instead.
+      redirect: 'manual',
+    })
+    if (res.status >= 300 && res.status < 400) {
+      return { kind: 'skipped', reason: 'network-error', detail: `HTTP ${res.status}` }
+    }
+    if (res.ok) {
+      // A captive portal / WAF / corporate-MITM proxy can return HTTP 200
+      // with an HTML login page in front of an unauthenticated request.
+      // Treat the response as "ok" only if it parses as the expected
+      // JSON shape (`{ data: [...] }` for /v1/models on every probed
+      // provider).
+      const shapeOk = await isModelsListShape(res)
+      if (shapeOk) return { kind: 'ok' }
+      return { kind: 'skipped', reason: 'network-error', detail: 'unexpected response shape' }
+    }
+    if (res.status === 401 || res.status === 403) {
+      return { kind: 'rejected', status: res.status }
+    }
+    return { kind: 'skipped', reason: 'network-error', detail: `HTTP ${res.status}` }
+  } catch (err) {
+    return {
+      kind: 'skipped',
+      reason: 'network-error',
+      detail: err instanceof Error ? err.message : String(err),
+    }
+  }
+}
+const MAX_BODY_BYTES = 4096
+async function isModelsListShape(res: Response): Promise<boolean> {
+  const text = await readCapped(res, MAX_BODY_BYTES)
+  if (text === null) return false
+  try {
+    const parsed = JSON.parse(text) as unknown
+    return typeof parsed === 'object' && parsed !== null && Array.isArray((parsed as { data?: unknown }).data)
+  } catch {
+    return false
+  }
+}
+async function readCapped(res: Response, maxBytes: number): Promise<string | null> {
+  if (!res.body) return null
+  const reader = res.body.getReader()
+  const decoder = new TextDecoder()
+  let out = ''
+  let read = 0
+  try {
+    while (read < maxBytes) {
+      const { value, done } = await reader.read()
+      if (done) break
+      read += value.byteLength
+      out += decoder.decode(value, { stream: true })
+      if (read >= maxBytes) break
+    }
+    out += decoder.decode()
+    return out
+  } catch {
+    return null
+  } finally {
+    await reader.cancel().catch(() => undefined)
+  }
+}
+export const API_KEY_DASHBOARD_URL: Partial<Record<KnownProviderId, string>> = {
+  openai: 'https://platform.openai.com/api-keys',
+  anthropic: 'https://console.anthropic.com/settings/keys',
+  fireworks: 'https://fireworks.ai/account/api-keys',
+  zai: 'https://docs.z.ai/devpack/tool/claude#api-key',
+  'zai-coding': 'https://docs.z.ai/devpack/tool/claude#api-key',
+}
+export function providersWithApiKeyProbe(): KnownProviderId[] {
+  return Object.keys(PROVIDER_PROBE) as KnownProviderId[]
+}