npm - smol-symphony - Versions diffs - 0.1.0 → 0.2.0 - Mend

smol-symphony 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (140) hide show

package/AGENTS.md +105 -38
package/PRODUCT.md +2 -1
package/README.md +195 -98
package/SPEC.md +543 -1915
package/WORKFLOW.md +654 -179
package/WORKFLOW.template.md +761 -121
package/dist/acp-bridge.js +324 -0
package/dist/acp-bridge.js.map +1 -0
package/dist/actions/cache.js +191 -0
package/dist/actions/cache.js.map +1 -0
package/dist/actions/effects.js +41 -0
package/dist/actions/effects.js.map +1 -0
package/dist/actions/executor.js +570 -0
package/dist/actions/executor.js.map +1 -0
package/dist/actions/index.js +13 -0
package/dist/actions/index.js.map +1 -0
package/dist/actions/parsing.js +273 -0
package/dist/actions/parsing.js.map +1 -0
package/dist/actions/predicate-env.js +27 -0
package/dist/actions/predicate-env.js.map +1 -0
package/dist/actions/predicates.js +49 -0
package/dist/actions/predicates.js.map +1 -0
package/dist/actions/templating.js +66 -0
package/dist/actions/templating.js.map +1 -0
package/dist/actions/types.js +15 -0
package/dist/actions/types.js.map +1 -0
package/dist/agent/acp.js +232 -63
package/dist/agent/acp.js.map +1 -1
package/dist/agent/adapter-names.js +159 -0
package/dist/agent/adapter-names.js.map +1 -0
package/dist/agent/adapters.js +338 -102
package/dist/agent/adapters.js.map +1 -1
package/dist/agent/credential-extractors.js +342 -0
package/dist/agent/credential-extractors.js.map +1 -0
package/dist/agent/credential-secrets.js +628 -0
package/dist/agent/credential-secrets.js.map +1 -0
package/dist/agent/credential-ticker.js +57 -0
package/dist/agent/credential-ticker.js.map +1 -0
package/dist/agent/gondolin-creds-staging.js +356 -0
package/dist/agent/gondolin-creds-staging.js.map +1 -0
package/dist/agent/gondolin-dispatch.js +375 -0
package/dist/agent/gondolin-dispatch.js.map +1 -0
package/dist/agent/gondolin.js +124 -0
package/dist/agent/gondolin.js.map +1 -0
package/dist/agent/runner-decisions.js +134 -0
package/dist/agent/runner-decisions.js.map +1 -0
package/dist/agent/runner.js +1352 -290
package/dist/agent/runner.js.map +1 -1
package/dist/agent/tool-call-summary.js +102 -0
package/dist/agent/tool-call-summary.js.map +1 -0
package/dist/agent/vm-acp-mapping.js +73 -0
package/dist/agent/vm-acp-mapping.js.map +1 -0
package/dist/agent/vm-guards.js +262 -0
package/dist/agent/vm-guards.js.map +1 -0
package/dist/agent/vm-port.js +22 -0
package/dist/agent/vm-port.js.map +1 -0
package/dist/agent/vm-process-registry.js +79 -0
package/dist/agent/vm-process-registry.js.map +1 -0
package/dist/bin/cli-args.js +105 -0
package/dist/bin/cli-args.js.map +1 -0
package/dist/bin/symphony.js +719 -130
package/dist/bin/symphony.js.map +1 -1
package/dist/errors.js +15 -0
package/dist/errors.js.map +1 -0
package/dist/http-disk.js +135 -0
package/dist/http-disk.js.map +1 -0
package/dist/http-handlers.js +180 -0
package/dist/http-handlers.js.map +1 -0
package/dist/http.js +1476 -764
package/dist/http.js.map +1 -1
package/dist/issues.js +178 -0
package/dist/issues.js.map +1 -0
package/dist/logging.js +163 -5
package/dist/logging.js.map +1 -1
package/dist/mcp.js +391 -163
package/dist/mcp.js.map +1 -1
package/dist/memory.js +85 -0
package/dist/memory.js.map +1 -0
package/dist/orchestrator-decisions.js +331 -0
package/dist/orchestrator-decisions.js.map +1 -0
package/dist/orchestrator.js +1189 -303
package/dist/orchestrator.js.map +1 -1
package/dist/prompt.js +5 -5
package/dist/prompt.js.map +1 -1
package/dist/reconciler/cache.js +65 -0
package/dist/reconciler/cache.js.map +1 -0
package/dist/reconciler/index.js +448 -0
package/dist/reconciler/index.js.map +1 -0
package/dist/reconciler/ledger.js +131 -0
package/dist/reconciler/ledger.js.map +1 -0
package/dist/reconciler/pr-adapters.js +174 -0
package/dist/reconciler/pr-adapters.js.map +1 -0
package/dist/reconciler/pr-decide.js +167 -0
package/dist/reconciler/pr-decide.js.map +1 -0
package/dist/reconciler/pr.js +422 -0
package/dist/reconciler/pr.js.map +1 -0
package/dist/reconciler/types.js +12 -0
package/dist/reconciler/types.js.map +1 -0
package/dist/reconciler/vm.js +243 -0
package/dist/reconciler/vm.js.map +1 -0
package/dist/reconciler/workspace-defaults.js +83 -0
package/dist/reconciler/workspace-defaults.js.map +1 -0
package/dist/reconciler/workspace.js +272 -0
package/dist/reconciler/workspace.js.map +1 -0
package/dist/runlog.js +403 -0
package/dist/runlog.js.map +1 -0
package/dist/scaffold.js +165 -0
package/dist/scaffold.js.map +1 -0
package/dist/trackers/local.js +234 -133
package/dist/trackers/local.js.map +1 -1
package/dist/trackers/types.js +1 -1
package/dist/trackers/types.js.map +1 -1
package/dist/types.js +1 -1
package/dist/util/clock.js +12 -0
package/dist/util/clock.js.map +1 -0
package/dist/util/crypto.js +25 -0
package/dist/util/crypto.js.map +1 -0
package/dist/util/frontmatter.js +70 -0
package/dist/util/frontmatter.js.map +1 -0
package/dist/util/fs-issues.js +22 -0
package/dist/util/fs-issues.js.map +1 -0
package/dist/util/process.js +152 -0
package/dist/util/process.js.map +1 -0
package/dist/util/workspace-key.js +10 -0
package/dist/util/workspace-key.js.map +1 -0
package/dist/workflow-loader.js +147 -0
package/dist/workflow-loader.js.map +1 -0
package/dist/workflow.js +656 -219
package/dist/workflow.js.map +1 -1
package/dist/workspace-types.js +8 -0
package/dist/workspace-types.js.map +1 -0
package/dist/workspace.js +367 -120
package/dist/workspace.js.map +1 -1
package/package.json +14 -6
package/scripts/vm-agent.mjs +211 -0
package/dist/agent/codex.js +0 -439
package/dist/agent/codex.js.map +0 -1
package/dist/agent/smolvm.js +0 -174
package/dist/agent/smolvm.js.map +0 -1
package/scripts/build-vm.sh +0 -67

package/WORKFLOW.template.md CHANGED Viewed

@@ -22,39 +22,385 @@ Notation:
 # tracker — where issues come from.
 # ─────────────────────────────────────────────────────────────────────────────
 tracker:
-  # kind (required): 'local' or 'linear'.
-  #   local  — markdown files under `root`, one per issue, organized by state.
-  #   linear — Linear API (workspace + project_slug).
+  # kind (required): currently the only supported value is 'local' (markdown
+  # files under `root`, one per issue, organized by state subdirectory).
   kind: local
-  # root (path): local-tracker only. Directory containing `<state>/<id>.md`
-  # files. Required when kind=local. Resolved relative to the workflow file
-  # if not absolute.
+  # root (path): directory containing `<state>/<id>.md` files. Required.
+  # Resolved relative to the workflow file if not absolute.
   root: ./issues
-  # endpoint (string): linear-tracker only. API endpoint.
-  # Default: Linear's public GraphQL endpoint.
-  endpoint: https://api.linear.app/graphql
-  # api_key (string): linear-tracker only. Personal API key. Required for
-  # kind=linear. Pulled from $LINEAR_API_KEY if you use `$LINEAR_API_KEY`.
-  api_key: $LINEAR_API_KEY
-  # project_slug (string): linear-tracker only. Required for kind=linear.
-  project_slug: my-team/my-project
+# ─────────────────────────────────────────────────────────────────────────────
+# states — per-state configuration map. REQUIRED. Every workflow must declare
+# at least one `active`, one `terminal`, and one `holding` state; a workflow
+# missing the `states:` block (or missing any of those roles) is rejected at
+# parse time. This map is the only place state names and roles are configured;
+# there are no separate active/terminal lists to keep in sync.
+#
+# Keys are state names; values are config objects with these fields:
+#   role (required, enum):
+#     active   — orchestrator dispatches issues in this state.
+#     terminal — orchestrator treats issues in this state as complete; the
+#                workspace is removed after the run unwinds.
+#     holding  — directory exists on disk, but the orchestrator never
+#                dispatches issues from it. Triage is the canonical example
+#                and the landing directory for `symphony.propose_issue`.
+#   adapter   (string, optional): override the workflow-level `acp.adapter` for
+#             agents dispatched in this state. Must be a known profile (claude,
+#             codex, opencode). All use host-side credential substitution at
+#             Gondolin egress and are startup-probed so a missing credential
+#             fails fast. Probe per adapter: claude has a single host
+#             credential file (~/.claude/.credentials.json) that is
+#             probed for readability; codex passes when either ~/.codex/auth.json
+#             holds a token (ChatGPT-OAuth tokens.access_token or a top-level
+#             OPENAI_API_KEY) or the host OPENAI_API_KEY env var is set; opencode
+#             passes when either ~/.local/share/opencode/auth.json holds a
+#             github-copilot token (run `opencode auth login` -> GitHub Copilot
+#             on the host) or a COPILOT_GITHUB_TOKEN/GH_TOKEN/GITHUB_TOKEN env
+#             var is set.
+#   model     (string, optional): override `acp.model` for this state.
+#             Blank or whitespace-only values normalize to "use the adapter
+#             default" (same as the workflow-level acp.model semantics).
+#   effort    (string, optional): override `acp.effort` for this state. Same
+#             undefined-vs-null semantics as `model`: omit to inherit
+#             `acp.effort`; blank/whitespace normalizes to null ("use the
+#             adapter default for this state"). Valid values are adapter- and
+#             model-specific (see `acp.effort`).
+#   max_turns (int, optional): override `agent.max_turns` for this state.
+#   max_concurrent (int, optional): cap on agents the orchestrator runs
+#             simultaneously for issues in THIS state. Symmetric with
+#             `max_turns` — concurrency and turn budget both live on the state.
+#             Omit for "no per-state cap; only the global
+#             `agent.max_concurrent_agents` ceiling applies". The sum of every
+#             state's `max_concurrent` must not exceed that global ceiling
+#             (validated at startup).
+#   allowed_transitions (string[]|null, optional): when set, restricts which
+#             states agents in this state may transition to via the MCP
+#             `transition` tool. Each entry must be a declared state. Omit (or
+#             explicitly set to null) for "any declared state is reachable".
+#             An empty list (`allowed_transitions: []`) means "no transitions
+#             allowed out of this state" — the agent's `transition` calls will
+#             always be rejected with `transition_not_allowed`. Useful for
+#             review-style states that should pause until a human re-routes.
+#   eval_mode (bool, optional): when true, the runner adds two extra read-only
+#             bind mounts to every per-issue VM dispatched in this state so an
+#             in-VM agent can inspect symphony's own state for evaluation /
+#             debugging:
+#               • `tracker.root` → `/symphony/issues` (every issue file across
+#                 every state directory)
+#               • `logs.root`    → `/symphony/logs`   (per-issue JSONL run-log
+#                 transcripts captured by RunLog — ACP frames, stderr,
+#                 typed-action output, system events — plus the compact
+#                 `<key>.summary.json` outcome records the reflector reads; see
+#                 the `logs:` block below)
+#             Either mount is skipped silently if the corresponding root is
+#             unset. Each VFS mount has a cost, so this is opt-in per state rather
+#             than a workflow-wide default — flip it on for a dedicated eval
+#             state, not for the routine implement/review flow. Default: false.
+#             The canonical consumer is the "sleep cycle" reflection pattern —
+#             see the SLEEP CYCLE section below the states block.
+#   actions   (list, optional): typed action DAG (issue 36, reconciler v2).
+#             The single glue mechanism attached to a state — there is no shell
+#             `hooks:` surface. When set on a `terminal` state, this list runs
+#             on transition INTO the state (the canonical Done-state pair is
+#             push_branch + create_pr_if_missing). For arbitrary in-sandbox
+#             commands use a `run_in_vm` action; per-VM tooling belongs in the
+#             agent image (`images/agents/`); first-creation workspace setup is
+#             owned by the orchestrator's `setupWorkspaceDir`.
+#             Each entry is a closed-kind record:
+#
+#                 - kind: push_branch
+#                   remote: origin
+#                   ref: $branch
+#                   if: $repo
+#
+#             Recognized kinds:
+#               push_branch          { remote, ref }
+#               create_pr_if_missing { base, head, title_from, body_from }
+#               ensure_branch        { name, seed_from? }
+#               checkout             { ref }
+#               merge                { source, target, on_conflict }
+#               delete_branch        { name, scope: local|remote|both, remote? }
+#               run_in_vm            { name, cmd: [...], env?, timeout? }
+#               propose_followup     { title, body?, labels?, priority? }
+#
+#             Templating: `$varname` references the fixed ActionContext
+#             namespace ($identifier, $workspace, $branch, $base_branch,
+#             $issue_title, $issue_body, $repo, $pr_title, $pr_body_file).
+#             Unknown $vars throw at run-time (no silent "" expansion).
+#
+#             Conditional: optional `if:` field supports three predicates
+#               - `if: $repo`                       (env-var-truthy)
+#               - `if: { branch_exists: <ref> }`    (workspace branch)
+#               - `if: { file_present: <path> }`    (workspace file)
+#
+#             Retry: optional `on_error.retry: { count, backoff_ms }`. Default
+#             policy is 3 retries with exponential backoff starting at 1s,
+#             then abort. `on_error.then: { route_to: <state> }` reroutes the
+#             issue to a holding state instead of aborting.
+#
+#             merge's `on_conflict: { route_to: <state> }` is a fast-path
+#             reroute. Use `on_conflict: abort` to fail the action and abort
+#             the cleanup pass without a state move.
+#
+#             run_in_vm has content-hash caching: identical (workspace tree
+#             ⊕ cmd ⊕ env) tuples skip execution and re-use the prior
+#             successful result. The workspace-tree hash reflects live
+#             contents (tracked + modified + untracked-not-gitignored), so
+#             an uncommitted agent edit forces a cache miss. Cache lives
+#             under `~/.cache/symphony/actions/run_in_vm/<name>/<sha256>/`.
+#             `symphony rerun --check=<name>` drops the whole `<name>/`
+#             namespace dir so the next dispatch re-runs that one check.
+#   pr        (map, optional): PR autopilot routing for this state (issue 139).
+#             Valid only on a `terminal` state, and only acts when the
+#             top-level `pr:` engine block (below) has `enabled: true`. The
+#             routing that the engine previously named by string now lives
+#             here, on the state it describes. Two shapes:
+#               • Merge state:  pr: { auto_merge: squash|merge|rebase,
+#                                     on_conflict: { route_to: <active state> } }
+#                 A MERGEABLE PR for an issue in this state has GitHub
+#                 auto-merge armed with `auto_merge`; a CONFLICTING one is
+#                 routed back to `on_conflict.route_to` (defaults to the first
+#                 declared active state when omitted) for the dispatched agent
+#                 to rebase. While the engine is enabled, transitions INTO this
+#                 state do not fire the standard terminal workspace cleanup —
+#                 the pr resource owns the workspace until the PR merges/closes.
+#               • Close state:  pr: { close: true }
+#                 An open PR for an issue in this state is closed without merge
+#                 and its remote branch is best-effort-deleted. Standard
+#                 terminal cleanup still runs (the close path needs no workspace).
+#             The merge/close/route targets are DERIVED by scanning states for
+#             this field — there is no named-string sibling block. At most one
+#             terminal state may declare `auto_merge`, and at most one may
+#             declare `close`; an `on_conflict.route_to` naming an undeclared
+#             state is rejected at parse time.
+#
+# Declaration order matters: role-filtered listings (active states, terminal
+# states) follow it, and the dashboard renders state columns in the same order.
+# ─────────────────────────────────────────────────────────────────────────────
+states:
+  Todo:
+    role: active
+    adapter: claude
+    model: claude-opus-4-7
+    effort: xhigh
+    max_turns: 10
+    max_concurrent: 1          # at most one implementer agent at a time
+  Review:
+    role: active
+    adapter: codex
+    model: gpt-5-codex
+    max_turns: 4
+    allowed_transitions: [Todo, Done]
+  Done:
+    role: terminal
+    # PR autopilot merge state (issue 139). Acts only when the top-level `pr:`
+    # engine block (below) is enabled. Derived as the merge state because it
+    # declares `auto_merge`.
+    # pr:
+    #   auto_merge: squash
+    #   on_conflict: { route_to: Todo }
+    # Terminal-state handoff via typed actions (issue 36). On transition into
+    # Done, push the branch (if SYMPHONY_REPO is set → $repo non-empty) and
+    # open a PR if one does not already exist. Templates resolve against the
+    # fixed ActionContext namespace; the orchestrator stages $pr_title and
+    # $pr_body_file from the issue file before firing.
+    # actions:
+    #   - { kind: push_branch, remote: origin, ref: $branch, if: $repo }
+    #   - kind: create_pr_if_missing
+    #     base: $base_branch
+    #     head: $branch
+    #     title_from: $pr_title
+    #     body_from: $pr_body_file
+    #     if: $repo
+  Cancelled:
+    role: terminal
+    # PR autopilot close state (issue 139). Derived as the close state because
+    # it declares `close: true` — an open PR is closed without merge.
+    # pr:
+    #   close: true
+  Triage:
+    role: holding
-  # active_states (string[]): states the orchestrator dispatches against.
-  # Default: [Todo, In Progress]
-  active_states:
-    - Todo
-    - In Progress
+# ─────────────────────────────────────────────────────────────────────────────
+# SLEEP CYCLE — a reflection state that mines finished work for harness
+# improvements (issue 122). Optional, opt-in pattern; layered on top of the
+# states block above. The shipped smol-symphony WORKFLOW.md wires it for the
+# dogfooding (symphony-on-symphony) setup.
+#
+# The idea: every dispatch starts from the same static prompt + config, no
+# matter what the last 100 issues taught us about where agents stall, get
+# rejected, burn their turn budget, or fight the harness. A periodic
+# "reflection" turn closes that feedback loop — it reads completed-task history
+# (the read-only mounts `eval_mode` exposes), distils *recurring* friction, and
+# files improvement proposals against the HARNESS (this WORKFLOW.md's prompt
+# branches and per-state model/max_turns/allowed_transitions/effort/actions, the
+# gondolin image config, acceptance criteria, timeouts) — never the product code under
+# review. Proposals land in Triage via `propose_issue`, so a human stays the
+# gate. This is the "self-improving agent" pattern aimed at the harness rather
+# than the product.
+#
+# Two states implement it:
+#
+#   Reflect (role: active, eval_mode: true):
+#     - eval_mode binds /symphony/issues (all state dirs, incl. the Done/*.md
+#       handoff transcripts) + /symphony/logs (per-issue JSONL run logs)
+#       read-only into the VM. No extra mount plumbing — it reuses the existing
+#       eval_mode mounts.
+#     - Give it a capable adapter/model (large context helps: a reflection turn
+#       reads many transcripts + logs) and a higher max_turns than your
+#       implement/review states.
+#     - allowed_transitions: [Dormant] — the reflector may ONLY go dormant. It
+#       cannot route itself into the implement/review/done flow. Filing
+#       improvements goes through propose_issue (→ Triage), which is independent
+#       of allowed_transitions.
+#     - The prompt body's `when "Reflect"` branch encodes the
+#       read → distil → propose loop and the GUARDRAILS below.
+#
+#   Dormant (role: holding):
+#     - Resting place for the single recurring "Sleep cycle" issue between runs.
+#       Holding → never dispatched. Declare it AFTER your Triage state so Triage
+#       stays the first holding state (the `propose_issue` landing and the triage
+#       approve/discard target both resolve to the FIRST declared holding state).
+#     - Dashboard caveat: the dashboard currently renders triage approve/discard
+#       buttons on every holding row, and the tracker resolves a move by issue
+#       id regardless of source directory — so clicking those buttons on a
+#       Dormant issue would mis-route it. Re-arm via cron/CLI/filesystem, not the
+#       dashboard buttons.
+#
+# GUARDRAILS (this is a self-modifying loop — keep the human in it):
+#   - Output is proposals into Triage (holding, never auto-dispatched). The
+#     operator approves/discards. Do not bypass this gate.
+#   - Constrain the proposal surface to harness config. Forbid any proposal that
+#     weakens the Review state, the test/lint gates, or the Triage gate itself.
+#   - Each proposal must cite the issue ids that motivated it, so the operator
+#     checks the lesson against the evidence rather than the reflector's summary.
+#
+# CADENCE (v1 — operator- or schedule-triggered; no orchestrator trigger logic):
+#   A single recurring issue (e.g. titled "Sleep cycle") oscillates Reflect ↔
+#   Dormant. The operator drops it into Reflect (dashboard, or `mv` on disk), or
+#   an external cron / a `symphony reflect` verb arms it. After it files
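+#   proposals it transitions to Dormant and waits to be re-armed. Auto-arm on
+#   idle (no active issues) or after N transitions into Done is not part of this
+#   manual cadence; it is configured with a per-state `arm:` block (see the
+#   SLEEP CYCLE (auto-arm) section below the `pr:` block).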
+#
+# Example states to add (names are yours to choose):
+#
+#   states:
+#     # ... your active/terminal states ...
+#     Reflect:
+#       role: active
+#       adapter: claude
+#       model: claude-opus-4-8[1m]   # large context for reading transcripts
+#       max_turns: 20                # higher than implement/review
+#       eval_mode: true
+#       allowed_transitions: [Dormant]
+#     Triage:
+#       role: holding                # declared before Dormant
+#     Dormant:
+#       role: holding
+# ─────────────────────────────────────────────────────────────────────────────
-  # terminal_states (string[]): states the orchestrator treats as complete;
-  # mark_done moves issues to the first listed state.
-  # Default: [Done]
-  terminal_states:
-    - Done
-    - Cancelled
+# ─────────────────────────────────────────────────────────────────────────────
+# pr — PR autopilot engine toggle: arm GitHub auto-merge when a terminal-state
+# PR is mergeable; route non-mergeable PRs back to the implementing state.
+#
+# Optional. This is the SLIM host-global half only — the on/off switch and the
+# per-PR `gh pr view` cache TTL. The merge/close/route targets and the
+# auto-merge strategy live ON the terminal states they describe, as
+# `states.<name>.pr` (see the `pr:` field doc in the states block above):
+#   • the MERGE state declares `pr: { auto_merge: <strategy>,
+#     on_conflict: { route_to: <active state> } }`
+#   • the CLOSE state declares `pr: { close: true }`
+# The reconciler derives the targets by scanning states for that field — there
+# is no named-string sibling block here.
+#
+# When `enabled: true` the reconciler grows a `pr` resource that, on every tick,
+# looks up each issue in the merge state via `gh pr list --head agent/<id>`,
+# fetches its detail with `gh pr view`, and:
+#
+#   • Arms GitHub's auto-merge when the PR is `mergeable: MERGEABLE`
+#     (`gh pr merge --auto --<strategy> --delete-branch`, where `<strategy>` is
+#     the merge state's `pr.auto_merge`). GitHub merges as soon as required
+#     checks pass and review requirements are satisfied.
+#   • When the PR is `mergeable: CONFLICTING`, appends a structured notes block
+#     to the issue file and routes the issue from the merge state back to that
+#     state's `pr.on_conflict.route_to` (default: the first declared
+#     `role: active` state). The workspace + `agent/<id>` branch are preserved.
+#     Before the next dispatch symphony runs `git fetch origin <base>` so
+#     `origin/<base>` is current, and the Todo prompt's first step is
+#     `git rebase origin/<base>` — resolving the conflict is the agent's normal
+#     flow, not an out-of-band autopilot operation.
+#   • For an issue in the close state with an open PR, closes the PR without
+#     merge and best-effort-deletes the remote branch.
+#
+# Requires `gh` authenticated on the host (`gh auth status` clean). The token
+# never enters the VM. Auto-merge ALSO requires at least one branch protection
+# rule on the base branch, or `gh pr merge --auto` will error — set one in
+# the repo's GitHub settings before flipping `enabled: true`.
+#
+# When `enabled: false` (or the block is absent) the autopilot is fully inert:
+# the resource is never constructed and the orchestrator's existing Done-state
+# behavior (workspace cleanup + the Done-state `actions:` block that pushes the
+# branch and opens the PR + operator-merge) is unchanged.
+#
+# Workspace lifecycle gotcha: when `enabled: true`, transitions into the merge
+# state no longer fire the standard terminal workspace cleanup. The pr resource
+# owns the workspace from that point on and removes it once the PR has merged
+# (or been closed). Transitions into the close state (and any other terminal
+# state) keep the standard cleanup-on-transition behavior.
+# ─────────────────────────────────────────────────────────────────────────────
+pr:
+  # enabled (bool): master switch. Default false.
+  enabled: false
+  # poll_interval_ms (int): per-PR GitHub view cache TTL, milliseconds. The
+  # reconciler may tick more often than this; a single PR view is reused
+  # within the window. Default 30000.
+  poll_interval_ms: 30000
+# ----------------------------------------------------------------------------
+# SLEEP CYCLE (auto-arm) — issue 140 moved this trigger ONTO the active state it
+# arms. The top-level `sleep_cycle:` block is deprecated (see MIGRATION below);
+# declare an `arm:` block on the active state (e.g. Reflect) in the `states:`
+# map above:
+#
+#   states:
+#     Reflect:
+#       role: active
+#       arm:
+#         issue: sleep-cycle      # the recurring issue to auto-enter this state
+#         from: Dormant           # the holding state it rests in between runs
+#         on_idle: true           # arm when idle with >=1 terminal since last run
+#         after_terminal: 10      # arm after N terminal transitions (0 disables)
+#
+# SEMANTICS (unchanged from the old sleep_cycle block):
+#   - on_idle: arm when the orchestrator is idle (nothing running, claimed, or
+#     pending retry, and no active candidate this poll) AND >=1 issue has reached
+#     a terminal state since the last run. The ">=1 since last run" gate is
+#     load-bearing: without it an idle orchestrator re-arms in a tight loop with
+#     nothing new to mine.
+#   - after_terminal: a backstop for busy stretches that never go idle — arm once
+#     this many issues have reached a terminal state (Done/Cancelled) since the
+#     last run. 0 disables the count trigger.
+# The terminal-transition counter resets to 0 the moment the issue is armed and
+# is held in orchestrator memory only (a restart resets it).
+#
+# VALIDATION (structural, from each state's own role — no dedicated re-validator):
+# `arm:` is only valid on an `active` state, `arm.from` must be a declared
+# `holding` state, `arm.issue` is required, and at most one active state may
+# declare `arm`.
+#
+# GUARDRAILS: arming ONLY moves the issue into the armed state. The proposals the
+# reflector files still land in Triage and still require human approve/discard —
+# arming does not bypass the human gate. Requires a single issue with id
+# `arm.issue` resting in `arm.from` (created by the operator); the trigger is
+# inert until that issue exists.
+#
+# MIGRATION: a deprecated top-level `sleep_cycle:` block is still parsed for one
+# release and folded onto states.<reflect_state>.arm (dormant_state -> from,
+# reflect_state -> the armed state, issue_id -> issue, arm_on_idle -> on_idle,
+# arm_after_done -> after_terminal) with a startup deprecation warning. Prefer
+# the per-state `arm:` block.
+# ----------------------------------------------------------------------------
 # ─────────────────────────────────────────────────────────────────────────────
 # polling — how often to poll the tracker.
@@ -72,59 +418,156 @@ workspace:
   # Default: $TMPDIR/symphony_workspaces
   root: ./.symphony/workspaces
+  # github_repo (string | null): the GitHub `owner/repo` slug symphony pushes the
+  # per-issue `agent/<id>` branch to and opens a PR against on the Done-state
+  # transition. This is the config-file home for what was previously the
+  # `SYMPHONY_REPO` env var only.
+  #   • unset / null / "none" → LOCAL-ONLY mode: no `origin` is restored, nothing
+  #     is pushed, and the branch is left in the workspace for `git log agent/<id>`.
+  #   • "owner/repo"          → PR mode: the canonical workspace setup restores an
+  #     `origin` at https://github.com/<owner>/<repo>.git and the Done-state
+  #     actions push + `gh pr create`. Requires `gh auth status` clean on the host
+  #     (the token never enters the VM).
+  # GitHub-only by construction (the origin URL and `gh` are hardwired). There is
+  # NO auto-detection — set the literal slug or leave it local-only. A malformed
+  # value (a URL, a bare name, extra slashes/whitespace) is REJECTED at parse time
+  # rather than silently falling back to local-only.
+  #
+  # Precedence: the `SYMPHONY_REPO` env var, when set non-empty, OVERRIDES this
+  # field (so existing exports keep working); otherwise this value is used.
+  # Default: null.
+  # github_repo: owner/repo
+  # base_branch (string): the branch the per-issue workspace clones from and
+  # (in PR mode) targets as the PR base. The source repo's local
+  # `<base_branch>` is the canonical base ref — symphony does NOT implicitly
+  # fetch `origin/<base_branch>` at setup time; update the source repo before
+  # the next dispatch to move the base.
+  # Precedence: the `SYMPHONY_BASE_BRANCH` env var, when set non-empty,
+  # OVERRIDES this field; otherwise this value is used.
+  # Default: main.
+  base_branch: main
 # ─────────────────────────────────────────────────────────────────────────────
-# hooks — shell scripts the orchestrator runs at workspace lifecycle points.
+# logs — per-issue JSONL run logs (everything to/from the VM, plus typed-action
+# output) AND the orchestrator-side text log mirrored to disk for offline debugging.
+#
+# Per-issue: one file per issue at `<root>/<sanitized-identifier>.jsonl`,
+# appended across attempts AND across symphony process restarts. Each line is
+# a self-describing JSON object with `ts`, `issue_id`, `attempt`, and a
+# `channel` discriminator:
+#
+#   channel: "acp"     — JSON-RPC frame between host and the in-VM adapter.
+#                        `direction` ("host_to_vm" | "vm_to_host") and `frame`
+#                        (parsed JSON) — or `kind: "unparseable"` + `raw`.
+#   channel: "stderr"  — raw byte chunk from the adapter / VM stderr.
+#   channel: "hook"    — stdout/stderr chunk from a terminal-state `actions:`
+#                        run, plus a final `kind: "result"` line (exit_code,
+#                        signal, timed_out). The `hook` field names the action
+#                        group (e.g. `actions`). (The channel name is a holdover
+#                        from the retired workflow-hook surface.)
+#   channel: "system"  — orchestrator lifecycle events (attempt_started — which
+#                        also carries the per-state `max_turns` budget,
+#                        attempt_ended, transition, reconciliation_terminating,
+#                        etc.). The `transition` event records each state move
+#                        (from_state, to_state, notes, actor, terminal,
+#                        rerouted) so the trajectory is reconstructable.
+#
+# Per-issue run summary (for the sleep-cycle reflector): alongside each
+# `<root>/<key>.jsonl`, the orchestrator writes a compact, versioned
+# `<root>/<key>.summary.json` at the issue's terminal unwind. It is a pure
+# REDUCTION over the lifecycle (`system`) events already in the JSONL — no extra
+# hot-path logging — so a reflection turn can read dozens of summaries without
+# re-parsing multi-MB frame logs. Fields (schema_version 1):
+#   • state_path        — states visited in order (a state can recur), terminal
+#                         appended (e.g. ["Todo","Review","Todo","Review","Done"]);
+#   • attempts          — total dispatched attempts;
+#   • per_state[]       — {state, attempts, turns_used, max_turns,
+#                         budget_exhausted, wall_clock_ms};
+#   • review_rejections + rejection_notes[] — count and each reviewer kick-back's
+#                         notes (a non-reroute transition back to the INITIAL
+#                         implementing state, i.e. a Review→Todo rework);
+#   • turn_budget_exhausted, timeouts[] (stall / prompt_timeout / transport);
+#   • conflict_routes[] — PR-autopilot / action reroutes (rebase churn);
+#   • terminal_state + terminal_outcome (completed | cancelled | incomplete);
+#   • pr_number / pr_url (best-effort, scraped from the Done-state actions
+#                         stdout; null when unavailable);
+#   • first/last_event_at, wall_clock_ms_total, generated_at.
+# Graceful absence / backfill: the summary is best-effort. Issues that closed
+# BEFORE this feature shipped have no `*.summary.json`; a write failure or a
+# mid-issue process restart (the in-memory accumulator only sees post-restart
+# attempts) can leave it missing or partial. The reflector MUST treat an absent
+# or partial summary as "no signal for this issue" and fall back to the raw
+# JSONL (or skip the issue) — never as an error. No backfill job is run; old
+# issues simply carry no summary.
 #
-# All hooks run on the HOST (not inside the VM), with cwd set to the per-issue
-# workspace path. Each hook is a multi-line shell snippet. Available env vars:
+# Orchestrator-side: a single `<root>/symphony.log` (created on demand) gets
+# every structured log line symphony emits — workflow loads, dispatch
+# decisions, action results, reconciler ticks, shutdown — in `key=value` text
+# format. Lets an agent reviewing a finished run (typically with
+# `.symphony/logs/` mounted into a VM) replay orchestrator-side events
+# alongside the per-issue JSONL traces in the same directory. Set the
+# `SYMPHONY_LOG_FILE` env var to override the path; set it to the empty
+# string to disable the file sink entirely (stderr remains).
 #
-#   PWD                  — the workspace directory (cwd at hook start).
-#   SYMPHONY_ISSUE_ID    — the issue identifier.
-#   SYMPHONY_ISSUE_STATE — the issue's current state.
-#   SYMPHONY_ATTEMPT     — 1-based attempt counter.
-#   SYMPHONY_WORKFLOW    — absolute path to the workflow file.
+# Console routing: while the file sink is active (the default), the structured
+# stream goes to the file ONLY — the console shows just the startup banner
+# (workflow, tracker root, dashboard URL, log-file path). `tail -f` the log
+# file to follow the detail. Pass `--verbose` (alias `--foreground`) to mirror
+# the structured stream back onto the console for interactive debugging. With
+# no file sink configured, the structured stream stays on stderr.
 #
-# Plus any env var the operator exports before launching `symphony`. The
-# common pattern is to plumb tracker root / repo / base via env so the same
-# workflow file works against multiple repos. See WORKFLOW.md for an example.
+# Intended for later evaluation — typically by another agent running inside a VM
+# — so the schema is verbose on purpose. Writes are best-effort: a failure to
+# write a log line never crashes the orchestrator.
+# ─────────────────────────────────────────────────────────────────────────────
+logs:
+  # root (path): directory holding per-issue JSONL files and symphony.log.
+  # Default: ./.symphony/logs
+  root: ./.symphony/logs
+# ─────────────────────────────────────────────────────────────────────────────
+# workspace lifecycle — no shell `hooks:` surface.
+#
+# Symphony has no `hooks:` block (workflow-level or per-state). The behaviors
+# the old `after_create` / `before_run` / `after_run` / `before_remove` hooks
+# covered now live in typed, testable homes:
+#
+#   • First-creation workspace setup (clone + base checkout + `agent/<id>`
+#     branch cut + origin/identity) is owned by the orchestrator's TypeScript
+#     `setupWorkspaceDir`. The workspace arrives at the agent with: a hardlinked
+#     `git clone --local --no-tags` of the source repo (`SYMPHONY_SOURCE_REPO`,
+#     default: the dir containing WORKFLOW.md) on the base branch
+#     (`workspace.base_branch`, or the `SYMPHONY_BASE_BRANCH` env override;
+#     default `main`); all network remotes stripped; an
+#     `origin` restored to the canonical HTTPS URL when `workspace.github_repo`
+#     (or the `SYMPHONY_REPO` env override) is set (so the Done-state push can
+#     reach a remote — `gh auth setup-git` runs host-side; the token never
+#     enters the VM); pinned `--local` git identity;
+#     and `agent/<id>` checked out off the base SHA.
+#   • Per-VM tooling (extra CLIs, language runtimes, dependency bootstrap) is
+#     baked into the agent image — see `gondolin.image` and `images/agents/`.
+#   • Arbitrary in-sandbox commands run from a state's `actions:` via a
+#     `run_in_vm` action (executes inside the per-issue VM, not on the host).
+#   • The post-attempt handoff (push branch, open PR) is the Done state's
+#     `actions:` block — see `states.Done.actions` above for the canonical pair
+#     (push_branch + create_pr_if_missing). The action executor exposes
+#     `$branch`, `$base_branch`, `$pr_title`, `$pr_body_file`, `$repo`.
+#
+# Workspace removal is a plain best-effort `rm -rf` of the per-issue dir once
+# the run unwinds; there is no pre-removal artifact-rescue hook (rescue what you
+# need via a terminal-state action before transitioning).
 # ─────────────────────────────────────────────────────────────────────────────
-hooks:
-  # timeout_ms (int): max wall time for a single hook invocation.
-  # Default: 60000
-  timeout_ms: 120000
-  # after_create (string | null): runs right after the workspace directory is
-  # created, before the first dispatch. Use for git clone, dependency install,
-  # etc. Default: null.
-  after_create: |
-    set -eu
-    # ... your setup ...
-  # before_run (string | null): runs before each turn. Default: null. Use for
-  # cheap "make sure the workspace is sane" checks; expensive setup belongs in
-  # after_create.
-  before_run: |
-    set -eu
-    # ... pre-turn checks ...
-  # after_run (string | null): runs after each turn, regardless of outcome.
-  # Inspect cwd or the tracker to decide whether work is complete. Default: null.
-  after_run: |
-    set -eu
-    # ... post-turn handoff (push, format-patch, …) ...
-  # before_remove (string | null): runs before the workspace directory is
-  # deleted. Use to extract artifacts you want to keep. Default: null.
-  before_remove: |
-    set -eu
-    # ... rescue artifacts ...
 # ─────────────────────────────────────────────────────────────────────────────
 # agent — concurrency and turn budget.
 # ─────────────────────────────────────────────────────────────────────────────
 agent:
-  # max_concurrent_agents (int): cap on simultaneously-running agents across
-  # the whole workflow. Default: 10
+  # max_concurrent_agents (int): GLOBAL host ceiling on simultaneously-running
+  # agents across the whole workflow. This is the cross-state RAM bound that
+  # memory admission clamps (see memory_admission_enabled below); the sum of
+  # every state's `max_concurrent` is validated against it at startup. It stays
+  # top-level — not on a state — because it bounds total host memory across all
+  # VMs at once. Default: 10
   max_concurrent_agents: 2
   # max_turns (int): hard ceiling on autonomous turns per issue. Steering-reply
@@ -135,27 +578,120 @@ agent:
   # after recoverable failures. Default: 300000
   max_retry_backoff_ms: 120000
-  # max_concurrent_agents_by_state (map<string, int>): optional per-state
-  # concurrency cap. Sums must not exceed max_concurrent_agents. Default: {}.
-  max_concurrent_agents_by_state:
-    Todo: 1
-    In Progress: 1
+  # memory_admission_enabled (bool): when true, before each dispatch the
+  # orchestrator reads `/proc/meminfo` (MemAvailable) and clamps the effective
+  # concurrency cap to what currently fits at `gondolin.mem_mib` per VM after
+  # subtracting `host_memory_reserve_mib`. This is a defense-in-depth backstop
+  # for hosts where the static `max_concurrent_agents` is set generously: when
+  # MemAvailable drops, new dispatches are gated so a misconfigured cap can't
+  # walk the host into OOM (issue 27). On hosts without `/proc/meminfo`
+  # (macOS, BSD) the probe degrades gracefully and the static cap is used
+  # unchanged. Default: true.
+  memory_admission_enabled: true
+  # host_memory_reserve_mib (int): headroom (MiB) the memory admission cap
+  # keeps for the orchestrator process itself, the per-VM Gondolin runners, and
+  # the kernel's own working set. Only consulted when
+  # `memory_admission_enabled` is true. Raise on hosts with heavy non-symphony
+  # workloads; lower on dedicated worker hosts. Default: 2048.
+  host_memory_reserve_mib: 2048
+  # circuit_breaker_threshold (int): after this many CONSECUTIVE dispatch
+  # attempts fail with the *same* (normalized) reason, the orchestrator stops
+  # retrying the issue and routes it to a holding state (the first declared
+  # `role: holding` state) for a human to inspect, instead of looping forever
+  # on a deterministically-failing dispatch (issue 128 — a persistent
+  # `401 invalid_api_key` once looped ~324 attempts over ~13h). The streak
+  # resets the moment an attempt fails with a different reason or exits
+  # cleanly, so transient/varied failures still retry under the normal backoff
+  # (`max_retry_backoff_ms`). The tripped issue's body gets a diagnostic note
+  # explaining the trip so the dashboard shows "stuck on identical failure"
+  # rather than a silent loop. Set to 0 to disable; must otherwise be >= 2
+  # (1 would trip on the first failure, never retrying). Default: 5.
+  circuit_breaker_threshold: 5
 # ─────────────────────────────────────────────────────────────────────────────
 # acp — Agent Client Protocol adapter selection.
 # ─────────────────────────────────────────────────────────────────────────────
 acp:
-  # adapter (string): one of symphony's known profiles. The profile encodes the
-  # binary to launch and the host credential file to stage. Default: 'claude'.
-  #   claude   — claude-agent-acp; stages ~/.claude/.credentials.json
-  #   codex    — codex-acp;        stages ~/.codex/auth.json
+  # adapter (string): one of symphony's known profiles. Default: 'claude'.
+  #   claude   — claude-agent-acp. The guest holds a placeholder bearer; the host
+  #              substitutes the real Anthropic OAuth token at Gondolin egress.
+  #              No real credential enters the VM.
+  #   codex    — codex-acp (issue 116). Same model: the guest holds a placeholder
+  #              bearer (in a fake ~/.codex/auth.json); the host substitutes the
+  #              real OpenAI/ChatGPT token at egress. No real credential — and no
+  #              real OPENAI_API_KEY — enters the VM.
+  #   opencode — opencode acp, backed by GitHub Copilot (issue 130). The host
+  #              exchanges the operator's `opencode auth login` GitHub OAuth token
+  #              for a short-lived Copilot token host-side and substitutes it at
+  #              egress — the GitHub token never enters the VM. One Copilot
+  #              credential unlocks many models (GPT-4o/4.1, Claude Sonnet,
+  #              Gemini, o-series, …).
   adapter: claude
-  # command (string | null): optional shell override. When set, replaces the
-  # auto-generated launch command and OPTS OUT of credential staging — you
-  # become responsible for placing whatever credentials the adapter needs.
-  # Leave null for the supported zero-config flow. Default: null.
-  command: null
+  # Credentials never enter the VM (issue 113; codex generalized in 116). The
+  # guest holds only a token-shaped placeholder; on every outbound request the
+  # host substitutes the real upstream credential at Gondolin egress (TLS-MITM,
+  # see src/agent/credential-secrets.ts). The real refresh/durable token always
+  # stays host-side.
+  #
+  # For claude: the host reads the live access token from
+  # ~/.claude/.credentials.json (refreshing host-side via `claude -p "ok"` under
+  # flock when the cache is stale) and injects it at egress to api.anthropic.com.
+  # A minimal ~/.claude.json is staged for identity only — NO refreshToken, NO
+  # accessToken on the VM.
+  #
+  # For codex: the host reads the live credential (`tokens.access_token` from
+  # ~/.codex/auth.json, with an OPENAI_API_KEY env fallback — NEVER the refresh
+  # token) and injects it at egress to chatgpt.com / api.openai.com. A COMPLETE
+  # fake ~/.codex/auth.json is staged (JWT-shaped placeholder tokens + the
+  # non-secret account_id/auth_mode/last_refresh codex's completeness check needs),
+  # so codex-acp runs in its native mode without an in-VM OAuth handshake or
+  # refresh (both stay host-side). Every credential-bearing var is stripped from
+  # the forwarded VM boot env.
+  #
+  # For opencode: a staged opencode.json (at /root/.config/opencode/opencode.json)
+  # declares a custom @ai-sdk/openai-compatible provider whose baseURL/apiKey read
+  # the OPENCODE_PROXY_* env vars (a `gho_`-shaped placeholder bearer). The host
+  # reads the durable GitHub OAuth token from ~/.local/share/opencode/auth.json
+  # (COPILOT_GITHUB_TOKEN/GH_TOKEN/GITHUB_TOKEN env fallback), exchanges it
+  # host-side at api.github.com/copilot_internal/v2/token for a short-lived Copilot
+  # token (cached + TTL-refreshed before expiry), injects the Copilot editor
+  # headers, and substitutes it at egress to api.githubcopilot.com. The durable
+  # GitHub token never enters the VM — so do NOT also list it in
+  # `gondolin.forward_env`. See docs/research/opencode-copilot-accept-matrix.md.
+  # model (string | null): optional model selector forwarded to the chosen adapter.
+  # Each adapter profile knows how to surface it natively:
+  #   claude  — exported as ANTHROPIC_MODEL on the adapter process. Accepts anything
+  #             claude-agent-acp would (aliases like "opus", "sonnet", or full IDs
+  #             like "claude-opus-4-7").
+  #   codex   — passed as `-c model="<value>"` argv to codex-acp (parsed as TOML).
+  #   opencode— baked into the staged opencode.json as model="symphony-copilot/<value>".
+  #             Use a Copilot chat-completions model id (e.g. gpt-4o, gpt-4.1,
+  #             claude-sonnet-4.5, gemini-2.5-pro); codex-class models served only
+  #             on Copilot's /responses path are NOT reachable. Adapter default: gpt-4o.
+  # Leave unset / null to use the adapter's own default model. Default: null.
+  # model: claude-opus-4-7
+  # effort (string | null): optional reasoning-effort lever forwarded to the chosen
+  # adapter. Profile-specific surface:
+  #   claude  — written into a staged `settings.json` ({"effortLevel": "<value>"})
+  #             copied to /root/.claude/settings.json in the VM before claude-agent-acp
+  #             starts. Valid values are `low|medium|high|xhigh|max`, gated per-model
+  #             by claude-agent-acp's `supportedEffortLevels` (Opus supports `xhigh` and
+  #             `max`; Haiku does not). Symphony does not validate the value — the
+  #             adapter rejects unsupported choices at startup, which keeps symphony
+  #             from drifting from the adapter's own supported list.
+  #   codex   — not wired (codex-acp has no first-class effort knob on the wrapper);
+  #             setting `acp.effort` for a codex-backed state is a no-op.
+  # Leave unset / null for the adapter's own default. Default: null.
+  # effort: xhigh
+  # NOTE: the launch shape is fixed (an in-VM agent dials back over the bridge
+  # and spawns the chosen adapter). Customizing what the agent spawns requires
+  # forking that agent and rebuilding the VM image with the fork in place.
   # shell (string): shell used to run the ACP launch command. Default: 'bash'.
   shell: bash
@@ -173,18 +709,69 @@ acp:
   # the turn is killed and retried. Default: 300000
   stall_timeout_ms: 300000
+  # bridge — host-side TCP listener the in-VM agent dials back to for ACP traffic.
+  #
+  # This replaced the earlier in-VM-exec stdio path. Symphony writes ACP JSON-RPC frames
+  # onto an authenticated TCP socket; the in-VM agent (`/opt/symphony/vm-agent.mjs`)
+  # spawns the adapter via `child_process.spawn` with kernel pipes and bridges the
+  # socket to the adapter's stdio. This decouples symphony from any particular
+  # sandbox's stdio quirks — any sandbox that can launch a process with env vars and
+  # reach the host loopback works unchanged.
+  bridge:
+    # bind_host (string): host symphony binds the listener on. 0.0.0.0 allows any
+    # in-VM interface to reach the host loopback (Gondolin maps a synthetic guest host to
+    # host loopback transparently). Default: 0.0.0.0
+    bind_host: 0.0.0.0
+    # bind_port (int): port symphony binds the listener on. 0 picks an ephemeral
+    # port (the bound port is exposed via the in-VM SYMPHONY_ACP_URL env var). Default: 8788
+    bind_port: 8788
+    # reach_host (string): host the in-VM agent dials back to. Under Gondolin this is
+    # 127.0.0.1 because the guest loopback hits the host loopback. Other sandboxes
+    # may need a different alias. Default: 127.0.0.1
+    reach_host: 127.0.0.1
+    # reach_url (string|null): full URL override for the in-VM agent's dial
+    # destination, e.g. through a reverse proxy or different scheme. When null,
+    # symphony constructs `tcp://<reach_host>:<bind_port>`. Default: null
+    # reach_url: null
+    # connect_timeout_ms (int): how long to wait for the in-VM agent to connect after
+    # the sandbox is launched, before failing the attempt. Default: 30000
+    connect_timeout_ms: 30000
 # ─────────────────────────────────────────────────────────────────────────────
-# smolvm — microVM execution environment.
+# credentials — host credential lifecycle (issue 113). The host substitutes the
+# real OAuth access token into each VM's outbound request at Gondolin egress; the
+# ticker keeps the host's cached access token warm by periodically running
+# `claude -p "ok"` — Claude Code's own OAuth path detects the stale token,
+# refreshes against Anthropic, and atomically writes the rotated tuple back to
+# `~/.claude/.credentials.json`. Symphony never implements OAuth; Anthropic's own
+# client does.
 # ─────────────────────────────────────────────────────────────────────────────
-smolvm:
-  # from (path | null): path to a packed .smolmachine.smolmachine artifact.
-  # Built once with `scripts/build-vm.sh`. Mutually exclusive with `image`.
-  # Default: null.
-  from: ./.vm/symphony.smolmachine.smolmachine
+credentials:
+  # ticker_interval_ms (int): how often the host ticker spawns `claude -p "ok"`
+  # to refresh the OAuth cache. Each live VM also refreshes proactively before its
+  # cached token expires, so the ticker is a belt-and-braces backstop for idle periods.
+  # Set to 0 to disable the in-symphony ticker entirely (operator runs their own
+  # systemd timer instead). Default: 21600000 (6 hours).
+  ticker_interval_ms: 21600000
-  # image (string | null): container image to pull instead of a packed artifact.
-  # Mutually exclusive with `from`. Default: null.
-  image: null
+# ─────────────────────────────────────────────────────────────────────────────
+# gondolin — microVM execution environment (Gondolin substrate).
+# ─────────────────────────────────────────────────────────────────────────────
+gondolin:
+  # image (string | null): the agent rootfs the VM boots, expressed as a Gondolin
+  # image selector. Build it ONCE with `npm run build:image` (see images/agents/) —
+  # the build prints a content-addressed build id (a digest); pin that id here for
+  # an immutable, reproducible reference. A `name:tag` ref (e.g.
+  # `symphony-agents:latest`) or a path to an exported asset directory also work.
+  # The image bakes a Node.js runtime, every ACP-capable coding agent
+  # (claude-agent-acp, codex-acp, opencode), and the in-VM launcher at
+  # /opt/symphony/vm-agent.mjs — so dispatch needs no runtime mounts. REQUIRED:
+  # the runner fails fast at boot when this is unset. Default: null.
+  image: symphony-agents:latest
   # cpus (int): vCPU count per VM. Default: 2.
   cpus: 2
@@ -192,19 +779,12 @@ smolvm:
   # mem_mib (int): RAM per VM in MiB. Default: 2048.
   mem_mib: 4096
-  # net (bool): whether the VM has outbound networking. Default: true.
-  # Setting false isolates the VM at the cost of breaking adapters that fetch
-  # tokens, models, or dependencies at run time.
-  net: true
-  # bin_path (path | null): legacy mount; host directory containing the codex
-  # binary, mounted read-only at /opt/codex. Default: null.
-  bin_path: null
-  # volumes (list): additional host:guest bind mounts. smolvm has a small
-  # per-VM mount cap (the workspace itself already consumes one slot), so keep
-  # this list small. Each entry: { host: path, guest: path, readonly?: bool }.
-  # Default: [].
+  # volumes (list): additional host:guest VFS mounts beyond the auto-mounted
+  # workspace. Gondolin's VFS is programmable (no hard per-VM mount cap), but keep
+  # this lean — if ANY state sets `eval_mode: true` it adds two read-only mounts
+  # (/symphony/issues + /symphony/logs) on top of the workspace. Prefer baking
+  # static tooling into the image over a runtime mount. Each entry:
+  # { host: path, guest: path, readonly?: bool }. Default: [].
   volumes:
     - host: ~/.cache/npm
       guest: /root/.npm
@@ -212,13 +792,42 @@ smolvm:
   # forward_env (string[]): host env vars forwarded into the VM exec.
   # Default: [OPENAI_API_KEY, ANTHROPIC_API_KEY]
+  # NOTE: the runner strips EVERY credential-bearing var from the forwarded boot
+  # env before launch — the guest holds only a token-shaped placeholder that
+  # Gondolin substitutes with the real token at egress — so listing a credential
+  # var here does NOT plant the real key in the VM's PID-1 env.
   forward_env:
     - OPENAI_API_KEY
     - ANTHROPIC_API_KEY
-  # endpoint (string): smolvm server. unix:// or http:// URI.
-  # Default: unix://$XDG_RUNTIME_DIR/smolvm.sock (or /run/user/1000/smolvm.sock)
-  endpoint: unix:///run/user/1000/smolvm.sock
+# ─────────────────────────────────────────────────────────────────────────────
+# egress — general dev-tooling firewall for the in-VM agent.
+#
+# Gondolin denies guest egress to non-allowlisted hosts by default. The agent can
+# always reach its own inference host (that is handled by the credential layer,
+# which substitutes the real upstream token at egress). This block additionally
+# opens the dev-tooling hosts the agent needs so gates can run inside the VM —
+# `npm install`, git-based dependencies, release-binary downloads.
+#
+# SECURITY: this is the firewall ONLY. No credential is ever substituted for a host
+# listed here — the real token substitutes solely on each adapter's inference host
+# (see src/agent/credential-secrets.ts `substitutionHosts`). The effective
+# per-adapter allowlist handed to Gondolin is THIS list UNION that adapter's
+# substitution host(s). Listing a host therefore grants plain network egress, never
+# a token. Keep the list tight — every entry widens the network surface of
+# semi-trusted in-VM code.
+# ─────────────────────────────────────────────────────────────────────────────
+egress:
+  # allowed_hosts (string[]): hostnames the in-VM agent may reach for dev tooling.
+  # Default: [] (no extra hosts — the agent can reach only its inference host).
+  # Bare hostnames ONLY — no scheme, port, or path (`github.com`, not
+  # `https://github.com/...`). A malformed entry fails safe (the host simply stays
+  # blocked, never opened). Each entry is matched against the request host exactly.
+  allowed_hosts:
+    - registry.npmjs.org             # npm install
+    - github.com                     # git-based deps / release pages
+    - codeload.github.com            # GitHub tarball fetch
+    - objects.githubusercontent.com  # release-binary downloads
 # ─────────────────────────────────────────────────────────────────────────────
 # server — HTTP dashboard + MCP endpoint listener.
@@ -236,11 +845,24 @@ server:
 # mcp — Model Context Protocol server exposed to in-VM agents.
 #
 # The orchestrator runs a JSON-RPC endpoint scoped to each active issue at
-# /api/v1/issues/<id>/mcp, gated by a per-dispatch bearer token. Two tools live
-# there:
+# /api/v1/issues/<id>/mcp, gated by a per-dispatch bearer token. Three tools
+# live there:
 #
-#   • symphony.mark_done({ title, summary })
+#   • symphony.transition({ to_state, notes? })
+#     — canonical (and only) exit verb. Moves the issue into another declared
+#       state, optionally appending `notes` (markdown) to the issue body before
+#       the move so the next agent (in `to_state`) reads them as part of
+#       `issue.description`. Terminal targets clean the workspace; active and
+#       holding targets preserve it so the same `agent/<id>` git branch
+#       survives the handoff. Rejected transitions return MCP tool-result
+#       errors (isError:true) the agent can read and retry.
 #   • symphony.request_human_steering({ question, context? })
+#   • symphony.propose_issue({ title, description?, labels?, priority? })
+#     — drops a new issue into the first declared `role: holding` state
+#       directory (literal Triage if none declared). The orchestrator does NOT
+#       dispatch it; the operator approves or discards from the dashboard. The
+#       calling issue is recorded as proposed_by in the new file's
+#       front-matter.
 # ─────────────────────────────────────────────────────────────────────────────
 mcp:
   # enabled (bool): when false, the orchestrator refuses to dispatch (MCP is
@@ -248,8 +870,8 @@ mcp:
   enabled: true
   # host (string): hostname or IP the agent uses to reach the orchestrator
-  # from inside the smolvm. The port is resolved at runtime from the
-  # actually-bound HTTP server. Default: '127.0.0.1' (smolvm proxies VM
+  # from inside the VM. The port is resolved at runtime from the
+  # actually-bound HTTP server. Default: '127.0.0.1' (Gondolin maps VM
   # loopback to host loopback; verified empirically).
   host: 127.0.0.1
@@ -264,17 +886,27 @@ Liquid-templated prompt body. Rendered once per dispatched issue. Context:
   issue.identifier   — the issue's external id (e.g. "DEMO-42").
   issue.title        — issue title (string).
-  issue.state        — current state (string, matches active_states[]).
-  issue.description  — body text (string or empty).
+  issue.state        — current state (string, matches a key in `states:`).
+  issue.description  — body text (string or empty). `symphony.transition`
+                       appends its `notes` block here before the file moves,
+                       so the next state's agent reads the previous state's
+                       handoff message verbatim.
   issue.priority     — number or null.
   issue.labels       — list of strings (lowercased).
   attempt            — int, 1-based attempt counter; absent on first attempt.
 Available Liquid filters: standard Shopify Liquid plus `escape_once`.
+Per-state prompt branching (V1 pattern): when `states:` declares more than
+one state with `role: active` (e.g. Todo + Review), wrap the state-specific instructions in
+a `{% case issue.state %}` / `{% when "..." %}` / `{% else %}` block. The
+runner renders the prompt fresh on every dispatch, so each state's agent sees
+only its own instructions plus whatever common preamble / postamble lives
+outside the case. See WORKFLOW.md in this repo for a worked example.
 The body below is the literal prompt sent to the agent. Keep it specific to
-this workflow; orchestrator behavior (mark_done, request_human_steering) is
-the same no matter what you write here.
+this workflow; orchestrator behavior (transition, request_human_steering,
+propose_issue) is the same no matter what you write here.
 -->
 You are picking up a single issue and shepherding it through the workflow.
@@ -294,12 +926,20 @@ Goals:
 1. Work in the current directory only; treat it as the issue workspace.
 2. Make the smallest correct change that satisfies the issue.
-3. Call `symphony.mark_done({ title, summary })` when done. This is the only
-   way to signal completion. The orchestrator atomically moves the issue file
-   to the terminal state and stops dispatching.
+3. Hand off when done. `symphony.transition({ to_state, notes? })` is the
+   canonical (and only) exit verb: pass a declared state name and optional
+   markdown notes that get appended to the issue body for the next agent.
+   For single-agent workflows, transition straight into the first declared
+   `role: terminal` state to end the run.
 4. If you cannot proceed without human input, call
    `symphony.request_human_steering({ question, context? })`. Your turn ends
    immediately; the human's reply arrives as your next prompt.
+5. If you notice work out of scope for this issue — unrelated bugs, follow-ups
+   a human should size, refactors worth a separate dispatch — call
+   `symphony.propose_issue({ title, description?, labels?, priority? })`. It
+   lands in the first declared `role: holding` state directory (defaults to
+   `Triage/`); the operator approves or discards. Do not graft unrelated
+   edits onto this branch.
 {% if attempt -%}
 This is continuation/retry attempt {{ attempt }}. Inspect the workspace before