npm - loki-mode - Versions diffs - 7.30.0 → 7.32.0 - Mend

loki-mode 7.30.0 → 7.32.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

package/README.md +4 -2
package/SKILL.md +2 -2
package/VERSION +1 -1
package/autonomy/context-tracker.py +8 -0
package/autonomy/loki +799 -123
package/autonomy/mcp-launch.sh +149 -36
package/autonomy/run.sh +168 -4
package/bin/loki +71 -0
package/dashboard/__init__.py +1 -1
package/dashboard/server.py +326 -1
package/dashboard/static/index.html +105 -39
package/docs/INSTALLATION.md +1 -1
package/docs/competitive/replit-lovable-analysis.md +1 -1
package/loki-ts/data/model-pricing.json +1 -0
package/loki-ts/dist/loki.js +233 -231
package/mcp/__init__.py +1 -1
package/mcp/_sdk_loader.py +157 -0
package/mcp/lsp_proxy.py +61 -61
package/mcp/server.py +35 -129
package/package.json +1 -1
package/providers/claude.sh +76 -19
package/providers/model_catalog.json +9 -0
package/skills/model-selection.md +49 -1

package/autonomy/mcp-launch.sh CHANGED Viewed

@@ -26,10 +26,20 @@
 #   * The ONLY command run on the user's behalf is, after explicit consent:
 #       <venv>/bin/pip install -r mcp/requirements.txt
 #     The exact command is printed before it runs.
-#   * Non-interactive / CI: NEVER install. Print the manual command to stderr
-#     and exit 2 (mirrors autonomy/provider-offer.sh gate semantics).
+#   * Non-interactive / CI: NEVER install by default. Print the manual command
+#     to stderr and exit 2 (mirrors autonomy/provider-offer.sh gate semantics).
+#     EXCEPTION: setting LOKI_MCP_AUTO_BOOTSTRAP (1/true/yes/on,
+#     case-insensitive) is written consent given via the environment. MCP
+#     clients (Claude Desktop etc.) spawn the server non-interactively over piped
+#     stdio; a user who writes LOKI_MCP_AUTO_BOOTSTRAP=1 into their client config
+#     has consented in advance. On that flag, a missing-SDK non-TTY launch
+#     bootstraps the venv exactly like the interactive consent path, but with ALL
+#     progress on STDERR (stdout stays clean for JSON-RPC: the client is already
+#     attached to it), then execs the server. LOKI_NO_INSTALL_OFFER=1 still wins
+#     (explicit no beats explicit yes).
 #   * Opt-out: LOKI_NO_INSTALL_OFFER=1 -> never prompt, print manual command,
 #     exit 2. --yes / LOKI_ASSUME_YES / LOKI_AUTO_CONFIRM=true -> auto-accept.
+#     LOKI_MCP_AUTO_BOOTSTRAP=1 -> non-interactive written consent (see above).
 #
 # Self-containment: depends only on bash builtins + python3 on PATH. Defines
 # its own colors so it behaves identically whether sourced by autonomy/loki or
@@ -58,10 +68,20 @@ _ml_repo_root() {
     (cd "$self_dir/.." && pwd)
 }
+# _ml_truthy <value>: true (0) when the value is a conventional affirmative
+# spelling (1/true/yes/on), case-insensitive. Centralizes consent parsing so
+# every knob accepts the same spellings rather than each hard-coding "1".
+_ml_truthy() {
+    case "$(printf '%s' "${1:-}" | tr '[:upper:]' '[:lower:]')" in
+        1|true|yes|on) return 0 ;;
+        *) return 1 ;;
+    esac
+}
 # _ml_assume_yes: true when the user opted into unattended confirmation.
 _ml_assume_yes() {
-    [ "${LOKI_ASSUME_YES:-}" = "1" ] && return 0
-    [ "${LOKI_AUTO_CONFIRM:-}" = "true" ] && return 0
+    _ml_truthy "${LOKI_ASSUME_YES:-}" && return 0
+    _ml_truthy "${LOKI_AUTO_CONFIRM:-}" && return 0
     return 1
 }
@@ -93,15 +113,22 @@ _ml_python() {
 # `--check-sdk` probe, which runs the exact loader the server uses and exits 0
 # only when FastMCP loaded.
 #
-# Critical: we set PYTHONPATH to the install root and DO NOT cd into it, so the
-# probe exercises the SAME module resolution as the real launch (which preserves
-# the user's cwd). The redirect of stdin from /dev/null is insurance: if the
-# pip SDK's own `mcp.server` were ever reached, its stub starts a stdio receive
-# loop; the EOF makes it exit instead of hanging.
+# Critical: we probe with the SAME FILE-EXEC form the launch uses
+# (`"$root/mcp/server.py"`, NOT `-m mcp.server`), with PYTHONPATH set to the
+# install root and WITHOUT cd-ing into it, so the probe exercises byte-identical
+# module resolution to the real launch (which preserves the user's cwd). This
+# matters because `-m mcp.server` puts the user's cwd at sys.path[0] AHEAD of
+# PYTHONPATH=$root, so a cwd that happens to contain a regular `mcp/` python
+# package would shadow Loki's server during the probe (false SDK-missing) while
+# the file-exec launch -- immune to cwd shadowing -- would succeed. Probing by
+# file path keeps probe and launch resolving the IDENTICAL module. The redirect
+# of stdin from /dev/null is insurance: if the pip SDK's own `mcp.server` were
+# ever reached, its stub starts a stdio receive loop; the EOF makes it exit
+# instead of hanging.
 _ml_sdk_importable() {
     local py="$1" root="$2"
     PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" \
-        "$py" -m mcp.server --check-sdk </dev/null >/dev/null 2>&1
+        "$py" "$root/mcp/server.py" --check-sdk </dev/null >/dev/null 2>&1
 }
 # _ml_print_manual <root> <venv>: print the honest manual install commands.
@@ -109,10 +136,13 @@ _ml_sdk_importable() {
 # requirements.txt is shipped under the install root.
 _ml_print_manual() {
     local root="$1" venv="$2"
+    # Display-only quoting: single-quote the substituted paths so the printed
+    # commands copy-paste correctly even when the project root or venv path
+    # contains spaces. This is presentation only; nothing is executed here.
     printf 'Install the MCP server dependencies manually:\n' >&2
-    printf '  python3 -m venv %s\n' "$venv" >&2
-    printf '  %s/bin/pip install -r %s/mcp/requirements.txt\n' "$venv" "$root" >&2
-    printf '  PYTHONPATH=%s %s/bin/python -m mcp.server\n' "$root" "$venv" >&2
+    printf "  python3 -m venv '%s'\n" "$venv" >&2
+    printf "  '%s/bin/pip' install -r '%s/mcp/requirements.txt'\n" "$venv" "$root" >&2
+    printf "  PYTHONPATH='%s' '%s/bin/python' '%s/mcp/server.py'\n" "$root" "$venv" "$root" >&2
 }
 _ml_help() {
@@ -135,27 +165,73 @@ Options:
   --help, -h              Show this help and exit.
 Environment:
-  LOKI_MCP_VENV=/abs/path   Use a custom venv location instead of .loki/mcp-venv.
-  LOKI_NO_INSTALL_OFFER=1   Never prompt to install; print the manual command.
-  --yes / LOKI_ASSUME_YES=1 Auto-accept the dependency install.
+  LOKI_MCP_VENV=/abs/path     Use a custom venv location instead of .loki/mcp-venv.
+  LOKI_NO_INSTALL_OFFER=1     Never prompt to install; print the manual command.
+                              Wins over LOKI_MCP_AUTO_BOOTSTRAP (explicit no beats
+                              explicit yes).
+  LOKI_MCP_AUTO_BOOTSTRAP=1   Written consent for non-interactive bootstrap. MCP
+                              clients (Claude Desktop etc.) spawn the server over
+                              piped stdio with no TTY; set this in your client
+                              config to authorize the one-time venv bootstrap when
+                              the SDK is missing. Progress goes to stderr only so
+                              stdout stays clean for JSON-RPC. On a TTY it also
+                              skips the consent prompt (consent already given).
+                              Accepts 1/true/yes/on (case-insensitive).
+  --yes / LOKI_ASSUME_YES=1   Auto-accept the dependency install. --yes is a
+                              launcher flag (equivalent to LOKI_ASSUME_YES=1); it
+                              is consumed here and never forwarded to the server.
+                              LOKI_ASSUME_YES / LOKI_AUTO_CONFIRM accept
+                              1/true/yes/on (case-insensitive).
-Behavior in non-interactive / CI shells: never installs. Prints the manual
+Argument handling: launcher flags (--help, --yes) are consumed here; every other
+argument is forwarded verbatim to the server, which accepts --transport/--port.
+A bare `--` ends launcher parsing so anything after it reaches the server as-is.
+Behavior in non-interactive / CI shells: never installs UNLESS
+LOKI_MCP_AUTO_BOOTSTRAP is set (1/true/yes/on). Without it, prints the manual
 install command to stderr and exits 2.
 EOF
 }
 # mcp_launch_main: dispatcher invoked by cmd_mcp() (autonomy/loki) or directly.
 mcp_launch_main() {
-    # Parse only flags we own; everything else is forwarded to the server.
+    # Split argv into launcher-owned flags (consumed here) and server argv
+    # (forwarded verbatim to the file-exec launch `python "$root/mcp/server.py"`).
+    # The server's argparse only accepts --transport/--port/--check-sdk;
+    # forwarding a launcher flag like --yes would make it abort with exit 2,
+    # so launcher flags MUST be stripped.
+    # A bare `--` ends launcher parsing: everything after it is forwarded as-is
+    # (escape hatch for any future server flag that collides with a launcher one).
     local arg
+    local _ml_server_argv=()
+    local _ml_after_sep=0
     for arg in "$@"; do
+        if [ "$_ml_after_sep" -eq 1 ]; then
+            _ml_server_argv+=("$arg")
+            continue
+        fi
         case "$arg" in
+            --)
+                _ml_after_sep=1
+                ;;
             --help|-h|help)
                 _ml_help
                 return 0
                 ;;
+            --yes)
+                # Launcher-owned: equivalent to LOKI_ASSUME_YES=1. Consumed here,
+                # never forwarded to the server.
+                LOKI_ASSUME_YES=1
+                ;;
+            *)
+                _ml_server_argv+=("$arg")
+                ;;
         esac
     done
+    # Replace the positional parameters with the filtered server argv so every
+    # downstream `exec ... "$@"` forwards only server-valid arguments. Safe
+    # empty-array expansion (bash 3.2 + set -u when no server args remain).
+    set -- ${_ml_server_argv[@]+"${_ml_server_argv[@]}"}
     local root
     root="$(_ml_repo_root)"
@@ -175,39 +251,72 @@ mcp_launch_main() {
     local venv="${LOKI_MCP_VENV:-$PWD/${LOKI_DIR:-.loki}/mcp-venv}"
     local venv_py="$venv/bin/python"
+    # Progress destination for the bootstrap. On an interactive TTY, progress goes
+    # to stdout (the user is watching a terminal). On the non-interactive
+    # auto-bootstrap path (LOKI_MCP_AUTO_BOOTSTRAP=1 over piped stdio), stdout is
+    # the JSON-RPC channel to the MCP client and MUST stay clean, so ALL progress
+    # (printfs AND the stdout of venv/pip) is routed to fd 2. Keyed on
+    # non-interactive, not on the flag: TTY+flag still prints to the terminal.
+    local out_fd=1
+    if _ml_non_interactive; then
+        out_fd=2
+    fi
     # 3. If the venv already has the SDK, use it directly. The server is launched
-    #    with PYTHONPATH=$root (NOT by cd-ing) so the user's cwd is preserved for
+    #    by FILE PATH ($root/mcp/server.py) rather than `-m mcp.server`, with
+    #    PYTHONPATH=$root (NOT by cd-ing) so the user's cwd is preserved for
     #    .loki resolution; see _ml_sdk_importable for why.
-    #    Known narrow residual: if the user's cwd itself contains a Python
-    #    package literally named mcp/ with a server submodule, python -m puts
-    #    the cwd ahead of PYTHONPATH and that package wins. Essentially never
-    #    true for real projects; documented rather than fought.
+    #    Running the file directly avoids the runpy RuntimeWarning that `-m`
+    #    emits (the local mcp/ package is imported during SDK-namespace setup
+    #    before runpy executes mcp.server). server.py uses only absolute imports
+    #    (e.g. `from mcp._sdk_loader import ...`), which resolve via PYTHONPATH=$root
+    #    under file execution. File-exec also removes the old narrow cwd-shadowing
+    #    residual: an explicit path can never be shadowed by a cwd `mcp/` package.
     if [ -x "$venv_py" ] && _ml_sdk_importable "$venv_py" "$root"; then
-        exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$venv_py" -m mcp.server "$@"
+        exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$venv_py" "$root/mcp/server.py" "$@"
     fi
     # 4. If the BASE python already has the SDK (e.g. user pip-installed it),
     #    use it -- no venv needed.
     if _ml_sdk_importable "$base_py" "$root"; then
-        exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$base_py" -m mcp.server "$@"
+        exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$base_py" "$root/mcp/server.py" "$@"
     fi
     # 5. SDK missing. Decide whether we may bootstrap.
-    if [ "${LOKI_NO_INSTALL_OFFER:-}" = "1" ]; then
+    #    Precedence: LOKI_NO_INSTALL_OFFER (explicit no) wins over
+    #    LOKI_MCP_AUTO_BOOTSTRAP (explicit yes).
+    if _ml_truthy "${LOKI_NO_INSTALL_OFFER:-}"; then
+        if _ml_truthy "${LOKI_MCP_AUTO_BOOTSTRAP:-}"; then
+            printf 'LOKI_NO_INSTALL_OFFER overrides LOKI_MCP_AUTO_BOOTSTRAP (explicit no beats explicit yes); not installing.\n' >&2
+        fi
         printf '%sMCP SDK not installed.%s\n' "$_ML_YELLOW" "$_ML_NC" >&2
         _ml_print_manual "$root" "$venv"
         return 2
     fi
+    # Track whether we reached the bootstrap via non-interactive written consent.
+    # When true, the consent prompt is skipped and all progress goes to fd 2.
+    local auto_consent=0
     if _ml_non_interactive; then
-        printf '%sMCP SDK not installed%s and this is a non-interactive shell, so Loki will not install it automatically.\n' "$_ML_YELLOW" "$_ML_NC" >&2
-        _ml_print_manual "$root" "$venv"
-        return 2
+        if _ml_truthy "${LOKI_MCP_AUTO_BOOTSTRAP:-}"; then
+            # Written consent: bootstrap non-interactively, progress to stderr
+            # only (stdout is the client's JSON-RPC channel). Fall through to the
+            # bootstrap below with auto-accept.
+            printf '%sMCP SDK not installed.%s LOKI_MCP_AUTO_BOOTSTRAP set: bootstrapping the project venv non-interactively (progress on stderr; stdout reserved for JSON-RPC).\n' "$_ML_YELLOW" "$_ML_NC" >&2
+            auto_consent=1
+        else
+            printf '%sMCP SDK not installed%s and this is a non-interactive shell, so Loki will not install it automatically. Set LOKI_MCP_AUTO_BOOTSTRAP=1 (also accepts true/yes) to authorize this for MCP clients.\n' "$_ML_YELLOW" "$_ML_NC" >&2
+            _ml_print_manual "$root" "$venv"
+            return 2
+        fi
     fi
-    # 6. Interactive TTY: offer the consent-gated bootstrap.
+    # 6. Offer the consent-gated bootstrap. Consent is already given when:
+    #    - we arrived via the non-interactive auto-bootstrap path (auto_consent), or
+    #    - LOKI_MCP_AUTO_BOOTSTRAP=1 is set on a TTY (explicit yes skips the prompt), or
+    #    - --yes / LOKI_ASSUME_YES / LOKI_AUTO_CONFIRM.
     local answer=""
-    if _ml_assume_yes; then
+    if [ "$auto_consent" -eq 1 ] || _ml_truthy "${LOKI_MCP_AUTO_BOOTSTRAP:-}" || _ml_assume_yes; then
         answer="y"
     else
         printf '\n'
@@ -239,8 +348,10 @@ mcp_launch_main() {
             _ml_print_manual "$root" "$venv"
             return 2
         fi
-        printf 'Creating virtualenv (%s) ...\n' "$venv"
-        if ! "$base_py" -m venv "$venv"; then
+        printf 'Creating virtualenv (%s) ...\n' "$venv" >&"$out_fd"
+        # Route venv's stdout to out_fd (stderr on the auto path) so the JSON-RPC
+        # channel stays clean; its stderr is left as-is for real diagnostics.
+        if ! "$base_py" -m venv "$venv" >&"$out_fd"; then
             printf '%sFailed to create virtualenv at %s.%s\n' "$_ML_RED" "$venv" "$_ML_NC" >&2
             _ml_print_manual "$root" "$venv"
             return 2
@@ -253,9 +364,11 @@ mcp_launch_main() {
         printf '%smcp/requirements.txt not found at %s.%s\n' "$_ML_RED" "$req" "$_ML_NC" >&2
         return 2
     fi
-    printf 'Installing MCP dependencies (%s/bin/pip install -r %s) ...\n' "$venv" "$req"
+    printf 'Installing MCP dependencies (%s/bin/pip install -r %s) ...\n' "$venv" "$req" >&"$out_fd"
     local code=0
-    "$venv/bin/pip" install -r "$req" || code=$?
+    # pip writes its progress to stdout; route it to out_fd (stderr on the auto
+    # path) so the JSON-RPC channel stays clean. pip's stderr is left as-is.
+    "$venv/bin/pip" install -r "$req" >&"$out_fd" || code=$?
     if [ "$code" -ne 0 ]; then
         printf '%sInstall failed (pip exited %s).%s You can retry manually:\n' "$_ML_RED" "$code" "$_ML_NC" >&2
         _ml_print_manual "$root" "$venv"
@@ -272,7 +385,7 @@ mcp_launch_main() {
         return 2
     fi
     printf "%sMCP dependencies ready. Launching server over stdio ...%s\n" "$_ML_BOLD" "$_ML_NC" >&2
-    exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$venv_py" -m mcp.server "$@"
+    exec env PYTHONPATH="$root${PYTHONPATH:+:$PYTHONPATH}" "$venv_py" "$root/mcp/server.py" "$@"
 }
 # Executed directly (tests, manual): run the dispatcher.

package/autonomy/run.sh CHANGED Viewed

@@ -1809,9 +1809,31 @@ get_provider_tier_param() {
     case "${PROVIDER_NAME:-claude}" in
         claude)
             case "$tier" in
-                planning) echo "${PROVIDER_MODEL_PLANNING:-opus}" ;;
+                planning)
+                    # Evidence-based routing (scoped): the official model-config
+                    # docs explicitly name "architecture decisions" and
+                    # "root-cause investigations" as where Fable 5's extra
+                    # investigation and self-verification pay off. So the
+                    # planning/architecture tier may opt in to Fable via
+                    # LOKI_FABLE_ARCHITECT=1. Default OFF because Fable is 2x
+                    # Opus per token; reserve it for the REASON/architecture
+                    # iterations the user explicitly wants. An explicit
+                    # PROVIDER_MODEL_PLANNING still wins (operator override).
+                    if [ -n "${PROVIDER_MODEL_PLANNING:-}" ]; then
+                        echo "${PROVIDER_MODEL_PLANNING}"
+                    elif [ "${LOKI_FABLE_ARCHITECT:-0}" = "1" ]; then
+                        echo "fable"
+                    else
+                        echo "opus"
+                    fi
+                    ;;
                 development) echo "${PROVIDER_MODEL_DEVELOPMENT:-opus}" ;;
                 fast) echo "${PROVIDER_MODEL_FAST:-sonnet}" ;;
+                # Honor the fable lever here too: without this arm an
+                # unsourced-claude.sh environment (this static fallback) would
+                # silently downgrade a fable-pinned tier to sonnet via the `*`
+                # default. Matches resolve_model_for_tier's explicit fable) arm.
+                fable) echo "fable" ;;
                 *) echo "sonnet" ;;
             esac
             ;;
@@ -3803,6 +3825,8 @@ _write_pricing_json() {
   "updated": "${updated}",
   "source": "static",
   "models": {
+    "fable":           {"input": 10.00, "output": 50.00, "label": "Fable 5 (top, 2x Opus)", "provider": "claude"},
+    "claude-fable-5":  {"input": 10.00, "output": 50.00, "label": "Fable 5 (top, 2x Opus)", "provider": "claude"},
     "opus":            {"input": 5.00,  "output": 25.00, "label": "Opus (latest)",   "provider": "claude"},
     "sonnet":          {"input": 3.00,  "output": 15.00, "label": "Sonnet (latest)", "provider": "claude"},
     "haiku":           {"input": 1.00,  "output": 5.00,  "label": "Haiku (latest)",  "provider": "claude"},
@@ -7648,6 +7672,21 @@ BUILD_PROMPT
             prompt_text=$(cat "$review_prompt_file")
             case "${PROVIDER_NAME:-claude}" in
                 claude)
+                    # SECURITY-REVIEW MODEL GUARD (evidence-based routing, item 4b):
+                    # Reviewers deliberately do NOT pass --model, so they run on
+                    # the account default model and are NEVER routed to Fable by a
+                    # mid-flight model override or LOKI_FABLE_ARCHITECT (those only
+                    # rewrite the iteration's tier_param, not this dispatch). This
+                    # must stay true. The official model-config docs CONTRADICT
+                    # routing security review to Fable: Fable's safety classifiers
+                    # refuse cybersecurity content, and in non-interactive (-p)
+                    # mode a flagged request ends the turn with stop_reason
+                    # "refusal" instead of a transparent Opus re-run. A refused
+                    # security reviewer would return no VERDICT and break the
+                    # unanimous-council gate. Defensive-cyber capability lives in
+                    # Mythos 5 (Project Glasswing), not Fable. If a future change
+                    # adds --model here, the security-sentinel reviewer must be
+                    # pinned to opus, never fable.
                     claude --dangerously-skip-permissions -p "$prompt_text" \
                         --output-format text > "$review_output" 2>/dev/null
                     ;;
@@ -9058,6 +9097,8 @@ check_budget_limit() {
 import json, glob
 total = 0.0
 pricing = {
+    'fable': {'input': 10.00, 'output': 50.00},
+    'claude-fable-5': {'input': 10.00, 'output': 50.00},
     'opus': {'input': 5.00, 'output': 25.00},
     'sonnet': {'input': 3.00, 'output': 15.00},
     'haiku': {'input': 1.00, 'output': 5.00},
@@ -12052,6 +12093,23 @@ run_autonomous() {
     _LOKI_RUN_START_SHA="$(cat "$_start_sha_file" 2>/dev/null || echo "")"
     export _LOKI_RUN_START_SHA
+    # Session-scope the mid-flight model override (model-honesty fix). The
+    # override file (.loki/state/model-override) is a LIVE-RUN control: the
+    # dashboard UI and docs state it "applies to the current run". A leftover
+    # file from a previous run must NOT silently pin every future `loki start`
+    # to that model (and to its cost). So clear it once at the start of a FRESH
+    # run (ITERATION_COUNT==0). A genuine resume (ITERATION_COUNT>0) and any
+    # mid-flight switch made at iteration>0 are preserved, because the clear is
+    # guarded on the fresh-run condition only.
+    if [ "${ITERATION_COUNT:-0}" -eq 0 ] && [ -f ".loki/state/model-override" ]; then
+        local _stale_override
+        _stale_override="$(cat .loki/state/model-override 2>/dev/null | tr -d '[:space:]')"
+        rm -f ".loki/state/model-override" 2>/dev/null || true
+        if [ -n "$_stale_override" ]; then
+            log_info "Cleared leftover model override ('$_stale_override') at session start; the override applies to the current run only."
+        fi
+    fi
     # Trust-metrics instrumentation marker: record one run_start event per
     # fresh run so the trust-metrics denominator counts ONLY instrumented runs.
     # This is what lets the aggregator distinguish "0 blocks measured" from
@@ -12270,14 +12328,60 @@ except Exception as exc:
             # helpers (which expect tier names) resolve correctly. Unknown
             # model strings are passed through as-is; provider loaders fall
             # back to a sane default.
-            case "${LOKI_SESSION_MODEL:-sonnet}" in
+            #
+            # Normalize case + surrounding whitespace BEFORE the match so
+            # 'OPUS' and ' opus ' resolve identically to 'opus'. We do NOT use
+            # loki_normalize_model_alias here: that helper is the narrow
+            # OVERRIDE-file allowlist (haiku|sonnet|opus|fable) and would strip
+            # the documented tier-name pins (planning|development|fast) to
+            # empty, collapsing them onto the default tier. The session pin
+            # legitimately accepts tier names (skills/model-selection.md), and
+            # the estimator + dashboard mirror this exact tier route, so the
+            # canonical session-pin rule is trim+lowercase WITHOUT the alias
+            # allowlist. Interior whitespace is preserved (so 'fab le' stays a
+            # junk value that falls through the '*' default arm), matching the
+            # estimator/dashboard ports.
+            local _session_pin="${LOKI_SESSION_MODEL:-sonnet}"
+            _session_pin="${_session_pin#"${_session_pin%%[![:space:]]*}"}"
+            _session_pin="${_session_pin%"${_session_pin##*[![:space:]]}"}"
+            _session_pin="$(printf '%s' "$_session_pin" | tr '[:upper:]' '[:lower:]')"
+            case "$_session_pin" in
                 opus)   CURRENT_TIER="planning" ;;
                 sonnet) CURRENT_TIER="development" ;;
                 haiku)  CURRENT_TIER="fast" ;;
-                planning|development|fast) CURRENT_TIER="${LOKI_SESSION_MODEL}" ;;
-                *)      CURRENT_TIER="${LOKI_SESSION_MODEL}" ;;
+                fable)  CURRENT_TIER="fable" ;;
+                planning|development|fast) CURRENT_TIER="$_session_pin" ;;
+                *)      CURRENT_TIER="$_session_pin" ;;
             esac
         fi
+        # Architect opt-in (LOKI_FABLE_ARCHITECT=1): route ONLY the first
+        # iteration (the architecture/REASON pass) to Fable, then fall back to
+        # the session tier for all later iterations. This is the honest
+        # implementation of "fable for architecture only": run.sh is the only
+        # scope that has ITERATION_COUNT, so the decision lives here (not in the
+        # stateless provider resolver). An EXPLICIT planning-model override still
+        # wins, and the LOKI_MAX_TIER ceiling clamps fable down via the resolver.
+        # Default OFF (Fable is 2x Opus). Without this scoping, a session pinned
+        # to opus would route EVERY iteration to fable.
+        #
+        # NOTE on the index: ITERATION_COUNT is incremented at the TOP of the
+        # loop (see "((ITERATION_COUNT++))" above), so the FIRST in-loop pass
+        # has ITERATION_COUNT==1, not 0. The guard matches 1 so the architecture
+        # iteration actually fires (a -eq 0 guard here would be a silent no-op,
+        # the exact bug this fix removes). The estimator models this same first
+        # iteration as its 0-indexed range() i==0, so quote and run agree.
+        #
+        # PRECEDENCE: a mid-flight model override (.loki/state/model-override,
+        # applied later in this iteration body) WINS over this architect pin.
+        # Deliberate: a live user action in the dashboard outranks an env
+        # opt-in set at launch. The override is still clamped by LOKI_MAX_TIER.
+        if [ "${ITERATION_COUNT:-0}" -eq 1 ] \
+           && [ "${LOKI_FABLE_ARCHITECT:-0}" = "1" ] \
+           && [ -z "${LOKI_CLAUDE_MODEL_PLANNING:-}" ] \
+           && [ -z "${LOKI_MODEL_PLANNING:-}" ]; then
+            CURRENT_TIER="fable"
+            log_info "LOKI_FABLE_ARCHITECT=1: routing the first (architecture) iteration to fable; later iterations use the session tier"
+        fi
         # Export LOKI_CURRENT_TIER so provider helper functions
         # can resolve the correct model.
         # Without this, LOKI_CURRENT_TIER is always empty and defaults to "planning".
@@ -12285,6 +12389,66 @@ except Exception as exc:
         export LOKI_CURRENT_TIER
         local rarv_phase=$(get_rarv_phase_name "$ITERATION_COUNT")
         local tier_param=$(get_provider_tier_param "$CURRENT_TIER")
+        # Mid-flight model override: the dashboard (POST /api/session/model) or a
+        # CLI user may rewrite .loki/state/model-override between iterations to
+        # change the model a live run uses. Read it here, after tier_param is
+        # resolved and before the claude argv is built (--model "$tier_param" is
+        # assembled below), so the override flows through effort/budget/fallback
+        # with no other change. Each iteration spawns a fresh `claude -p`, so the
+        # switch takes effect at THIS iteration boundary and never mid-invocation
+        # (claude -p fixes the model per call). Clearing/emptying the file reverts
+        # to the tier mapping. The file's content becomes the --model argument, so
+        # only an allowlisted alias is honored; any other non-empty content is
+        # ignored with a warning.
+        # The override applies ONLY to the claude provider; other providers map
+        # tier_param to effort/model strings and have no fable equivalent.
+        if [ "${PROVIDER_NAME:-claude}" = "claude" ] && [ -s ".loki/state/model-override" ]; then
+            local _loki_override_file _loki_override_alias
+            _loki_override_file="$(cat .loki/state/model-override 2>/dev/null)"
+            # Canonical normalization shared with the dashboard + estimator
+            # (trim + lowercase + exact allowlist). "fab le" and other non-exact
+            # values normalize to empty and are rejected, so all three readers
+            # agree on what the file means. Falls back to a local case only if
+            # the provider helper is somehow not in scope.
+            if type loki_normalize_model_alias >/dev/null 2>&1; then
+                _loki_override_alias="$(loki_normalize_model_alias "$_loki_override_file")"
+            else
+                # Fallback only if the provider helper is not sourced. Mirror the
+                # canonical rule EXACTLY: trim ends + lowercase + exact allowlist,
+                # so interior whitespace ("fab le") is REJECTED here too (do NOT
+                # use `tr -d [:space:]`, which would collapse it into a false
+                # accept and re-introduce the normalization divergence).
+                _loki_override_alias=""
+                local _loki_ov_trim="$_loki_override_file"
+                _loki_ov_trim="${_loki_ov_trim#"${_loki_ov_trim%%[![:space:]]*}"}"
+                _loki_ov_trim="${_loki_ov_trim%"${_loki_ov_trim##*[![:space:]]}"}"
+                _loki_ov_trim="$(printf '%s' "$_loki_ov_trim" | tr '[:upper:]' '[:lower:]')"
+                case "$_loki_ov_trim" in
+                    haiku|sonnet|opus|fable) _loki_override_alias="$_loki_ov_trim" ;;
+                esac
+            fi
+            if [ -n "$_loki_override_alias" ]; then
+                # Apply the SAME LOKI_MAX_TIER ceiling the tier resolver uses, so
+                # a mid-flight override cannot silently bypass the operator's cost
+                # cap. Clamp via the shared helper when available.
+                local _loki_override_effective="$_loki_override_alias"
+                if type loki_apply_max_tier_clamp >/dev/null 2>&1; then
+                    _loki_override_effective="$(loki_apply_max_tier_clamp "$_loki_override_alias" "$_loki_override_alias")"
+                fi
+                if [ "$_loki_override_effective" != "$_loki_override_alias" ]; then
+                    tier_param="$_loki_override_effective"
+                    log_warn "model override '$_loki_override_alias' exceeds LOKI_MAX_TIER=${LOKI_MAX_TIER}; clamped to $tier_param (applies this iteration)"
+                    echo "=== Model override: $_loki_override_alias clamped to $tier_param by LOKI_MAX_TIER=${LOKI_MAX_TIER} (applies this iteration $ITERATION_COUNT) ===" | tee -a "$log_file" "$agent_log"
+                else
+                    tier_param="$_loki_override_effective"
+                    log_info "model override: $tier_param (applies this iteration)"
+                    echo "=== Model override: $tier_param (applies this iteration $ITERATION_COUNT) ===" | tee -a "$log_file" "$agent_log"
+                fi
+            elif [ -z "$(printf '%s' "$_loki_override_file" | tr -d '[:space:]')" ]; then
+                : # empty file means no override; fall back to tier mapping
+            else
+                log_warn "Ignoring invalid model override '$_loki_override_file' (allowed: haiku, sonnet, opus, fable); using tier $tier_param"
+            fi
+        fi
         echo "=== RARV Phase: $rarv_phase, Tier: $CURRENT_TIER ($tier_param) ===" | tee -a "$log_file" "$agent_log"
         log_info "RARV Phase: $rarv_phase -> Tier: $CURRENT_TIER ($tier_param)"

package/bin/loki CHANGED Viewed

@@ -65,6 +65,21 @@ elif [ "${BUN_FROM_SOURCE:-0}" = "1" ] || [ "${BUN_FROM_SOURCE:-}" = "true" ]; t
     fi
 elif [ -f "$REPO_ROOT/loki-ts/dist/loki.js" ]; then
     BUN_CLI="$REPO_ROOT/loki-ts/dist/loki.js"
+    # Stale-dist freshness guard. dist/loki.js is gitignored (loki-ts/.gitignore)
+    # and rebuilt by package.json's prepack and the release Docker build, so on
+    # released channels (npm/Docker/brew) src/cli.ts is absent and this guard is
+    # a no-op -- dist is always current there. On a DEV machine / worktree the
+    # gitignored dist can predate the current dispatcher: e.g. a new shim->Bun
+    # route (`report kpis`) added in src that the old dist bundle does not know,
+    # which would make the canonical form fail with "Unknown command" while a
+    # deprecated alias the old dist still knows silently works -- the exact
+    # deprecation inversion the report-kpis route exists to prevent. So when src
+    # exists AND is newer than dist (`-nt`, available on bash 3.2), prefer the src
+    # form so dev runs never execute a stale dispatcher. Released channels have no
+    # src, so they keep using dist unchanged.
+    if [ -f "$REPO_ROOT/loki-ts/src/cli.ts" ] && [ "$REPO_ROOT/loki-ts/src/cli.ts" -nt "$REPO_ROOT/loki-ts/dist/loki.js" ]; then
+        BUN_CLI="$REPO_ROOT/loki-ts/src/cli.ts"
+    fi
 elif [ -f "$REPO_ROOT/loki-ts/src/cli.ts" ]; then
     BUN_CLI="$REPO_ROOT/loki-ts/src/cli.ts"
 else
@@ -112,6 +127,62 @@ if ! command -v bun &>/dev/null; then
     exec "$BASH_CLI" "$@"
 fi
+# CLI consolidation (Phase A): `trust detail` is the grouped form of the
+# trust-metrics breakdown. The Bun `trust` handler only knows the trajectory
+# view (it rejects unknown args), and Phase A moves no handler logic, so the
+# `detail` subcommand lives only in bash (cmd_trust -> cmd_trust_metrics).
+# Force the bash route whenever `detail` appears as a trust arg (flag-anywhere:
+# `trust detail`, `trust --json detail`, `trust detail --json` all resolve
+# identically to the bash `trust-metrics` breakdown). Without this, only the
+# exact `trust detail` order routed to bash and `trust --json detail` hit the
+# Bun handler, which rejected `detail` to stderr while bash rejects to stdout --
+# divergent error channels for the same malformed input. Bare `trust` /
+# `trust --json` (no `detail`) stay on the Bun-native trajectory path above.
+if [ "${1:-}" = "trust" ]; then  # only inspect the remaining args when the command word is `trust`
+    for _trust_arg in "${@:2}"; do  # every argument after the command word, in order
+        if [ "$_trust_arg" = "detail" ]; then  # exact string match; position among the args does not matter
+            exec "$BASH_CLI" "$@"  # hand the unmodified argv to the bash CLI; exec replaces this process on success
+        fi
+    done
+fi
+# CLI consolidation (Phase B): `report kpis` is the canonical form of the
+# Bun-only KPI snapshot. The `report` noun is otherwise bash-owned (every other
+# subcommand -- session/metrics/cost/export/share/dogfood -- routes to bash
+# cmd_report), so it is NOT in the Bun allowlist below. But kpis has no bash
+# implementation (it reuses the canonical cost arithmetic in runner/budget.ts),
+# so the canonical `report kpis` must reach the Bun handler -- otherwise the
+# canonical form would print the honest "requires Bun" message on a Bun machine
+# while the deprecated `kpis` alias actually worked, inverting the deprecation.
+# Route `report kpis` to Bun when `kpis` is the report SUBCOMMAND, i.e. the FIRST
+# non-flag token after `report`. This satisfies `report kpis`, `report kpis
+# --json`, and `report --json kpis` (the flag-anywhere orderings the trust-detail
+# precedent established), while NOT hijacking `kpis` when it appears as a
+# positional VALUE of a different report subcommand. `report export json kpis`
+# (kpis = the export output filename) must keep working exactly as on main
+# (v7.31.0): exit 0, file `kpis` created. So we scan past leading flags, take the
+# first real token, and only route to Bun if it is literally `kpis`. Fire the
+# same cli_command telemetry the Bun case-arm below fires (command=report), so a
+# Bun-routed `report kpis` is not invisible to usage analytics (the v7.8.2 parity
+# the case-arm comment documents). Backgrounded, FD-detached, opt-out honored by
+# loki_telemetry itself.
+if [ "${1:-}" = "report" ]; then  # only inspect the remaining args when the command word is `report`
+    _report_first_sub=""  # stays empty when every argument after `report` starts with `-`
+    for _report_arg in "${@:2}"; do
+        case "$_report_arg" in
+            -*) continue ;;  # anything starting with `-` is treated as a flag and skipped
+            *) _report_first_sub="$_report_arg"; break ;;  # first non-flag token is the subcommand; stop scanning
+        esac
+    done
+    if [ "$_report_first_sub" = "kpis" ]; then  # later `kpis` tokens (e.g. a positional value) never reach this branch
+        if command -v curl &>/dev/null && [ -f "$REPO_ROOT/autonomy/telemetry.sh" ]; then  # telemetry is attempted only when curl and the helper script both exist
+            ( SCRIPT_DIR="$REPO_ROOT/autonomy"; source "$SCRIPT_DIR/telemetry.sh" 2>/dev/null && loki_telemetry "cli_command" "command=${1:-}" 2>/dev/null ) >/dev/null 2>&1 </dev/null &  # subshell keeps SCRIPT_DIR and sourced names out of this shell; stdin/stdout/stderr detached; runs in the background
+            disown 2>/dev/null || true  # `|| true` forces a zero status so a failed disown cannot abort the script if errexit is on
+        fi
+        exec bun "$BUN_CLI" "$@"  # replace this process with the Bun CLI, argv unchanged
+    fi
+fi
 # Commands ported in Phase 2 -- route to Bun. Everything else goes to bash.
 # Two-token routes (provider show/list, memory list/index) match on the first
 # token only; the Bun dispatcher handles subcommand routing internally.

package/dashboard/__init__.py CHANGED Viewed

@@ -7,7 +7,7 @@ Modules:
     control: Session control API (start/stop/pause/resume)
 """
-__version__ = "7.30.0"
+__version__ = "7.32.0"
 # Expose the control app for easy import
 try: