RubyGems - octo-agent - Versions diffs - 0.11.2 - Mend

octo-agent 0.11.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (319) hide show

checksums.yaml +7 -0
data/.clacky/skills/commit/SKILL.md +423 -0
data/.clacky/skills/gem-release/SKILL.md +199 -0
data/.clacky/skills/gem-release/scripts/release.sh +304 -0
data/.clacky/skills/oss-upload/SKILL.md +47 -0
data/.octorules +106 -0
data/.rspec +3 -0
data/.rubocop.yml +8 -0
data/CHANGELOG.md +76 -0
data/CODE_OF_CONDUCT.md +132 -0
data/CONTRIBUTING.md +92 -0
data/Dockerfile +28 -0
data/LICENSE.txt +22 -0
data/POSITIONING.md +46 -0
data/README.md +134 -0
data/README_CN.md +134 -0
data/Rakefile +34 -0
data/benchmark/fixtures/sample_project/Gemfile +3 -0
data/benchmark/fixtures/sample_project/lib/api_handler.rb +32 -0
data/benchmark/fixtures/sample_project/lib/order_calculator.rb +23 -0
data/benchmark/fixtures/sample_project/lib/user_renderer.rb +20 -0
data/benchmark/fixtures/sample_project/spec/order_calculator_spec.rb +20 -0
data/benchmark/results/EVALUATION_REPORT.md +165 -0
data/benchmark/results/baseline_20260511_174424.json +128 -0
data/benchmark/results/report_20260511_175256.json +271 -0
data/benchmark/results/report_20260511_175444.json +271 -0
data/benchmark/results/treatment_20260511_175103.json +130 -0
data/benchmark/runner.rb +441 -0
data/bin/octo +7 -0
data/docs/agent-first-ui-design.md +77 -0
data/docs/billing-system.md +318 -0
data/docs/channel-architecture.md +235 -0
data/docs/engineering-article.md +343 -0
data/docs/session-skill-invocation.md +69 -0
data/docs/time_machine_design.md +247 -0
data/docs/ui2-architecture.md +124 -0
data/homebrew/README.md +96 -0
data/homebrew/openocto.rb +24 -0
data/lib/octo/agent/hook_manager.rb +61 -0
data/lib/octo/agent/llm_caller.rb +800 -0
data/lib/octo/agent/memory_updater.rb +246 -0
data/lib/octo/agent/message_compressor.rb +225 -0
data/lib/octo/agent/message_compressor_helper.rb +869 -0
data/lib/octo/agent/next_message_suggester.rb +215 -0
data/lib/octo/agent/session_serializer.rb +685 -0
data/lib/octo/agent/skill_auto_creator.rb +114 -0
data/lib/octo/agent/skill_evolution.rb +61 -0
data/lib/octo/agent/skill_manager.rb +466 -0
data/lib/octo/agent/skill_reflector.rb +89 -0
data/lib/octo/agent/system_prompt_builder.rb +101 -0
data/lib/octo/agent/time_machine.rb +214 -0
data/lib/octo/agent/tool_executor.rb +454 -0
data/lib/octo/agent/tool_registry.rb +150 -0
data/lib/octo/agent.rb +2180 -0
data/lib/octo/agent_config.rb +989 -0
data/lib/octo/agent_profile.rb +112 -0
data/lib/octo/anthropic_stream_aggregator.rb +137 -0
data/lib/octo/background_task_registry.rb +324 -0
data/lib/octo/banner.rb +34 -0
data/lib/octo/bedrock_stream_aggregator.rb +137 -0
data/lib/octo/block_font.rb +331 -0
data/lib/octo/cli.rb +968 -0
data/lib/octo/client.rb +623 -0
data/lib/octo/default_agents/SOUL.md +3 -0
data/lib/octo/default_agents/USER.md +1 -0
data/lib/octo/default_agents/base_prompt.md +66 -0
data/lib/octo/default_agents/coding/profile.yml +2 -0
data/lib/octo/default_agents/coding/system_prompt.md +67 -0
data/lib/octo/default_agents/general/profile.yml +2 -0
data/lib/octo/default_agents/general/system_prompt.md +16 -0
data/lib/octo/default_parsers/doc_parser.rb +69 -0
data/lib/octo/default_parsers/docx_parser.rb +188 -0
data/lib/octo/default_parsers/pdf_parser.rb +120 -0
data/lib/octo/default_parsers/pdf_parser_ocr.py +103 -0
data/lib/octo/default_parsers/pdf_parser_plumber.py +62 -0
data/lib/octo/default_parsers/pptx_parser.rb +140 -0
data/lib/octo/default_parsers/xlsx_parser.rb +121 -0
data/lib/octo/default_skills/browser-setup/SKILL.md +426 -0
data/lib/octo/default_skills/channel-manager/SKILL.md +623 -0
data/lib/octo/default_skills/channel-manager/dingtalk_setup.rb +191 -0
data/lib/octo/default_skills/channel-manager/discord_setup.rb +199 -0
data/lib/octo/default_skills/channel-manager/feishu_setup.rb +574 -0
data/lib/octo/default_skills/channel-manager/import_lark_skills.rb +97 -0
data/lib/octo/default_skills/channel-manager/install_feishu_skills.rb +105 -0
data/lib/octo/default_skills/channel-manager/weixin_setup.rb +274 -0
data/lib/octo/default_skills/code-explorer/SKILL.md +36 -0
data/lib/octo/default_skills/cron-task-creator/SKILL.md +257 -0
data/lib/octo/default_skills/cron-task-creator/evals/evals.json +38 -0
data/lib/octo/default_skills/onboard/SKILL.md +578 -0
data/lib/octo/default_skills/onboard/scripts/import_external_skills.rb +413 -0
data/lib/octo/default_skills/onboard/scripts/install_builtin_skills.rb +97 -0
data/lib/octo/default_skills/persist-memory/SKILL.md +59 -0
data/lib/octo/default_skills/personal-website/SKILL.md +113 -0
data/lib/octo/default_skills/personal-website/publish.rb +235 -0
data/lib/octo/default_skills/product-help/SKILL.md +123 -0
data/lib/octo/default_skills/product-help/docs/agent-config.md +74 -0
data/lib/octo/default_skills/product-help/docs/best-practices.md +49 -0
data/lib/octo/default_skills/product-help/docs/browser-tool.md +53 -0
data/lib/octo/default_skills/product-help/docs/built-in-skills.md +43 -0
data/lib/octo/default_skills/product-help/docs/cli-reference.md +82 -0
data/lib/octo/default_skills/product-help/docs/create-your-first-skill.md +47 -0
data/lib/octo/default_skills/product-help/docs/faq.md +98 -0
data/lib/octo/default_skills/product-help/docs/how-to-use-a-skill.md +58 -0
data/lib/octo/default_skills/product-help/docs/installation.md +59 -0
data/lib/octo/default_skills/product-help/docs/memory-system.md +61 -0
data/lib/octo/default_skills/product-help/docs/octorules.md +62 -0
data/lib/octo/default_skills/product-help/docs/session-management.md +63 -0
data/lib/octo/default_skills/product-help/docs/skill-basics.md +55 -0
data/lib/octo/default_skills/product-help/docs/skill-frontmatter.md +61 -0
data/lib/octo/default_skills/product-help/docs/web-server.md +49 -0
data/lib/octo/default_skills/product-help/docs/what-is-octo.md +37 -0
data/lib/octo/default_skills/product-help/docs/windows-installation.md +36 -0
data/lib/octo/default_skills/product-help/docs/writing-tips.md +53 -0
data/lib/octo/default_skills/recall-memory/SKILL.md +65 -0
data/lib/octo/default_skills/skill-add/SKILL.md +59 -0
data/lib/octo/default_skills/skill-add/scripts/install_from_zip.rb +295 -0
data/lib/octo/default_skills/skill-creator/SKILL.md +602 -0
data/lib/octo/default_skills/skill-creator/agents/analyzer.md +274 -0
data/lib/octo/default_skills/skill-creator/agents/comparator.md +202 -0
data/lib/octo/default_skills/skill-creator/agents/grader.md +223 -0
data/lib/octo/default_skills/skill-creator/eval-viewer/generate_review.py +471 -0
data/lib/octo/default_skills/skill-creator/eval-viewer/viewer.html +1325 -0
data/lib/octo/default_skills/skill-creator/references/schemas.md +430 -0
data/lib/octo/default_skills/skill-creator/scripts/__init__.py +0 -0
data/lib/octo/default_skills/skill-creator/scripts/aggregate_benchmark.py +401 -0
data/lib/octo/default_skills/skill-creator/scripts/generate_report.py +326 -0
data/lib/octo/default_skills/skill-creator/scripts/improve_description.py +310 -0
data/lib/octo/default_skills/skill-creator/scripts/quick_validate.py +103 -0
data/lib/octo/default_skills/skill-creator/scripts/run_eval.py +317 -0
data/lib/octo/default_skills/skill-creator/scripts/run_loop.py +331 -0
data/lib/octo/default_skills/skill-creator/scripts/utils.py +47 -0
data/lib/octo/default_skills/skill-creator/scripts/validate_skill_frontmatter.rb +143 -0
data/lib/octo/idle_compression_timer.rb +115 -0
data/lib/octo/json_ui_controller.rb +204 -0
data/lib/octo/message_format/anthropic.rb +409 -0
data/lib/octo/message_format/bedrock.rb +361 -0
data/lib/octo/message_format/open_ai.rb +222 -0
data/lib/octo/message_history.rb +373 -0
data/lib/octo/openai_stream_aggregator.rb +130 -0
data/lib/octo/plain_ui_controller.rb +166 -0
data/lib/octo/providers.rb +534 -0
data/lib/octo/server/browser_manager.rb +397 -0
data/lib/octo/server/channel/adapters/base.rb +82 -0
data/lib/octo/server/channel/adapters/dingtalk/adapter.rb +314 -0
data/lib/octo/server/channel/adapters/dingtalk/api_client.rb +391 -0
data/lib/octo/server/channel/adapters/dingtalk/stream_client.rb +203 -0
data/lib/octo/server/channel/adapters/discord/adapter.rb +229 -0
data/lib/octo/server/channel/adapters/discord/api_client.rb +107 -0
data/lib/octo/server/channel/adapters/discord/gateway_client.rb +270 -0
data/lib/octo/server/channel/adapters/feishu/adapter.rb +320 -0
data/lib/octo/server/channel/adapters/feishu/bot.rb +478 -0
data/lib/octo/server/channel/adapters/feishu/file_processor.rb +36 -0
data/lib/octo/server/channel/adapters/feishu/message_parser.rb +129 -0
data/lib/octo/server/channel/adapters/feishu/ws_client.rb +423 -0
data/lib/octo/server/channel/adapters/telegram/adapter.rb +375 -0
data/lib/octo/server/channel/adapters/telegram/api_client.rb +205 -0
data/lib/octo/server/channel/adapters/wecom/adapter.rb +148 -0
data/lib/octo/server/channel/adapters/wecom/media_downloader.rb +115 -0
data/lib/octo/server/channel/adapters/wecom/ws_client.rb +395 -0
data/lib/octo/server/channel/adapters/weixin/adapter.rb +692 -0
data/lib/octo/server/channel/adapters/weixin/api_client.rb +402 -0
data/lib/octo/server/channel/channel_config.rb +178 -0
data/lib/octo/server/channel/channel_manager.rb +468 -0
data/lib/octo/server/channel/channel_ui_controller.rb +224 -0
data/lib/octo/server/channel.rb +33 -0
data/lib/octo/server/discover.rb +77 -0
data/lib/octo/server/epipe_safe_io.rb +105 -0
data/lib/octo/server/http_server.rb +3554 -0
data/lib/octo/server/scheduler.rb +317 -0
data/lib/octo/server/server_master.rb +325 -0
data/lib/octo/server/session_registry.rb +431 -0
data/lib/octo/server/web_ui_controller.rb +487 -0
data/lib/octo/session_manager.rb +385 -0
data/lib/octo/skill.rb +466 -0
data/lib/octo/skill_loader.rb +328 -0
data/lib/octo/tools/base.rb +118 -0
data/lib/octo/tools/browser.rb +625 -0
data/lib/octo/tools/edit.rb +165 -0
data/lib/octo/tools/file_reader.rb +549 -0
data/lib/octo/tools/glob.rb +162 -0
data/lib/octo/tools/grep.rb +356 -0
data/lib/octo/tools/invoke_skill.rb +96 -0
data/lib/octo/tools/list_tasks.rb +54 -0
data/lib/octo/tools/redo_task.rb +41 -0
data/lib/octo/tools/request_user_feedback.rb +84 -0
data/lib/octo/tools/security.rb +333 -0
data/lib/octo/tools/terminal/output_cleaner.rb +63 -0
data/lib/octo/tools/terminal/persistent_session.rb +268 -0
data/lib/octo/tools/terminal/safe_rm.sh +106 -0
data/lib/octo/tools/terminal/session_manager.rb +213 -0
data/lib/octo/tools/terminal.rb +1828 -0
data/lib/octo/tools/todo_manager.rb +374 -0
data/lib/octo/tools/trash_manager.rb +388 -0
data/lib/octo/tools/undo_task.rb +35 -0
data/lib/octo/tools/web_fetch.rb +242 -0
data/lib/octo/tools/web_search.rb +260 -0
data/lib/octo/tools/write.rb +77 -0
data/lib/octo/ui2/block_font.rb +10 -0
data/lib/octo/ui2/components/base_component.rb +163 -0
data/lib/octo/ui2/components/command_suggestions.rb +290 -0
data/lib/octo/ui2/components/common_component.rb +96 -0
data/lib/octo/ui2/components/inline_input.rb +226 -0
data/lib/octo/ui2/components/input_area.rb +1338 -0
data/lib/octo/ui2/components/message_component.rb +99 -0
data/lib/octo/ui2/components/modal_component.rb +419 -0
data/lib/octo/ui2/components/todo_area.rb +149 -0
data/lib/octo/ui2/components/tool_component.rb +107 -0
data/lib/octo/ui2/components/welcome_banner.rb +139 -0
data/lib/octo/ui2/layout_manager.rb +807 -0
data/lib/octo/ui2/line_editor.rb +363 -0
data/lib/octo/ui2/markdown_renderer.rb +100 -0
data/lib/octo/ui2/output_buffer.rb +370 -0
data/lib/octo/ui2/progress_handle.rb +362 -0
data/lib/octo/ui2/progress_indicator.rb +55 -0
data/lib/octo/ui2/screen_buffer.rb +273 -0
data/lib/octo/ui2/terminal_detector.rb +119 -0
data/lib/octo/ui2/theme_manager.rb +85 -0
data/lib/octo/ui2/themes/base_theme.rb +105 -0
data/lib/octo/ui2/themes/hacker_theme.rb +62 -0
data/lib/octo/ui2/themes/minimal_theme.rb +56 -0
data/lib/octo/ui2/thinking_verbs.rb +26 -0
data/lib/octo/ui2/ui_controller.rb +1625 -0
data/lib/octo/ui2/view_renderer.rb +177 -0
data/lib/octo/ui2.rb +40 -0
data/lib/octo/ui_interface.rb +154 -0
data/lib/octo/utils/arguments_parser.rb +191 -0
data/lib/octo/utils/browser_detector.rb +195 -0
data/lib/octo/utils/encoding.rb +92 -0
data/lib/octo/utils/environment_detector.rb +140 -0
data/lib/octo/utils/file_ignore_helper.rb +170 -0
data/lib/octo/utils/file_processor.rb +601 -0
data/lib/octo/utils/gitignore_parser.rb +154 -0
data/lib/octo/utils/limit_stack.rb +152 -0
data/lib/octo/utils/logger.rb +124 -0
data/lib/octo/utils/login_shell.rb +72 -0
data/lib/octo/utils/model_pricing.rb +646 -0
data/lib/octo/utils/parser_manager.rb +165 -0
data/lib/octo/utils/path_helper.rb +15 -0
data/lib/octo/utils/scripts_manager.rb +59 -0
data/lib/octo/utils/string_matcher.rb +158 -0
data/lib/octo/utils/trash_directory.rb +112 -0
data/lib/octo/utils/workspace_rules.rb +46 -0
data/lib/octo/version.rb +5 -0
data/lib/octo/web/app.css +7141 -0
data/lib/octo/web/app.js +543 -0
data/lib/octo/web/apple-touch-icon.png +0 -0
data/lib/octo/web/auth.js +150 -0
data/lib/octo/web/channels.js +276 -0
data/lib/octo/web/datepicker.js +205 -0
data/lib/octo/web/favicon.png +0 -0
data/lib/octo/web/i18n.js +1073 -0
data/lib/octo/web/icon-512.png +0 -0
data/lib/octo/web/icon-dark.svg +25 -0
data/lib/octo/web/icon.svg +29 -0
data/lib/octo/web/index.html +871 -0
data/lib/octo/web/marked.min.js +69 -0
data/lib/octo/web/onboard.js +491 -0
data/lib/octo/web/profile.js +442 -0
data/lib/octo/web/sessions.js +4421 -0
data/lib/octo/web/settings.js +913 -0
data/lib/octo/web/sidebar.js +32 -0
data/lib/octo/web/skills.js +885 -0
data/lib/octo/web/tasks.js +297 -0
data/lib/octo/web/theme.js +105 -0
data/lib/octo/web/trash.js +343 -0
data/lib/octo/web/vendor/hljs/highlight.min.js +1244 -0
data/lib/octo/web/vendor/hljs/hljs-theme.css +95 -0
data/lib/octo/web/vendor/katex/auto-render.min.js +1 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_AMS-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Caligraphic-Bold.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Caligraphic-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Fraktur-Bold.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Fraktur-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Main-Bold.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Main-BoldItalic.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Main-Italic.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Main-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Math-BoldItalic.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Math-Italic.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_SansSerif-Bold.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_SansSerif-Italic.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_SansSerif-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Script-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Size1-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Size2-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Size3-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Size4-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/fonts/KaTeX_Typewriter-Regular.woff2 +0 -0
data/lib/octo/web/vendor/katex/katex.min.css +1 -0
data/lib/octo/web/vendor/katex/katex.min.js +1 -0
data/lib/octo/web/version.js +449 -0
data/lib/octo/web/weixin-qr.html +209 -0
data/lib/octo/web/ws-dispatcher.js +357 -0
data/lib/octo/web/ws.js +128 -0
data/lib/octo.rb +145 -0
data/scripts/build/build.sh +329 -0
data/scripts/build/lib/apt.sh +56 -0
data/scripts/build/lib/brew.sh +89 -0
data/scripts/build/lib/colors.sh +17 -0
data/scripts/build/lib/gem.sh +95 -0
data/scripts/build/lib/mise.sh +125 -0
data/scripts/build/lib/network.sh +157 -0
data/scripts/build/lib/os.sh +57 -0
data/scripts/build/lib/shell.sh +37 -0
data/scripts/build/src/install.sh.cc +174 -0
data/scripts/build/src/install_browser.sh.cc +101 -0
data/scripts/build/src/install_full.sh.cc +290 -0
data/scripts/build/src/install_rails_deps.sh.cc +145 -0
data/scripts/build/src/install_system_deps.sh.cc +123 -0
data/scripts/build/src/uninstall.sh.cc +101 -0
data/scripts/install.ps1 +532 -0
data/scripts/install.sh +567 -0
data/scripts/install_browser.sh +479 -0
data/scripts/install_full.sh +838 -0
data/scripts/install_rails_deps.sh +746 -0
data/scripts/install_system_deps.sh +518 -0
data/scripts/uninstall.sh +287 -0
data/sig/octo.rbs +4 -0
metadata +614 -0

data/lib/octo/agent.rb ADDED Viewed

@@ -0,0 +1,2180 @@
+# frozen_string_literal: true
+require "securerandom"
+require "json"
+require "cgi"
+require "tty-prompt"
+require "set"
+require_relative "utils/arguments_parser"
+require_relative "utils/file_processor"
+require_relative "utils/environment_detector"
+# Load all agent modules
+require_relative "agent/message_compressor"
+require_relative "agent/message_compressor_helper"
+require_relative "agent/tool_executor"
+require_relative "agent/session_serializer"
+require_relative "agent/skill_manager"
+require_relative "agent/system_prompt_builder"
+require_relative "agent/llm_caller"
+require_relative "agent/time_machine"
+require_relative "agent/memory_updater"
+require_relative "agent/next_message_suggester"
+require_relative "agent/skill_evolution"
+require_relative "agent/skill_reflector"
+require_relative "agent/skill_auto_creator"
+require_relative "background_task_registry"
+module Octo
+  class Agent
+    # Include all functionality modules
+    include MessageCompressorHelper
+    include ToolExecutor
+    include SessionSerializer
+    include SkillManager
+    include SystemPromptBuilder
+    include LlmCaller
+    include TimeMachine
+    include MemoryUpdater
+    include NextMessageSuggester
+    include SkillEvolution
+    include SkillReflector
+    include SkillAutoCreator
+    attr_reader :session_id, :name, :history, :iterations, :working_dir, :created_at, :total_tasks, :todos,
+                :cache_stats, :ui, :skill_loader, :agent_profile,
+                :status, :error, :updated_at, :source,
+                :latest_latency,  # Hash of latency metrics from the most recent LLM call (see Client#send_messages_with_tools)
+                :reasoning_effort
+    attr_accessor :pinned
+    REASONING_EFFORTS = %w[low medium high].freeze
+    def permission_mode
+      @config&.permission_mode&.to_s || ""
+    end
+    def reasoning_effort=(value)
+      @reasoning_effort = normalize_reasoning_effort(value)
+    end
+    private def normalize_reasoning_effort(value)
+      return nil if value.nil?
+      str = value.to_s.strip.downcase
+      return nil if str.empty? || str == "off" || str == "none"
+      return str if REASONING_EFFORTS.include?(str)
+      nil
+    end
+    public
+    def initialize(client, config, working_dir:, ui:, profile:, session_id:, source:)
+      @client = client  # Client for current model
+      @config = config.is_a?(AgentConfig) ? config : AgentConfig.new(config)
+      @agent_profile = AgentProfile.load(profile)
+      @source = source.to_sym  # :manual | :cron | :channel
+      @tool_registry = ToolRegistry.new
+      @hooks = HookManager.new
+      @session_id = session_id
+      @name = ""
+      @pinned = false
+      @history = MessageHistory.new
+      @todos = []  # Store todos in memory
+      @iterations = 0
+      @cache_stats = {
+        cache_creation_input_tokens: 0,
+        cache_read_input_tokens: 0,
+        total_requests: 0,
+        cache_hit_requests: 0,
+        raw_api_usage_samples: []  # Store raw API usage for debugging
+      }
+      @start_time = nil
+      @working_dir = working_dir || Dir.pwd
+      @created_at = Time.now.iso8601
+      @total_tasks = 0
+      @previous_total_tokens = 0  # Track tokens from previous iteration for delta calculation
+      @latest_latency = nil  # Most recent LLM call's latency metrics (see Client#send_messages_with_tools)
+      @reasoning_effort = nil  # Per-session reasoning effort override; nil = provider default
+      @ui = ui  # UIController for direct UI interaction
+      @debug_logs = []  # Debug logs for troubleshooting
+      @pending_injections = []     # Pending inline skill injections to flush after observe()
+      @pending_script_tmpdirs = [] # Decrypted-script tmpdirs to shred when agent.run completes
+      @pending_error_rollback = false  # Deferred rollback flag set by restore_session on error
+      @in_run_loop = false         # True while agent.run() is active (set under @state_mutex)
+      # Unified inbox for events that should land in @history at the next
+      # iteration boundary inside the run loop. Items are typed:
+      #   {kind: :bg_notification, content:, bubble:, enqueued_at:}
+      #   {kind: :user_msg,        content:, files:, enqueued_at:}
+      # Drained chronologically by drain_inbox_into_history! (run loop top).
+      @inbox = []
+      @inbox_run_pending = false   # Set true after enqueue_user_message decides to spawn a run; cleared at run() entry. Dedupes concurrent spawns.
+      @state_mutex = Mutex.new     # Protects @in_run_loop, @inbox, @inbox_run_pending, @current_run_thread, @discard_threshold
+      @run_mutex = Mutex.new       # Serializes every Agent#run invocation regardless of caller
+      @checkpoint_index = 0        # Tracks how many messages have been persisted to incremental log
+      @on_checkpoint = nil         # Callback proc(messages) for incremental persistence
+      @current_run_thread = nil    # Thread currently inside run()'s body — set under @state_mutex; used by interrupt_current_run!
+      @discard_threshold = nil     # Time. Stale run attempts whose enqueue time predates this are dropped.
+      # Compression tracking
+      @compression_level = 0  # Tracks how many times we've compressed (for progressive summarization)
+      @compressed_summaries = []  # Store summaries from previous compressions for reference
+      # Message compressor for LLM-based intelligent compression
+      # Uses LLM to preserve key decisions, errors, and context while reducing token count
+      @message_compressor = MessageCompressor.new(@client, model: current_model)
+      # Skill loader for skill management
+      @skill_loader = SkillLoader.new(working_dir: @working_dir)
+      # Initialize Time Machine
+      init_time_machine
+      # Register built-in tools
+      register_builtin_tools
+      # Ensure user-space parsers are in place (~/.octo/parsers/)
+      Utils::ParserManager.setup!
+      # Ensure bundled shell scripts are in place (~/.octo/scripts/)
+      Utils::ScriptsManager.setup!
+    end
+    # Restore from a saved session
+    def self.from_session(client, config, session_data, ui: nil, profile:)
+      working_dir = session_data[:working_dir] || session_data["working_dir"] || Dir.pwd
+      original_id = session_data[:session_id] || session_data["session_id"] || Octo::SessionManager.generate_id
+      # Restore source from persisted data; fall back to :manual for legacy sessions
+      source = (session_data[:source] || session_data["source"] || "manual").to_sym
+      agent = new(client, config, working_dir: working_dir, ui: ui, profile: profile,
+                  session_id: original_id, source: source)
+      agent.restore_session(session_data)
+      agent
+    end
+    def add_hook(event, &block)
+      @hooks.add(event, &block)
+    end
+    # Register a callback that receives newly-added messages after each
+    # iteration checkpoint. Used by the server layer for incremental
+    # persistence (.jsonl crash-recovery logs).
+    def on_checkpoint(&block)
+      @on_checkpoint = block
+    end
+    # Reset the checkpoint cursor so the next checkpoint! captures
+    # everything added from this point forward.
+    def reset_checkpoint!
+      @checkpoint_index = @history.to_a.size
+    end
+    # Emit any messages added to @history since the last checkpoint
+    # through the registered @on_callback handler.
+    def checkpoint!
+      return unless @on_checkpoint
+      current = @history.to_a
+      new_msgs = current[@checkpoint_index..] || []
+      return if new_msgs.empty?
+      @on_checkpoint.call(new_msgs)
+      @checkpoint_index = current.size
+    end
+    # Switch this session to a different model, identified by its stable
+    # runtime id. Ids survive list reorders, additions, and field edits,
+    # which is why we no longer expose an index-based API.
+    # @param id [String] Model id (see AgentConfig#parse_models)
+    # @return [Boolean] true if switched successfully, false otherwise
+    def switch_model_by_id(id)
+      return false unless @config.switch_model_by_id(id)
+      rebuild_client_for_current_model!
+      true
+    end
+    # Rebuild the underlying Client (and dependent components) to pick up
+    # credentials/model name from the currently-selected model in @config.
+    private def rebuild_client_for_current_model!
+      @client = Octo::Client.new(
+        @config.api_key,
+        base_url: @config.base_url,
+        model: @config.model_name,
+        anthropic_format: @config.anthropic_format?
+      )
+      # Update message compressor with new client and model
+      @message_compressor = MessageCompressor.new(@client, model: current_model)
+      # Inject a new session context to notify the AI of the model switch
+      inject_session_context
+    end
+    # Change the working directory for this session
+    # Injects a new session context to notify the AI of the directory change
+    def change_working_dir(new_dir)
+      @working_dir = new_dir
+      inject_session_context
+      true
+    end
+    # Get list of available model names
+    def available_models
+      @config.model_names
+    end
+    # Get current model configuration info
+    def current_model_info
+      model = @config.current_model
+      return nil unless model
+      {
+        id: model["id"],
+        name: model["name"],
+        model: model["model"],
+        base_url: model["base_url"]
+      }
+    end
+    # Get current model name (respects any active fallback override)
+    private def current_model
+      @config.effective_model_name
+    end
+    # Rename this session. Called by auto-naming (first message) or user explicit rename.
+    def rename(new_name)
+      @name = new_name.to_s.strip
+    end
+    # Entry point for an agent turn. Two modes:
+    #
+    #   run("user typed this")  — user message mode
+    #   run                     — drain-only mode: nothing to append directly;
+    #                              the inbox drain at iteration top is expected
+    #                              to find something. If the inbox is also empty,
+    #                              the loop exits immediately (no wasted LLM call).
+    def run(user_input = nil, files: [], system_notification: nil, _bg_enqueued_at: nil)
+      # 救法 1: bg-notification runs carry their enqueue timestamp. If a user
+      # interrupt has bumped @discard_threshold past that timestamp, the
+      # notification's "ticket" is stale — drop it before we grab the heavy
+      # @run_mutex (which a real user message may be waiting behind us for).
+      if system_notification && _bg_enqueued_at
+        @state_mutex.synchronize do
+          return if @discard_threshold && _bg_enqueued_at < @discard_threshold
+        end
+      end
+      # Serialize every Agent#run invocation so concurrent callers cannot
+      # mutate @history, @iterations, etc. simultaneously.
+      @run_mutex.synchronize do
+        if system_notification && _bg_enqueued_at
+          @state_mutex.synchronize do
+            return if @discard_threshold && _bg_enqueued_at < @discard_threshold
+          end
+        end
+        @state_mutex.synchronize do
+          @in_run_loop = true
+          @current_run_thread = Thread.current
+          # We're entering run() — any concurrent caller that observed
+          # @inbox_run_pending == true and decided NOT to spawn can rely
+          # on this run absorbing their inbox items. Clear the flag.
+          @inbox_run_pending = false
+        end
+        # Drain-only mode: no direct input, and nothing queued either. Don't
+        # bother the LLM with an empty turn.
+        if user_input.nil? && system_notification.nil?
+          empty_inbox = @state_mutex.synchronize { @inbox.empty? }
+          if empty_inbox
+            @state_mutex.synchronize do
+              @in_run_loop = false
+              @current_run_thread = nil
+            end
+            Octo::Logger.info("agent.drain_only_run_empty_inbox", session_id: @session_id)
+            return
+          end
+        end
+      # Show the "thinking" indicator as early as possible so the user gets
+      # immediate feedback after sending a message. Without this the UI stays
+      # silent during synchronous setup work (system prompt assembly, file
+      # parsing, history compression checks) before the first LLM call. The
+      # subsequent `think` call will re-emit show_progress, which is an
+      # idempotent update on the same progress UI element.
+      @ui&.show_progress
+      # Start new task for Time Machine
+      task_id = start_new_task
+      @start_time = Time.now
+      @task_truncation_count = 0  # Reset truncation counter for each task
+      @task_timeout_hint_injected = false  # Reset read-timeout hint injection (see LlmCaller)
+      @task_upstream_truncation_hint_injected = false  # Reset upstream-truncation hint injection (see LlmCaller)
+      # Note: Do NOT reset @previous_total_tokens here - it should maintain the value from the last iteration
+      # across tasks to correctly calculate delta tokens in each iteration
+      @task_start_iterations = @iterations  # Track starting iterations for this task
+      # Track cache stats for current task
+      @task_cache_stats = {
+        cache_creation_input_tokens: 0,
+        cache_read_input_tokens: 0,
+        total_requests: 0,
+        cache_hit_requests: 0
+      }
+      # Deferred error rollback: if the previous session ended with an error,
+      # trim history back to just before that failed user message now — at the
+      # point the user actually sends a new message, not at restore time.
+      # (Trimming at restore time caused replay_history to return empty results.)
+      if @pending_error_rollback
+        @pending_error_rollback = false
+        last_user_index = @history.last_real_user_index
+        if last_user_index
+          @history.truncate_from(last_user_index)
+          @hooks.trigger(:session_rollback, {
+            reason: "Previous session ended with error — rolling back before new message",
+            rolled_back_message_index: last_user_index
+          })
+        end
+      end
+      # Add system prompt as the first message if this is the first run
+      if @history.empty?
+        system_prompt = build_system_prompt
+        @history.append({ role: "system", content: system_prompt })
+      end
+      # Inject session context (date + model) if not yet present or date has changed
+      inject_session_context_if_needed
+      # Inject chunk index card if archived chunks exist and index is stale
+      inject_chunk_index_if_needed
+      if system_notification
+        # System notification mode — triggered by background task completion.
+        # Skip all user input processing; inject the notification directly.
+        @history.append({
+          role: "user",
+          content: system_notification,
+          system_injected: true,
+          task_id: task_id,
+          created_at: Time.now.to_f
+        })
+      elsif user_input.nil? || user_input.empty?
+        # Drain-only mode: nothing to append now. The iteration drain at the
+        # top of the loop will pick up whatever's in @inbox (which is why we
+        # were started — see http_server's follow-up run spawn).
+      else
+        # Normal user message mode — files may or may not be attached.
+        processed = process_files_for_user_message(user_input, files)
+        append_processed_user_message_to_history!(processed, task_id)
+        # If the user typed a slash command targeting a skill with disable-model-invocation: true,
+        # inject the skill content as a synthetic assistant message so the LLM can act on it.
+        # Skills already in the system prompt (model_invocation_allowed?) are skipped.
+        inject_skill_command_as_assistant_message(user_input, task_id)
+      end
+      @hooks.trigger(:on_start, system_notification ? "[background task notification]" : user_input)
+      begin
+        # Track if request_user_feedback was called
+        awaiting_user_feedback = false
+        # Track if task was interrupted by user (denied tool execution)
+        task_interrupted = false
+        loop do
+          @iterations += 1
+          @hooks.trigger(:on_iteration, @iterations)
+          # Drain any inbox items (queued user messages) since the last
+          # iteration. Without this, items sit in the queue until the WHOLE
+          # run completes — latency drops from "minutes" to "one LLM turn".
+          drain_inbox_into_history!(task_id)
+          # Persist drained inbox messages immediately so they survive a
+          # crash during the upcoming think() call.
+          checkpoint!
+          # Think: LLM reasoning with tool support
+          response = think
+          @last_token_usage = response[:token_usage] if response && response[:token_usage]
+          # Debug: check for potential infinite loops
+          if @config.verbose
+            @ui&.log("Iteration #{@iterations}: finish_reason=#{response[:finish_reason]}, tool_calls=#{response[:tool_calls]&.size || 'nil'}", level: :debug)
+          end
+          # Skip if compression happened (response is nil)
+          if response.nil?
+            checkpoint!
+            next
+          end
+          # Checkpoint immediately after think() so the assistant message
+          # (and any tool_calls it contains) is persisted before we enter
+          # act(). If a crash happens between think() and the next
+          # iteration-boundary checkpoint, recovery can at least restore
+          # the model's intent.
+          checkpoint!
+          # [DIAG] Only log when finish_reason=="stop" AND tool_calls non-empty —
+          # the suspicious combo that indicates an upstream-truncated tool_use
+          # response. Normal responses produce no log line here to avoid noise.
+          begin
+            tool_calls = response[:tool_calls] || []
+            if response[:finish_reason] == "stop" && !tool_calls.empty?
+              tc_summary = tool_calls.map do |c|
+                args_str = c[:arguments].is_a?(String) ? c[:arguments] : c[:arguments].to_s
+                {
+                  name: c[:name].to_s,
+                  args_len: args_str.length,
+                  args_head: args_str[0, 120]
+                }
+              end
+              Octo::Logger.warn("agent.think_response",
+                session_id: @session_id,
+                iteration: @iterations,
+                finish_reason: response[:finish_reason].to_s,
+                tool_calls_count: tool_calls.size,
+                tool_calls: tc_summary,
+                content_len: response[:content].to_s.length,
+                completion_tokens: response.dig(:token_usage, :completion_tokens),
+                ttft_ms: response.dig(:latency, :ttft_ms),
+                suspicious_truncation: true
+              )
+            end
+          rescue StandardError => e
+            Octo::Logger.warn("agent.think_response.log_failed", error: e.message)
+          end
+          # Check if done (no more tool calls needed).
+          #
+          # Defensive rule: we ONLY exit on empty/missing tool_calls.
+          # We used to also short-circuit on finish_reason=="stop", but
+          # upstream routers (OpenRouter → Anthropic/Bedrock) can return the
+          # contradictory combo `finish_reason=="stop" + non-empty tool_calls
+          # with truncated args`, which caused the agent to silently treat a
+          # truncated response as "task complete". Truncation is now caught
+          # earlier by LlmCaller#detect_upstream_truncation! (which raises
+          # UpstreamTruncatedError → RetryableError); this branch stays as
+          # a belt-and-braces guard: if that detector ever misses a new
+          # truncation pattern, we still won't silently exit while the model
+          # is mid-tool_call.
+          if response[:tool_calls].nil? || response[:tool_calls].empty?
+            # [DIAG] Pin down exactly which sub-condition triggered the task exit.
+            Octo::Logger.info("agent.loop_break_normal",
+              session_id: @session_id,
+              iteration: @iterations,
+              branch: (response[:tool_calls].nil? ? "tool_calls_nil" : "tool_calls_empty"),
+              finish_reason: response[:finish_reason].to_s,
+              tool_calls_count: (response[:tool_calls] || []).size
+            )
+            if response[:content] && !response[:content].empty?
+              emit_assistant_message(response[:content], reasoning_content: response[:reasoning_content])
+            end
+            # Debug: log why we're stopping
+            if @config.verbose && (response[:tool_calls].nil? || response[:tool_calls].empty?)
+              reason = response[:finish_reason] == "stop" ? "API returned finish_reason=stop" : "No tool calls in response"
+              @ui&.log("Stopping: #{reason}", level: :debug)
+              if response[:content] && response[:content].is_a?(String)
+                preview = response[:content].length > 200 ? response[:content][0...200] + "..." : response[:content]
+                @ui&.log("Response content: #{preview}", level: :debug)
+              end
+            end
+            # A queued user message may have landed between this think() and
+            # now. Don't break — loop back so the next iteration's drain
+            # injects it and the LLM addresses it within the same warm-cache
+            # run. Saves the full-context replay of a fresh run().
+            if inbox_pending?
+              Octo::Logger.info("agent.loop_continue_for_pending_inbox",
+                session_id: @session_id,
+                iteration: @iterations
+              )
+              checkpoint!
+              next
+            end
+            checkpoint!
+            break
+          end
+          # Show assistant message if there's content before tool calls
+          if response[:content] && !response[:content].empty?
+            emit_assistant_message(response[:content], reasoning_content: response[:reasoning_content])
+          end
+          # Act: Execute tool calls
+          action_result = act(response[:tool_calls])
+          # Check if request_user_feedback was called
+          if action_result[:awaiting_feedback]
+            awaiting_user_feedback = true
+            observe(response, action_result[:tool_results])
+            flush_pending_injections
+            checkpoint!
+            break
+          end
+          # Observe: Add tool results to conversation context
+          observe(response, action_result[:tool_results])
+          # Flush any inline skill injections enqueued by invoke_skill during act().
+          # Must happen AFTER observe() so toolResult is appended before skill instructions,
+          # producing a legal message sequence for all API providers (especially Bedrock).
+          flush_pending_injections
+          # Check if user denied any tool
+          if action_result[:denied]
+            task_interrupted = true
+            # If user provided feedback, treat it as a user question/instruction
+            if action_result[:feedback] && !action_result[:feedback].empty?
+              # Add user feedback as a new user message with system_injected marker
+              @history.append({
+                role: "user",
+                content: "The user has a question/feedback for you: #{action_result[:feedback]}\n\nPlease respond to the user's question/feedback before continuing with any actions.",
+                system_injected: true
+              })
+              checkpoint!
+              # Continue loop to let agent respond to feedback
+              next
+            else
+              # User just said "no" without feedback - stop and wait
+              @ui&.show_assistant_message("Tool execution was denied. Please give more instructions...", files: [])
+              checkpoint!
+              break
+            end
+          end
+          # Normal iteration end — persist incremental checkpoint before
+          # the next loop iteration so crash recovery captures this turn.
+          checkpoint!
+        end
+      result = build_result
+      # Save snapshots of modified files for Time Machine
+      if @modified_files_in_task && !@modified_files_in_task.empty?
+        save_modified_files_snapshot(@modified_files_in_task)
+        @modified_files_in_task = []  # Reset for next task
+      end
+        # Run skill evolution hooks after main loop completes
+        # Skip if task was interrupted by user (denied tool) or awaiting user feedback
+        # Only for main agent (not subagents) to avoid recursive evolution
+        unless @is_subagent || task_interrupted || awaiting_user_feedback
+          run_skill_evolution_hooks
+        end
+        # Run long-term memory update as a forked subagent BEFORE we print
+        # show_complete. Running it as a subagent (rather than inline in
+        # the main loop) gives us correct visual ordering structurally:
+        # the subagent blocks until done, its progress spinner finishes,
+        # and only then [OK] Task Complete is printed. No cleanup dance,
+        # no cross-method progress handle holding.
+        # Skip on interrupt / feedback / subagent (self-guarded inside too).
+        unless @is_subagent || task_interrupted || awaiting_user_feedback
+          run_memory_update_subagent
+        end
+        if @is_subagent
+          # Parent agent (skill_manager) prints the completion summary; skip here.
+        else
+          @ui&.show_complete(
+            iterations: result[:iterations],
+            duration: result[:duration_seconds],
+            cache_stats: result[:cache_stats],
+            awaiting_user_feedback: awaiting_user_feedback
+          )
+          # Show token usage once at task completion (not on every iteration)
+          @ui&.show_token_usage(@last_token_usage) if @last_token_usage
+        end
+        # Fire async ghost-text prediction for the user's next message. Must
+        # run AFTER show_complete (so the UI is in its idle "awaiting input"
+        # state) and is fire-and-forget — the suggestion arrives later via
+        # the UI's own +show_next_message_suggestion+ event.
+        # Same guards as run_memory_update_subagent: skip if interrupted,
+        # awaiting feedback, or running as a subagent.
+        unless @is_subagent || task_interrupted || awaiting_user_feedback
+          run_next_message_suggestion!
+        end
+        @hooks.trigger(:on_complete, result)
+        result
+      rescue Octo::AgentInterrupted
+        # Let CLI handle the interrupt message
+        raise
+      rescue StandardError => e
+        # Log complete error information to debug_logs for troubleshooting
+        @debug_logs << {
+          timestamp: Time.now.iso8601,
+          event: "agent_run_error",
+          error_class: e.class.name,
+          error_message: e.message,
+          backtrace: e.backtrace&.first(30) # Keep first 30 lines of backtrace
+        }
+        Octo::Logger.error("agent_run_error", error: e)
+        # 400 errors mean our request was malformed — roll back history so the bad
+        # message is not replayed on the next user turn.
+        # Other errors (auth, network, etc.) leave history intact for retry.
+        @pending_error_rollback = true if e.is_a?(Octo::BadRequestError)
+        # Build error result for session data, but let CLI handle error display
+        result = build_result(:error, error: e.message)  # rubocop:disable Lint/UselessAssignment
+        raise
+      ensure
+        @state_mutex.synchronize do
+          @in_run_loop = false
+          @current_run_thread = nil
+        end
+        # Safety net: ensure any lingering progress spinner is stopped.
+        # Normal paths close their own spinners; this guards against exceptions
+        # raised between a progress slot's active/done pair.
+        @ui&.show_progress(phase: "done")
+        # Reap stale completed background tasks so the registry doesn't grow
+        # unboundedly across a long session.
+        begin
+          BackgroundTaskRegistry.prune_completed(max_age: 3_600, agent_session_id: @session_id)
+        rescue => e
+          Octo::Logger.error("background_task_prune_error", error: e)
+        end
+        # If an inbox item arrived during the ensure block — i.e. AFTER the
+        # last in-loop drain but BEFORE we released @run_mutex — handle it
+        # on a fresh thread so we don't block the caller.
+        flush_inbox_after_run
+      end
+      end  # @run_mutex.synchronize
+    end
+    # Drain ALL pending inbox items into @history. Called at the top of every
+    # iteration inside the run loop so messages land within one LLM turn of
+    # arrival — never deferred until the whole run completes.
+    #
+    # Returns true if anything was drained, false if the inbox was empty.
+    private def drain_inbox_into_history!(task_id)
+      items = nil
+      @state_mutex.synchronize do
+        return false if @inbox.empty?
+        items = @inbox.dup
+        @inbox.clear
+      end
+      # Coalesce consecutive bg notifications into one system_injected msg
+      bg_bubbles = []
+      bg_bodies  = []
+      flush_bg = lambda do
+        next if bg_bodies.empty?
+        bg_bubbles.each { |b| emit_bubble_for_notification(b) }
+        @history.append({
+          role:            "user",
+          content:         bg_bodies.join("\n\n"),
+          system_injected: true,
+          task_id:         task_id,
+          created_at:      Time.now.to_f
+        })
+        bg_bubbles = []
+        bg_bodies  = []
+      end
+      items.each do |item|
+        case item[:kind]
+        when :bg_notification
+          bg_bubbles << item[:bubble]
+          bg_bodies  << format_notification_for_history(item[:content])
+        when :user_msg
+          flush_bg.call
+          created_at = item[:enqueued_at] || Time.now
+          if item[:processed]
+            append_processed_user_message_to_history!(item[:processed], task_id)
+            @ui&.show_user_message(
+              item[:processed][:user_content],
+              files: item[:processed][:display_files] || [],
+              created_at: created_at.to_f,
+              source: :web
+            )
+          else
+            @history.append({
+              role:       "user",
+              content:    item[:content],
+              task_id:    task_id,
+              created_at: created_at.to_f
+            })
+            @total_tasks += 1
+            @ui&.show_user_message(item[:content], created_at: created_at.to_f, source: :web)
+          end
+        else
+          Octo::Logger.warn("agent.unknown_inbox_kind", kind: item[:kind])
+        end
+      end
+      flush_bg.call
+      if items.any? { |i| i[:kind] == :user_msg }
+        remaining = @state_mutex.synchronize { @inbox.count { |i| i[:kind] == :user_msg } }
+        broadcast_user_message_queue_status(remaining)
+      end
+      Octo::Logger.info("agent.inbox_drained",
+        session_id: @session_id,
+        count:      items.size,
+        kinds:      items.group_by { |i| i[:kind] }.transform_values(&:size)
+      )
+      true
+    rescue => e
+      # Drain failed partway through: unprocessed items are lost from @inbox
+      # because we cleared it before the loop. Re-queue the survivors.
+      survivors = items.compact
+      unless survivors.empty?
+        @state_mutex.synchronize do
+          @inbox.unshift(*survivors)
+        end
+        Octo::Logger.warn("agent.drain_inbox_recovered",
+          session_id: @session_id,
+          recovered:  survivors.size,
+          error:      e.message
+        )
+      end
+      Octo::Logger.error("agent.drain_inbox_error",
+        session_id:    @session_id,
+        error:         e,
+        survivors:     survivors.size
+      )
+      false
+    end
+    # True if at least one item is currently queued in the inbox. Used by the
+    # run loop's "LLM said done — but should we really break?" check.
+    private def inbox_pending?
+      @state_mutex.synchronize { !@inbox.empty? }
+    end
+    # Public: count of pending :user_msg items in the inbox.
+    # Used by WebSocket reconnect to replay queue status to newly subscribed tabs.
+    def inbox_user_message_count
+      @state_mutex.synchronize { @inbox.count { |i| i[:kind] == :user_msg } }
+    end
+    # Public: snapshot of pending :user_msg items in the inbox, in a format
+    # ready for replay via UI#show_user_message on WebSocket reconnect.
+    # Each entry: { content:, files:, created_at: } — files is an array of
+    # display-file hashes (name, data_url, mime_type).
+    def inbox_user_messages_snapshot
+      @state_mutex.synchronize do
+        @inbox.select { |i| i[:kind] == :user_msg }.map do |item|
+          created_at = item[:enqueued_at] || Time.now
+          if item[:processed]
+            {
+              content:    item[:processed][:user_content],
+              files:      item[:processed][:display_files] || [],
+              created_at: created_at.to_f
+            }
+          else
+            {
+              content:    item[:content],
+              files:      [],
+              created_at: created_at.to_f
+            }
+          end
+        end
+      end
+    end
+    # Set @discard_threshold to now and (best-effort) raise AgentInterrupted
+    # into the thread currently inside Agent#run. Called by http_server's
+    # interrupt_session in addition to the existing session[:thread].raise —
+    # the existing path only catches user-msg runs (whose thread is tracked
+    # in session[:thread]).
+    #
+    # Idempotent: harmless to call multiple times. Best-effort: Thread#raise
+    # against a thread blocked deep in a syscall may not fire immediately;
+    # the watchdog in http_server escalates if needed.
+    def interrupt_current_run!
+      target = nil
+      @state_mutex.synchronize do
+        @discard_threshold = Time.now
+        target = @current_run_thread
+      end
+      return false unless target
+      begin
+        target.raise(Octo::AgentInterrupted, "Interrupted by user")
+      rescue StandardError
+        # Thread may have just exited; nothing to do.
+      end
+      true
+    end
+    # True iff a thread is currently inside Agent#run (between acquiring
+    # @run_mutex and releasing it). Server-layer callers use this to decide
+    # whether a new user message can be enqueued (run in flight will drain
+    # it) or needs a fresh run() to be spawned (agent is idle).
+    def in_run_loop?
+      @state_mutex.synchronize { @in_run_loop }
+    end
+    # Queue a user message (text and/or files) into the inbox. Returns a
+    # tristate describing what the caller should do next:
+    #   :running       — a run is currently in flight; the in-loop drain at
+    #                    the next iteration boundary will pick this up.
+    #                    Caller does NOT spawn a new run.
+    #   :spawn         — agent is idle AND no other caller has been told to
+    #                    spawn yet. Caller IS responsible for spawning a
+    #                    drain-only run (typically via run_agent_task so the
+    #                    thread is registered for interrupt_session).
+    #   :spawn_pending — agent is idle BUT another concurrent caller has
+    #                    already been told to spawn. Caller does NOT spawn —
+    #                    the other run will absorb this message too.
+    #
+    # Files are processed eagerly **on the caller's thread** (typically the
+    # HTTP-handler thread) so the processed payload is fully formed by the
+    # time it sits in the inbox. The agent thread's drain then just appends
+    # to @history — no @history mutation off-thread.
+    def enqueue_user_message(content, files: [])
+      processed = nil
+      if files && !files.empty?
+        processed = process_files_for_user_message(content, files)
+      end
+      result = nil
+      pending_user_msgs = 0
+      @state_mutex.synchronize do
+        @inbox << {
+          kind:        :user_msg,
+          content:     content.to_s,
+          processed:   processed,
+          enqueued_at: Time.now
+        }
+        pending_user_msgs = @inbox.count { |i| i[:kind] == :user_msg }
+        if @in_run_loop
+          result = :running
+        elsif @inbox_run_pending
+          result = :spawn_pending
+        else
+          @inbox_run_pending = true
+          result = :spawn
+        end
+      end
+      # Only broadcast the "N waiting" hint when the message will actually
+      # WAIT behind an in-flight run. For :spawn / :spawn_pending the agent
+      # will drain it within milliseconds, so flashing a count then
+      # immediately clearing it would just be visual noise.
+      if result == :running
+        broadcast_user_message_queue_status(pending_user_msgs)
+      end
+      Octo::Logger.info("agent.user_message_enqueued",
+        session_id: @session_id,
+        decision: result,
+        has_files: !processed.nil?,
+        pending_user_msgs: pending_user_msgs
+      )
+      result
+    end
+    private def broadcast_user_message_queue_status(count)
+      @ui&.update_user_message_queue_status(pending: count)
+    rescue => e
+      Octo::Logger.error("agent.user_queue_status_error",
+        session_id: @session_id,
+        error: e
+      )
+    end
+    # Called by BackgroundTaskRegistry when a fire-and-forget background task
+    # completes. Two delivery paths depending on agent state:
+    #   - Agent is mid-run  → enqueue; the per-iteration drain picks it up
+    #   - Agent is idle     → start a fresh run on the caller's thread
+    def resume_with_notification(notification_content, bubble: nil)
+      enqueue_at = Time.now
+      should_run = false
+      @state_mutex.synchronize do
+        if @in_run_loop
+          @inbox << {
+            kind:        :bg_notification,
+            content:     notification_content,
+            bubble:      bubble,
+            enqueued_at: enqueue_at
+          }
+          Octo::Logger.info("agent.notification_queued",
+            session_id: @session_id,
+            queue_size: @inbox.size
+          )
+          return
+        end
+        should_run = true
+      end
+      return unless should_run
+      emit_bubble_for_notification(bubble)
+      formatted = format_notification_for_history(notification_content)
+      run("", system_notification: formatted, _bg_enqueued_at: enqueue_at)
+    end
+    # Drain any items queued during this run's ensure window (after the last
+    # in-loop drain but before @run_mutex was released).
+    private def flush_inbox_after_run
+      drain_target = nil
+      @state_mutex.synchronize do
+        drain_target = @inbox.find { |i| i[:kind] == :user_msg } || @inbox.first
+      end
+      return unless drain_target
+      case drain_target[:kind]
+      when :user_msg
+        Thread.new do
+          Thread.current.name = "inbox-flush-user-#{@session_id[0, 8]}"
+          begin
+            run
+          rescue => e
+            Octo::Logger.error("agent.flush_inbox_user_error",
+              session_id: @session_id,
+              error: e
+            )
+          end
+        end
+      when :bg_notification
+        item = nil
+        @state_mutex.synchronize do
+          idx = @inbox.find_index { |i| i[:kind] == :bg_notification }
+          item = @inbox.delete_at(idx) if idx
+        end
+        return unless item
+        Thread.new do
+          Thread.current.name = "inbox-flush-bg-#{@session_id[0, 8]}"
+          begin
+            resume_with_notification(item[:content], bubble: item[:bubble])
+          rescue => e
+            Octo::Logger.error("agent.flush_inbox_bg_error",
+              session_id: @session_id,
+              error: e
+            )
+          end
+        end
+      end
+    end
+    private def format_notification_for_history(content)
+      <<~MSG.strip
+        [SYSTEM NOTIFICATION - NOT USER INPUT]
+        This is an automated background-task event, NOT a message from the user.
+        Do NOT interpret this as user acknowledgement, confirmation, or response
+        to any pending question.
+        <task-notification>
+        #{content}
+        </task-notification>
+      MSG
+    end
+    private def emit_bubble_for_notification(bubble)
+      return unless bubble && @ui
+      @ui.show_background_task_notice(
+        command: bubble[:command],
+        handle_id: bubble[:handle_id],
+        status: bubble[:status]
+      )
+    rescue => e
+      Octo::Logger.error("agent.bubble_emit_error",
+        session_id: @session_id,
+        error: e
+      )
+    end
+    private def broadcast_background_tasks_snapshot
+      return unless @ui
+      now = Time.now
+      snapshot = BackgroundTaskRegistry.list_running(agent_session_id: @session_id).map do |t|
+        elapsed = t[:started_at] ? (now - t[:started_at]).round : 0
+        {
+          handle_id:  t[:handle_id],
+          command:    t[:command],
+          started_at: t[:started_at],
+          elapsed:    elapsed
+        }
+      end
+      @ui.update_background_tasks(running: snapshot.size, tasks: snapshot)
+    rescue => e
+      Octo::Logger.error("agent.broadcast_bg_tasks_error",
+        session_id: @session_id,
+        error: e
+      )
+    end
+    private def format_terminal_notification(task_result, tool_use_id: nil)
+      handle_id       = task_result[:handle_id]
+      command         = task_result[:command]
+      output_file     = task_result[:output_file]
+      elapsed_seconds = task_result[:elapsed_seconds]
+      broadcast_background_tasks_snapshot
+      status, summary = derive_status_and_summary(task_result, command)
+      parts = []
+      parts << "<task-id>#{handle_id}</task-id>"            if handle_id
+      parts << "<tool-use-id>#{tool_use_id}</tool-use-id>"  if tool_use_id
+      parts << "<command>#{command}</command>"              if command
+      parts << "<status>#{status}</status>"
+      if task_result[:exit_code]
+        parts << "<exit-code>#{task_result[:exit_code]}</exit-code>"
+      end
+      if elapsed_seconds
+        parts << "<elapsed-seconds>#{elapsed_seconds}</elapsed-seconds>"
+      end
+      parts << "<output-file>#{output_file}</output-file>"  if output_file
+      if task_result[:full_output_file]
+        parts << "<full-output-file>#{task_result[:full_output_file]}</full-output-file>"
+      end
+      parts << "<summary>#{summary}</summary>"
+      siblings = BackgroundTaskRegistry.list_running(agent_session_id: @session_id)
+      if siblings.any?
+        sibling_lines = siblings.map do |s|
+          cmd = s[:command].to_s
+          cmd = cmd.length > 60 ? "#{cmd[0, 57]}..." : cmd
+          elapsed = s[:started_at] ? (Time.now - s[:started_at]).round : nil
+          elapsed_s = elapsed ? "#{elapsed}s" : "?"
+          "  <sibling-task><handle-id>#{s[:handle_id]}</handle-id><command>#{cmd}</command><elapsed>#{elapsed_s}</elapsed></sibling-task>"
+        end
+        parts << "<sibling-tasks>\n#{sibling_lines.join("\n")}\n</sibling-tasks>"
+      end
+      {
+        content: parts.join("\n"),
+        bubble:  { command: command, handle_id: handle_id, status: status }
+      }
+    end
+    private def derive_status_and_summary(task_result, command)
+      cmd_label = command ? "`#{command}`" : "background terminal task"
+      last_line = last_nonempty_line(task_result[:output])
+      if task_result[:cancelled]
+        ["cancelled", "#{cmd_label} cancelled by user"]
+      elsif task_result[:error]
+        ["error", "#{cmd_label} watcher error: #{task_result[:error]}"]
+      elsif task_result[:exit_code]
+        verb = task_result[:exit_code].zero? ? "exited 0" : "exited #{task_result[:exit_code]}"
+        body = "#{cmd_label} #{verb}"
+        body = "#{body} — last: #{last_line.inspect}" if last_line
+        [(task_result[:exit_code].zero? ? "success" : "failed"), body]
+      else
+        ["success", "#{cmd_label} completed"]
+      end
+    end
+    private def last_nonempty_line(output)
+      return nil if output.nil? || output.to_s.empty?
+      line = output.to_s.lines.map(&:chomp).reject { |l| l.strip.empty? }.last
+      return nil if line.nil? || line.empty?
+      line.length > 200 ? "#{line[0, 200]}…" : line
+    end
+    private def think
+      # Check API key before starting progress indicator
+      if @client.instance_variable_get(:@api_key).nil? || @client.instance_variable_get(:@api_key).empty?
+        @ui&.show_error("API key is not configured! Please run /config to set up your API key.")
+        raise AgentError, "API key is not configured"
+      end
+      # Ensure a thinking progress indicator is live for the duration of this
+      # LLM turn. This is idempotent — if `run` already started one at task
+      # entry (or a previous iteration left one running), the UI recognizes
+      # the bare reentry and preserves the existing spinner.
+      @ui&.show_progress
+      # Check if compression is needed
+      compression_context = compress_messages_if_needed(force: false)
+      # If compression is triggered, insert compression message and handle it
+      if compression_context
+        # Show compression start notification
+        @ui&.show_info(
+          "Message history compression starting (~#{compression_context[:original_token_count]} tokens, #{compression_context[:original_message_count]} messages) - Level #{compression_context[:compression_level]}"
+        )
+        compression_message = compression_context[:compression_message]
+        @history.append(compression_message)
+        compression_handled = false
+        # Open a dedicated quiet-style handle for the compression work.
+        # This sits on top of the outer thinking progress (if any); Plan B
+        # semantics detach the outer spinner until we finish here. On any
+        # exception the ensure block in with_progress guarantees the
+        # handle is released — no more orphan gray ticker colliding with
+        # a yellow ticker (the original flicker bug).
+        #
+        # NOTE: safe-navigation (+&.+) with blocks silently skips the
+        # block when the receiver is nil. We need the compression work to
+        # run even when @ui is nil (e.g. in tests), so branch explicitly.
+        begin
+          if @ui
+            @ui.with_progress(message: "Compressing message history...", style: :quiet) do |handle|
+              response = call_llm
+              handle_compression_response(response, compression_context, progress: handle)
+              compression_handled = true
+            end
+          else
+            response = call_llm
+            handle_compression_response(response, compression_context)
+            compression_handled = true
+          end
+        ensure
+          # If interrupted or failed, roll back the speculative compression message
+          # so it doesn't pollute future conversation turns.
+          unless compression_handled
+            @history.rollback_before(compression_message)
+            # Also restore compression_level since compress_messages_if_needed already incremented it.
+            # Failure to do so would cause the next call to start at level 2 instead of 1,
+            # and more importantly would re-trigger compression on the very next think() call
+            # (with the user's new message as the last entry), producing consecutive user messages
+            # that confuse the LLM into echoing compression instructions.
+            @compression_level -= 1
+          end
+        end
+        return nil
+      end
+      # Normal LLM call. call_llm no longer manages the progress lifecycle;
+      # we keep the spinner live across the call and finalize it here so the
+      # UI transitions cleanly to the assistant message that follows.
+      response = nil
+      begin
+        response = call_llm
+      rescue
+        # Ensure the spinner is stopped on any error path before it bubbles up.
+        @ui&.show_progress(phase: "done")
+        raise
+      end
+      # Handle truncated responses (when max_tokens limit is reached)
+      if response[:finish_reason] == "length"
+        # Count recent truncations to prevent infinite loops
+        @task_truncation_count = (@task_truncation_count || 0) + 1
+        if @task_truncation_count >= 3
+          # Too many truncations - task is too complex
+          @ui&.show_progress(phase: "done")
+          @ui&.show_error("Response truncated multiple times. Task is too complex.")
+          # Create a response that tells the user to break down the task
+          error_response = {
+            content: "I apologize, but this task is too complex to complete in a single response. " \
+                     "Please break it down into smaller steps, or reduce the amount of content to generate at once.\n\n" \
+                     "For example, when creating a long document:\n" \
+                     "1. First create the file with a basic structure\n" \
+                     "2. Then use edit() to add content section by section",
+            finish_reason: "stop",
+            tool_calls: nil
+          }
+          # Add this as an assistant message so it appears in conversation
+          @history.append({
+            role: "assistant",
+            content: error_response[:content]
+          })
+          return error_response
+        end
+        # Preserve the truncated assistant message (text only, drop incomplete tool_calls)
+        # so the LLM sees what it attempted before. This also maintains the required
+        # user/assistant alternation for Bedrock Converse API.
+        truncated_text = response[:content] || ""
+        truncated_text = "..." if truncated_text.strip.empty?
+        truncated_msg = {
+          role: "assistant",
+          content: truncated_text,
+          task_id: @current_task_id
+        }
+        # Preserve reasoning_content on truncated turns as well.
+        # This is the real LLM-emitted reasoning — keeping it here lets
+        # MessageHistory#to_api recognize we're in thinking mode and pad any
+        # other synthetic assistant messages in the history with an empty
+        # reasoning_content automatically (see message_history.rb).
+        truncated_msg[:reasoning_content] = response[:reasoning_content] if response[:reasoning_content]
+        @history.append(truncated_msg)
+        # Insert system message to guide LLM to retry with smaller steps
+        @history.append({
+          role: "user",
+          content: "[SYSTEM] Your previous response was truncated because it exceeded the output token limit (max_tokens=#{@config.max_tokens}). " \
+                   "The incomplete tool call has been discarded. Please retry with a different approach:\n" \
+                   "- For long file content: create the file with a basic structure first, then use edit() to add content section by section\n" \
+                   "- Break down large tasks into multiple smaller tool calls\n" \
+                   "- Keep each tool call argument under 2000 characters\n" \
+                   "- Use multiple tool calls instead of one large call",
+          truncated: true
+        })
+        # Close the current spinner so the warning appears cleanly;
+        # the recursive think() call below will reopen a new one.
+        @ui&.show_progress(phase: "done")
+        @ui&.show_warning("Response truncated (#{@task_truncation_count}/3). Retrying with smaller steps...")
+        # Persist the truncated assistant message and the system retry hint
+        # before the recursive think() so they survive a crash mid-retry.
+        checkpoint!
+        # Recursively retry
+        return think
+      end
+      # Add assistant response to history
+      msg = { role: "assistant", task_id: @current_task_id }
+      # Always include content field (some APIs require it even with tool_calls)
+      # Use empty string instead of null for better compatibility
+      msg[:content] = response[:content] || ""
+      # Only add tool_calls if they actually exist (don't add empty arrays)
+      if response[:tool_calls]&.any?
+        msg[:tool_calls] = format_tool_calls_for_api(response[:tool_calls])
+      end
+      # Store token_usage in the message so replay_history can re-emit it
+      msg[:token_usage] = response[:token_usage] if response[:token_usage]
+      # Store per-message latency — this is the source of truth (session.json)
+      # for all time-to-first-token / duration / throughput info. The status
+      # bar signal reads the last assistant message's latency; no separate
+      # config file or top-level session field is introduced.
+      if response[:latency]
+        msg[:latency] = response[:latency]
+        @latest_latency = response[:latency]
+        # Push to UI so the status-bar signal updates immediately after the
+        # model finishes (before any tool execution delays the next event).
+        @ui&.update_sessionbar(latency: response[:latency])
+      end
+      # Preserve reasoning_content from the real LLM response.
+      # This is the authoritative signal used by MessageHistory#to_api to
+      # detect thinking-mode providers (DeepSeek V4, Kimi K2 thinking, etc.)
+      # and automatically pad any synthetic assistant messages with an empty
+      # reasoning_content so every outgoing payload satisfies the provider's
+      # "reasoning_content must be passed back" contract.
+      msg[:reasoning_content] = response[:reasoning_content] if response[:reasoning_content]
+      @history.append(msg)
+      # Close the thinking spinner before returning. The caller (run loop)
+      # is about to render the assistant message and/or tool invocations,
+      # which should appear after the spinner disappears.
+      @ui&.show_progress(phase: "done")
+      response
+    end
+    private def act(tool_calls)
+      return { denied: false, feedback: nil, tool_results: [], awaiting_feedback: false } unless tool_calls
+      denied = false
+      feedback = nil
+      results = []
+      awaiting_feedback = false
+      tool_calls.each_with_index do |call, index|
+        # Resolve tool name: handle case-insensitive and common alias mismatches
+        # from different LLM providers (e.g. "read" → "file_reader", "Read" → "file_reader")
+        original_name = call[:name]
+        resolved = @tool_registry.resolve(call[:name])
+        if resolved && resolved != call[:name]
+          @debug_logs << {
+            timestamp: Time.now.iso8601,
+            event: "tool_name_resolved",
+            original: original_name,
+            resolved: resolved
+          }
+          call = call.merge(name: resolved)
+        elsif resolved.nil?
+          # Tool truly not found — let the rescue below handle it with a clear message
+        end
+        # Hook: before_tool_use
+        hook_result = @hooks.trigger(:before_tool_use, call)
+        if hook_result[:action] == :deny
+          @ui&.show_warning("Tool #{call[:name]} denied by hook")
+          results << build_error_result(call, hook_result[:reason] || "Tool use denied by hook")
+          next
+        end
+        # Show preview for edit and write tools even in auto-approve mode
+        if should_auto_execute?(call[:name], call[:arguments])
+          # In auto-approve mode, show preview for edit and write tools
+          if call[:name] == "edit" || call[:name] == "write"
+            show_tool_preview(call)
+          end
+        else
+          # Permission check (if not in auto-approve mode)
+          confirmation = confirm_tool_use?(call)
+          unless confirmation[:approved]
+            # Show denial warning only for user-initiated denials (not system-injected preview errors)
+            # Preview errors are already shown to user, no need to repeat
+            system_injected = confirmation[:system_injected]
+            unless system_injected
+              denial_message = "Tool #{call[:name]} denied"
+              if confirmation[:feedback] && !confirmation[:feedback].empty?
+                denial_message += ": #{confirmation[:feedback]}"
+              end
+              @ui&.show_warning(denial_message)
+            end
+            denied = true
+            user_feedback = confirmation[:feedback]
+            feedback = user_feedback if user_feedback
+            results << build_denied_result(call, user_feedback, system_injected)
+            # Auto-deny all remaining tools
+            remaining_calls = tool_calls[(index + 1)..-1] || []
+            remaining_calls.each do |remaining_call|
+              reason = user_feedback && !user_feedback.empty? ?
+                       user_feedback :
+                       "Auto-denied due to user rejection of previous tool"
+              results << build_denied_result(remaining_call, reason, system_injected)
+            end
+            break
+          end
+        end
+        # Special handling for request_user_feedback: don't show as tool call
+        unless call[:name] == "request_user_feedback"
+          @ui&.show_tool_call(call[:name], redact_tool_args(call[:arguments]))
+        end
+        # Execute tool
+        begin
+          tool = @tool_registry.get(call[:name])
+          # Parse and validate arguments with JSON repair capability
+          args = Utils::ArgumentsParser.parse_and_validate(call, @tool_registry)
+          # Special handling for TodoManager: inject todos array
+          if call[:name] == "todo_manager"
+            args[:todos_storage] = @todos
+          end
+          # Special handling for InvokeSkill: inject agent and skill_loader
+          if call[:name] == "invoke_skill"
+            args[:agent] = self
+            args[:skill_loader] = @skill_loader
+          end
+          # Special handling for Time Machine tools: inject agent
+          if ["undo_task", "redo_task", "list_tasks"].include?(call[:name])
+            args[:agent] = self
+          end
+          # Inject working_dir so tools don't rely on Dir.chdir global state
+          args[:working_dir] = @working_dir if @working_dir
+          # Show progress immediately for every tool execution so the user
+          # always knows the agent is working. Using +with_progress+ wraps
+          # the execution in an +ensure+ block so the spinner/ticker is
+          # released even if the tool raises or the user interrupts.
+          #
+          # +quiet_on_fast_finish: true+ means "if the tool completes in
+          # under FAST_FINISH_THRESHOLD_SECONDS, remove the progress line
+          # instead of leaving a permanent 'Executing edit… (0s)' log
+          # entry". The preceding `[=>] Edit(...)` tool-call line and the
+          # following `[<=] Modified 1 occurrence` result line already
+          # tell the full story — the middle progress frame is noise for
+          # instant tools like edit/write/read/glob/grep. Truly slow
+          # tools (terminal running a build, web_fetch) exceed the
+          # threshold and their final frame is preserved as usual.
+          result = nil
+          if @ui
+            progress_message = build_tool_progress_message(call[:name], args)
+            @ui.with_progress(
+              message: progress_message,
+              style: :quiet,
+              quiet_on_fast_finish: true
+            ) do
+              result = tool.execute(**args)
+            end
+          else
+            result = tool.execute(**args)
+          end
+          # Track modified files for Time Machine snapshots
+          track_modified_files(call[:name], args)
+          # If a terminal tool was started in async mode, register a callback
+          # so the agent is resumed when the task completes.
+          if call[:name] == "terminal" && result.is_a?(Hash) && result[:accepted] && result[:handle_id]
+            tool_use_id = call[:id]
+            BackgroundTaskRegistry.register_callback(
+              handle_id: result[:handle_id],
+              agent: self
+            ) do |task_result|
+              notification = format_terminal_notification(task_result, tool_use_id: tool_use_id)
+              resume_with_notification(notification[:content], bubble: notification[:bubble])
+            end
+            broadcast_background_tasks_snapshot
+          end
+          # After killing a terminal handle, immediately refresh the badge so
+          # the UI reflects the new count without waiting for a page reload.
+          if call[:name] == "terminal" && result.is_a?(Hash) && result[:killed]
+            broadcast_background_tasks_snapshot
+          end
+          # Hook: after_tool_use
+          @hooks.trigger(:after_tool_use, call, result)
+          # Update todos display after todo_manager execution
+          if call[:name] == "todo_manager"
+            @ui&.update_todos(@todos.dup)
+          end
+          # Special handling for request_user_feedback: emit as interactive feedback card
+          if call[:name] == "request_user_feedback"
+            # Pass the raw call arguments to show_tool_call so the WebUI controller
+            # can extract question/context/options and emit a "request_feedback" event
+            # (renders as a clickable card in the browser).
+            # Fallback UIs (terminal, IM channels) receive the formatted text message.
+            @ui&.show_tool_call(call[:name], call[:arguments])
+            if @config.permission_mode == :auto_approve
+              # auto_approve means no human is watching (unattended/scheduled tasks).
+              # Inject an auto_reply so the LLM makes a reasonable decision and keeps going.
+              result = result.merge(
+                auto_reply: "No user is available. Please make a reasonable decision based on the context and continue."
+              )
+            else
+              # confirm_all / confirm_safes — a human is present, truly wait for user input.
+              awaiting_feedback = true
+            end
+          else
+            # Use tool's format_result method to get display-friendly string
+            formatted_result = tool.respond_to?(:format_result) ? tool.format_result(result) : result.to_s
+            # Also try to get a structured UI representation for rich rendering
+            ui_payload = tool.respond_to?(:format_result_for_ui) ? tool.format_result_for_ui(result) : nil
+            @ui&.show_tool_result(formatted_result, ui_payload: ui_payload)
+          end
+          results << build_success_result(call, result)
+        rescue StandardError => e
+          # Log complete error information to debug_logs for troubleshooting
+          @debug_logs << {
+            timestamp: Time.now.iso8601,
+            event: "tool_execution_error",
+            tool_name: call[:name],
+            tool_args: call[:arguments],
+            error_class: e.class.name,
+            error_message: e.message,
+            backtrace: e.backtrace&.first(20) # Keep first 20 lines of backtrace
+          }
+          Octo::Logger.error("tool_execution_error", tool: call[:name], error: e)
+          @hooks.trigger(:on_tool_error, call, e)
+          @ui&.show_tool_error(e)
+          # Use build_denied_result with system_injected=true so LLM knows it can retry
+          results << build_denied_result(call, e.message, true)
+        end
+      end
+      {
+        denied: denied,
+        feedback: feedback,
+        tool_results: results,
+        awaiting_feedback: awaiting_feedback
+      }
+    end
+    private def observe(response, tool_results)
+      # Add tool results as messages
+      # Use Client to format results based on API type (Anthropic vs OpenAI)
+      return if tool_results.empty?
+      formatted_messages = @client.format_tool_results(response, tool_results, model: current_model)
+      formatted_messages.each { |msg| @history.append(msg.merge(task_id: @current_task_id)) }
+      # Append a follow-up `role:"user"` message for any image payloads that
+      # could not be delivered inside the tool message.
+      #
+      # Background: OpenAI-compatible APIs (OpenRouter, Gemini, GPT-4o, etc.)
+      # only accept image_url content blocks in `role:"user"` messages.  Putting
+      # base64 data in a `role:"tool"` message causes it to be JSON-encoded as
+      # plain text, inflating token counts by 20-40x.  The tool result carries a
+      # plain-text description for the LLM; the actual image is delivered here.
+      tool_results.each do |tr|
+        inject = tr[:image_inject]
+        next unless inject
+        mime_type  = inject[:mime_type]
+        base64_data = inject[:base64_data]
+        path       = inject[:path]
+        next unless mime_type && base64_data
+        data_url = "data:#{mime_type};base64,#{base64_data}"
+        label = path ? File.basename(path.to_s) : "image"
+        image_block = { type: "image_url", image_url: { url: data_url } }
+        image_block[:image_path] = path if path
+        image_content = [
+          { type: "text", text: "[Image: #{label}]" },
+          image_block
+        ]
+        @history.append({
+          role:             "user",
+          content:          image_content,
+          system_injected:  true,
+          task_id:          @current_task_id
+        })
+      end
+    end
+    # Enqueue an inline skill injection to be flushed after observe().
+    # Called by InvokeSkill#execute to avoid injecting during tool execution,
+    # which would break Bedrock's toolUse/toolResult pairing requirement.
+    # @param skill [Octo::Skill] The skill whose instructions should be injected
+    # @param task [String] The task description passed to the skill
+    def enqueue_injection(skill, task)
+      @pending_injections << { skill: skill, task: task }
+    end
+    # Redact volatile tmpdir paths from tool call arguments before showing in UI.
+    # @param args [String, Hash, nil] Raw tool arguments
+    # @return [String, Hash, nil] Redacted arguments (same type as input)
+    def redact_tool_args(args)
+      args
+    end
+    # Flush all pending inline skill injections into history.
+    # Must be called AFTER observe() so toolResult is appended before skill instructions,
+    # producing the correct message sequence for all API providers (especially Bedrock).
+    private def flush_pending_injections
+      return if @pending_injections.empty?
+      @pending_injections.each do |entry|
+        inject_skill_as_assistant_message(entry[:skill], entry[:task], @current_task_id)
+      end
+      @pending_injections.clear
+    end
+    # Check if agent is currently running
+    def running?
+      !@start_time.nil?
+    end
+    private def build_result(status = :success, error: nil)
+      task_iterations = @iterations - (@task_start_iterations || 0)
+      {
+        status: status,
+        session_id: @session_id,
+        iterations: task_iterations,
+        duration_seconds: Time.now - @start_time,
+        cache_stats: @task_cache_stats || @cache_stats,
+        history: @history,
+        error: error
+      }
+    end
+    private def format_tool_calls_for_api(tool_calls)
+      return nil unless tool_calls
+      valid = tool_calls.filter_map do |call|
+        func = call[:function] || call
+        name = func[:name] || call[:name]
+        arguments = func[:arguments] || call[:arguments]
+        # Skip malformed tool calls with nil name or arguments
+        next if name.nil? || arguments.nil?
+        {
+          id: call[:id],
+          type: call[:type] || "function",
+          function: {
+            name: name,
+            arguments: arguments
+          }
+        }
+      end
+      valid.any? ? valid : nil
+    end
+    private def register_builtin_tools
+      @tool_registry.register(Tools::Terminal.new(agent_session_id: @session_id))
+      @tool_registry.register(Tools::FileReader.new)
+      @tool_registry.register(Tools::Write.new)
+      @tool_registry.register(Tools::Edit.new)
+      @tool_registry.register(Tools::Glob.new)
+      @tool_registry.register(Tools::Grep.new)
+      @tool_registry.register(Tools::WebSearch.new)
+      @tool_registry.register(Tools::WebFetch.new)
+      @tool_registry.register(Tools::TodoManager.new)
+      @tool_registry.register(Tools::RequestUserFeedback.new)
+      @tool_registry.register(Tools::InvokeSkill.new)
+      @tool_registry.register(Tools::UndoTask.new)
+      @tool_registry.register(Tools::RedoTask.new)
+      @tool_registry.register(Tools::ListTasks.new)
+      @tool_registry.register(Tools::Browser.new)
+    end
+    # Fork a subagent with specified configuration
+    # The subagent inherits all messages and tools from parent agent
+    # Tools are not modified (for cache reuse), but forbidden tools are blocked at runtime via hooks
+    # @param model [String, nil] Model name to use (nil = use current model)
+    # @param forbidden_tools [Array<String>] List of tool names to forbid
+    # @param system_prompt_suffix [String, nil] Additional instructions (inserted as user message for cache reuse)
+    # @return [Agent] New subagent instance
+    def fork_subagent(model: nil, forbidden_tools: [], system_prompt_suffix: nil)
+      # Clone config to avoid affecting parent
+      subagent_config = @config.deep_copy
+      # Switch to specified model if provided
+      if model
+        if model == "lite"
+          # Special keyword: use lite model if available, otherwise fall back to default.
+          #
+          # Lite is now a *virtual* role — we don't require it to exist as a
+          # concrete entry in @models. Instead we derive it from whatever
+          # model the user is currently on (current_model), so switching
+          # primary models automatically re-pairs with the right lite
+          # companion (Claude → Haiku, DeepSeek V4-pro → V4-flash, ...).
+          lite_cfg = subagent_config.lite_model_config_for_current
+          if lite_cfg
+            if lite_cfg["virtual"]
+              # Provider-preset derived: apply the lite fields as a *session
+              # overlay* on the subagent's config — this intentionally avoids
+              # mutating the shared @models array / hashes which would pollute
+              # the parent agent's own current model (e.g. turning the parent's
+              # Opus entry into Haiku for the rest of the session).
+              subagent_config.apply_virtual_model_overlay!(
+                "api_key"          => lite_cfg["api_key"],
+                "base_url"         => lite_cfg["base_url"],
+                "model"            => lite_cfg["model"],
+                "anthropic_format" => lite_cfg["anthropic_format"]
+              )
+            elsif lite_cfg["id"]
+              # Explicit user-configured lite (from OCTO_LITE_* env): a
+              # real @models entry with a stable id. Switch to it normally.
+              subagent_config.switch_model_by_id(lite_cfg["id"])
+            end
+          end
+          # If no lite is resolvable, just use current (primary) model.
+        else
+          # Regular model name lookup — find the first model with a matching
+          # name and switch by its stable id.
+          target = subagent_config.models.find { |m| m["model"] == model }
+          if target && target["id"]
+            subagent_config.switch_model_by_id(target["id"])
+          else
+            raise AgentError, "Model '#{model}' not found in config. Available models: #{subagent_config.model_names.join(', ')}"
+          end
+        end
+      end
+      # Create new client for subagent
+      subagent_client = Octo::Client.new(
+        subagent_config.api_key,
+        base_url: subagent_config.base_url,
+        model: subagent_config.model_name,
+        anthropic_format: subagent_config.anthropic_format?
+      )
+      # Create subagent (reuses all tools from parent, inherits agent profile from parent)
+      # Subagent gets its own unique session_id.
+      subagent = self.class.new(
+        subagent_client,
+        subagent_config,
+        working_dir: @working_dir,
+        ui: @ui,
+        profile: @agent_profile.name,
+        session_id: Octo::SessionManager.generate_id,
+        source: @source
+      )
+      subagent.instance_variable_set(:@is_subagent, true)
+      # Inherit previous_total_tokens so the first iteration delta is calculated correctly
+      subagent.instance_variable_set(:@previous_total_tokens, @previous_total_tokens)
+      # Deep clone history to avoid cross-contamination.
+      # Dangling tool_calls (no tool_result yet) are cleaned up automatically by
+      # MessageHistory#append when the subagent appends its first user message.
+      cloned_messages = deep_clone(@history.to_a)
+      subagent.instance_variable_set(:@history, MessageHistory.new(cloned_messages))
+      # Append system prompt suffix as user message (for cache reuse)
+      if system_prompt_suffix
+        subagent_history = subagent.history
+        # Build forbidden tools notice if any tools are forbidden
+        forbidden_notice = if forbidden_tools.any?
+          tool_list = forbidden_tools.map { |t| "`#{t}`" }.join(", ")
+          "\n\n[System Notice] The following tools are disabled in this subagent and will be rejected if called: #{tool_list}"
+        else
+          ""
+        end
+        subagent_history.append({
+          role: "user",
+          content: "CRITICAL: TASK CONTEXT SWITCH - FORKED SUBAGENT MODE\n\nYou are now running as a forked subagent — a temporary, isolated agent spawned by the parent agent to handle a specific task. You run independently and cannot communicate back to the parent mid-task. When you finish (i.e., you stop calling tools and return a final response), your output will be automatically summarized and returned to the parent agent as a result so it can continue.\n\n#{system_prompt_suffix}#{forbidden_notice}",
+          system_injected: true,
+          subagent_instructions: true
+        })
+        # Insert an assistant acknowledgement so the conversation structure is complete:
+        #   [user] role/constraints  →  [assistant] ack  →  [user] actual task (from run())
+        subagent_history.append({
+          role: "assistant",
+          content: "Understood. I am now operating as a subagent with the constraints above. Please provide the task.",
+          system_injected: true
+        })
+      end
+      # Register hook to forbid certain tools at runtime (doesn't affect tool registry for cache)
+      if forbidden_tools.any?
+        subagent.add_hook(:before_tool_use) do |call|
+          if forbidden_tools.include?(call[:name])
+            {
+              action: :deny,
+              reason: "Tool '#{call[:name]}' is forbidden in this subagent context"
+            }
+          else
+            { action: :allow }
+          end
+        end
+      end
+      # Mark subagent metadata for summary generation
+      subagent.instance_variable_set(:@is_subagent, true)
+      subagent.instance_variable_set(:@parent_message_count, @history.size)
+      subagent
+    end
+    # Generate summary from subagent execution
+    # Extracts new messages added by subagent and creates a concise summary
+    # This summary will replace the subagent instructions message in parent agent
+    # @param subagent [Agent] The subagent that completed execution
+    # @return [String] Summary text to insert into parent agent
+    def generate_subagent_summary(subagent)
+      parent_count = subagent.instance_variable_get(:@parent_message_count) || 0
+      new_messages = subagent.history.to_a[parent_count..] || []
+      # Extract tool calls
+      tool_calls = new_messages
+        .select { |m| m[:role] == "assistant" && m[:tool_calls] }
+        .flat_map { |m| m[:tool_calls].map { |tc| tc[:name] } }
+        .uniq
+      # Extract final assistant response
+      last_response = new_messages
+        .reverse
+        .find { |m| m[:role] == "assistant" && m[:content] && !m[:content].empty? }
+        &.dig(:content)
+      # Build summary (this will replace the subagent instructions message)
+      parts = []
+      parts << "[SUBAGENT SUMMARY]"
+      parts << "Completed in #{subagent.iterations} iterations"
+      parts << "Tools used: #{tool_calls.join(', ')}" if tool_calls.any?
+      parts << ""
+      parts << "Results:"
+      parts << (last_response || "(No response)")
+      parts.join("\n")
+    end
+    # Deep clone helper for messages using Marshal
+    # @param obj [Object] Object to clone
+    # @return [Object] Deep cloned object
+    private def deep_clone(obj)
+      Marshal.load(Marshal.dump(obj))
+    end
+    # Format user content with optional images
+    # PDF files are handled upstream (server injects file path into message text),
+    # so this method only needs to handle images.
+    # @param text [String] User's text input
+    # @param images [Array<String>] Array of image file paths or data: URLs
+    # @param files [Array] Unused — kept for signature compatibility
+    # @return [String|Array] String if no images, Array with content blocks otherwise
+    # Pure: process a user message's text + file attachments into the data
+    # structures needed for @history append, WITHOUT touching @history itself.
+    # Safe to call from any thread (HTTP-handler thread or agent thread) —
+    # only mutates argument-local state and runs the FileProcessor subprocess.
+    #
+    # Returns a Hash:
+    #   {
+    #     user_content:  String or content-block Array (text + vision blocks),
+    #     display_files: Array<{name, type, preview_path}> for replay bubbles,
+    #     file_prompt:   String (system_injected file references for LLM, "" if none)
+    #   }
+    #
+    # The companion +append_processed_user_message_to_history!+ takes this
+    # hash and does the actual append — that part MUST run on the
+    # @run_mutex-holding thread.
+    private def process_files_for_user_message(content, files)
+      image_files, disk_files = partition_files(Array(files))
+      vision_images, downgraded = resolve_vision_images(image_files)
+      all_disk_files = disk_files + downgraded
+      # Format user message — text + inline vision images
+      user_content = format_user_content(content, vision_images.map { |v| { url: v[:url], path: v[:path] } })
+      # Parse disk files — process_path runs the parser script and returns a FileRef.
+      all_disk_files = all_disk_files.map do |f|
+        path = f[:path] || f["path"]
+        name = f[:name] || f["name"]
+        next f unless path && File.exist?(path.to_s)
+        downgrade_reason = f[:downgrade_reason] || f["downgrade_reason"]
+        ref = Utils::FileProcessor.process_path(path, name: name)
+        { name: ref.name, type: ref.type.to_s, path: ref.original_path,
+          preview_path: ref.preview_path, parse_error: ref.parse_error, parser_path: ref.parser_path,
+          downgrade_reason: downgrade_reason }
+      end
+      display_files = all_disk_files.filter_map do |f|
+        name = f[:name] || f["name"]
+        next unless name
+        { name: name, type: f[:type] || f["type"] || "file",
+          preview_path: f[:preview_path] || f["preview_path"] }
+      end
+      all_meta_files = vision_images.map { |v|
+        { name: v[:name], type: "image", size_bytes: v[:size_bytes], path: v[:path] }
+      } + all_disk_files
+      file_prompt = build_file_prompt(all_meta_files)
+      {
+        user_content:  user_content,
+        display_files: display_files,
+        file_prompt:   file_prompt
+      }
+    end
+    # Mutates @history. Caller MUST hold @run_mutex (i.e. this is called
+    # from inside Agent#run, either from the user-message-mode branch
+    # directly or from drain_inbox_into_history! processing a user_msg
+    # item whose files were pre-processed at HTTP-entry time).
+    private def append_processed_user_message_to_history!(processed, task_id)
+      @history.append({
+        role:          "user",
+        content:       processed[:user_content],
+        task_id:       task_id,
+        created_at:    Time.now.to_f,
+        display_files: processed[:display_files].empty? ? nil : processed[:display_files]
+      })
+      @total_tasks += 1
+      file_prompt = processed[:file_prompt]
+      unless file_prompt.nil? || file_prompt.empty?
+        @history.append({
+          role:            "user",
+          content:         file_prompt,
+          system_injected: true,
+          task_id:         task_id
+        })
+      end
+    end
+    # Build the system_injected file-prompt string from an Array of file
+    # metadata hashes. Returns "" if there are no files. Extracted so both
+    # process_files_for_user_message and any future caller share one shape.
+    private def build_file_prompt(all_meta_files)
+      return "" if all_meta_files.empty?
+      all_meta_files.filter_map do |f|
+        name             = f[:name]             || f["name"]
+        type             = f[:type]             || f["type"]
+        path             = f[:path]             || f["path"]
+        preview_path     = f[:preview_path]     || f["preview_path"]
+        size_bytes       = f[:size_bytes]       || f["size_bytes"]
+        parse_error      = f[:parse_error]      || f["parse_error"]
+        parser_path      = f[:parser_path]      || f["parser_path"]
+        downgrade_reason = f[:downgrade_reason] || f["downgrade_reason"]
+        next unless name
+        lines = ["[File: #{name}]", "Type: #{type || "file"}"]
+        lines << "Size: #{format_size(size_bytes)}" if size_bytes
+        lines << "Original: #{path}" if path
+        lines << "Preview (Markdown): #{preview_path}" if preview_path
+        note = downgrade_note_for(downgrade_reason)
+        lines << "Note: #{note}" if note
+        if preview_path.nil? && parse_error
+          lines << "Parse failed: #{parse_error}"
+          if parser_path
+            expected_preview = "#{path}.preview.md"
+            lines << "Action required: fix the parser at #{parser_path}, then run:"
+            lines << "  ruby #{parser_path} #{path} > #{expected_preview}"
+            lines << "Once done, read #{expected_preview} to continue helping the user."
+          end
+        end
+        lines.join("\n")
+      end.join("\n\n")
+    end
+    # Partition files array into [image_files, non_image_files].
+    # Image files: have mime_type starting with "image/" OR have data_url present.
+    private def partition_files(files)
+      image_files = []
+      non_image_files = []
+      files.each do |f|
+        mime = f[:mime_type] || f["mime_type"] || ""
+        data_url = f[:data_url] || f["data_url"]
+        if mime.start_with?("image/") || data_url
+          image_files << f
+        else
+          non_image_files << f
+        end
+      end
+      [image_files, non_image_files]
+    end
+    # Resolve image files to vision data_urls.
+    # Files with data_url: use as-is (already compressed by frontend or adapter).
+    # Files with path: convert to data_url via FileProcessor.
+    #
+    # Downgrade to disk file refs (with a `downgrade_reason` tag) when:
+    #   - :provider_no_vision — current model does not support vision input
+    #     (e.g. MiniMax, Kimi, DeepSeek, or octo's DeepSeek sidecar).
+    #     The downgrade is capability-driven and reflects the *current* model;
+    #     switching models takes effect on the next run with no cached state.
+    #   - :too_large — base64 payload exceeds MAX_IMAGE_BYTES. Downgrading here
+    #     keeps a hot context window from blowing up on e.g. a 20MB screenshot.
+    #
+    # Both reasons share the same downgrade path; `file_prompt` will later
+    # emit a `Note:` line on the file entry explaining why the image isn't
+    # inline, so the LLM has colocated context (no system prompt pollution).
+    #
+    # @return [Array<Hash>, Array<Hash>] [vision_images, downgraded_disk_files]
+    private def resolve_vision_images(image_files)
+      require "base64"
+      max_bytes = Utils::FileProcessor::MAX_IMAGE_BYTES
+      # Capability check once per run — current_model_supports? is cheap and
+      # delegates to Providers.supports? under the hood, always reflecting
+      # the current model (no stale state on `/model` switch).
+      vision_supported = @config.current_model_supports?(:vision)
+      vision_images = []  # Array of { url:, name:, size_bytes:, path: }
+      downgraded    = []
+      image_files.each do |f|
+        name     = f[:name]     || f["name"]     || "image.jpg"
+        mime     = f[:mime_type] || f["mime_type"] || "image/jpeg"
+        data_url = f[:data_url]  || f["data_url"]
+        path     = f[:path]      || f["path"]
+        if data_url
+          b64_data  = data_url.split(",", 2).last.to_s
+          byte_size = (b64_data.bytesize * 3) / 4
+          raw       = Base64.decode64(b64_data)
+          file_ref  = Utils::FileProcessor.save_image_to_disk(body: raw, mime_type: mime, filename: name)
+          reason    = downgrade_reason_for(vision_supported, byte_size, max_bytes)
+          if reason
+            downgraded << { name: name, path: file_ref.original_path, type: "image",
+                            mime_type: mime, size_bytes: byte_size, downgrade_reason: reason }
+          else
+            vision_images << { url: data_url, name: name, size_bytes: byte_size, path: file_ref.original_path }
+          end
+        elsif path
+          begin
+            data_url_from_path = Utils::FileProcessor.image_path_to_data_url(path)
+            b64_data  = data_url_from_path.split(",", 2).last.to_s
+            byte_size = (b64_data.bytesize * 3) / 4
+            reason    = downgrade_reason_for(vision_supported, byte_size, max_bytes)
+            if reason
+              downgraded << { name: name, path: path, type: "image",
+                              mime_type: mime, size_bytes: byte_size, downgrade_reason: reason }
+            else
+              vision_images << { url: data_url_from_path, name: name, size_bytes: byte_size, path: path }
+            end
+          rescue => e
+            @ui&.log("Failed to load image #{name}: #{e.message}", level: :warn)
+          end
+        end
+      end
+      [vision_images, downgraded]
+    end
+    # Decide whether an image must be downgraded to a disk ref, and if so why.
+    # Precedence: provider capability is checked first — a text-only model
+    # can't use the image at any size, so there's no point re-checking size.
+    # @return [Symbol, nil] :provider_no_vision | :too_large | nil (keep inline)
+    private def downgrade_reason_for(vision_supported, byte_size, max_bytes)
+      return :provider_no_vision unless vision_supported
+      return :too_large if byte_size > max_bytes
+      nil
+    end
+    # Human-readable note for a downgrade reason, embedded next to the file
+    # entry in the file_prompt. Kept intentionally terse and factual; the LLM
+    # will see this alongside the file's name/type/path so it can tell the
+    # user honestly why it can't see the image.
+    # @return [String, nil] note text, or nil for no note
+    private def downgrade_note_for(reason)
+      case reason&.to_sym
+      when :provider_no_vision
+        "The current model does not support vision input. Image content is not visible to the model; suggest switching to a vision-capable model if the user needs image analysis."
+      when :too_large
+        "Image was too large for inline delivery and has been saved to disk. Read it with a vision-capable tool/model if needed."
+      end
+    end
+    # Build user message content for LLM.
+    # Returns plain String when no vision images; Array of content parts otherwise.
+    # Build user message content for LLM.
+    # vision_images: Array of String (plain url) OR Hash { url:, path: }
+    # path is stored in the block so history replay can reconstruct the image
+    # from the tmp file when the base64 data_url is no longer available.
+    private def format_user_content(text, vision_images)
+      vision_images ||= []
+      return text if vision_images.empty?
+      content = []
+      content << { type: "text", text: text } unless text.nil? || text.empty?
+      vision_images.each do |img|
+        if img.is_a?(Hash)
+          block = { type: "image_url", image_url: { url: img[:url] } }
+          block[:image_path] = img[:path] if img[:path]
+          content << block
+        else
+          content << { type: "image_url", image_url: { url: img } }
+        end
+      end
+      content
+    end
+    # Format byte size as human-readable string.
+    private def format_size(bytes)
+      return "0B" unless bytes
+      if bytes >= 1024 * 1024
+        "#{(bytes / 1024.0 / 1024.0).round(1)}MB"
+      elsif bytes >= 1024
+        "#{(bytes / 1024.0).round(0).to_i}KB"
+      else
+        "#{bytes}B"
+      end
+    end
+    # Inject a session context message (date + model) into the conversation.
+    # Only injects when:
+    #   1. No context message exists yet in this session, OR
+    #   2. The existing context is from a previous day (cross-day session)
+    # Marked with system_injected: true so existing filters (replay_history,
+    # get_recent_user_messages, etc.) automatically skip it.
+    # Cache-safe: always inserted just before the current user message,
+    # so no historical cache entries are ever invalidated.
+    private def inject_session_context_if_needed
+      today = Time.now.strftime("%Y-%m-%d")
+      # Skip if we already have a context for today
+      return if @history.last_session_context_date == today
+      inject_session_context
+    end
+    # Core method to inject session context (date, model, OS, paths).
+    # Called by inject_session_context_if_needed (with date check)
+    # and by switch_model (without date check, to force update).
+    #
+    # IMPORTANT: Skip injection when the system prompt hasn't been built yet.
+    # Otherwise, appending a user message to an empty history makes
+    # @history.empty? false, which causes run() to skip building the
+    # system prompt entirely (see run()'s "first run" guard).
+    # The injection will happen naturally in run() via
+    # inject_session_context_if_needed after the system prompt is in place.
+    private def inject_session_context
+      # Don't inject context before system prompt exists — defer to
+      # inject_session_context_if_needed which runs inside run()
+      # after the system prompt has been built.
+      return unless @history.has_system_prompt?
+      today   = Time.now.strftime("%Y-%m-%d")
+      os      = Octo::Utils::EnvironmentDetector.os_type
+      desktop = Octo::Utils::EnvironmentDetector.desktop_path
+      parts   = [
+        "Today is #{Time.now.strftime('%Y-%m-%d, %A')}",
+        "Current model: #{current_model}",
+        os != :unknown ? "OS: #{Octo::Utils::EnvironmentDetector.os_label}" : nil,
+        desktop ? "Desktop: #{desktop}" : nil,
+        "Working directory: #{@working_dir}"
+      ].compact.join(". ")
+      content = "[Session context: #{parts}]"
+      @history.append({
+        role: "user",
+        content: content,
+        system_injected: true,
+        session_context: true,
+        session_date: today
+      })
+    end
+    # Parse markdown file:// links from assistant message content.
+    # Handles both regular links and inline images:
+    #   [Download report](file:///path/to/file.pdf)
+    #   ![chart](file:///path/to/chart.png)
+    #
+    # Returns { text: String (original content, unmodified),
+    #           files: Array<{name:, path:, inline:}> }
+    private def parse_file_links(content)
+      return { text: content, files: [] } if content.nil? || content.empty?
+      files = []
+      content.scan(/(!?)\[([^\]]*)\]\(file:\/\/([^)]+)\)/) do
+        inline = $1 == "!"
+        # URL-decode percent-encoded characters (e.g. Chinese filenames encoded by AI)
+        raw_path = CGI.unescape($3)
+        name   = File.basename(raw_path)
+        path   = File.expand_path(raw_path)
+        Octo::Logger.info("[parse_file_links] raw=#{$3.inspect} expanded=#{path.inspect} exist=#{File.exist?(path)}")
+        files << { name: name, path: path, inline: inline }
+      end
+      { text: content, files: files }
+    end
+    # Emit assistant message to UI, parsing any embedded file:// links first.
+    #
+    # Local image URL rewriting (file:// → /api/local-image) is intentionally
+    # NOT done here. It is browser-specific (the Web UI runs on http://localhost
+    # and cannot load file:// directly) and must stay scoped to the Web UI
+    # controller. IM channel subscribers need the original file:// markdown so
+    # parse_file_links can extract paths and deliver images as native attachments.
+    private def emit_assistant_message(content, reasoning_content: nil)
+      # Prepend reasoning/thinking content (from thinking-mode providers like
+      # DeepSeek V4, Kimi K2) wrapped in <think> tags so the Web UI renders it
+      # as a collapsible thinking block (see sessions.js _renderMarkdown).
+      if reasoning_content && !reasoning_content.to_s.strip.empty?
+        full_content = "<think>\n#{reasoning_content}\n</think>\n#{content}"
+      else
+        full_content = content
+      end
+      return if full_content.nil? || full_content.to_s.strip.empty?
+      parsed = parse_file_links(content)
+      @ui&.show_assistant_message(full_content, files: parsed[:files])
+    end
+    # Track modified files for Time Machine snapshots
+    # @param tool_name [String] Name of the tool that was executed
+    # @param args [Hash] Arguments passed to the tool
+    def track_modified_files(tool_name, args)
+      @modified_files_in_task ||= []
+      case tool_name
+      when "write", "edit"
+        file_path = args[:path]
+        full_path = File.expand_path(file_path, @working_dir)
+        @modified_files_in_task << full_path unless @modified_files_in_task.include?(full_path)
+      end
+    end
+  end
+end