npm - inferoa - Versions diffs - 0.1.0 - Mend

inferoa 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (200) hide show

package/LICENSE +176 -0
package/README.md +154 -0
package/dist/src/app.d.ts +16 -0
package/dist/src/app.js +17 -0
package/dist/src/app.js.map +1 -0
package/dist/src/autoresearch/state.d.ts +106 -0
package/dist/src/autoresearch/state.js +469 -0
package/dist/src/autoresearch/state.js.map +1 -0
package/dist/src/cli.d.ts +2 -0
package/dist/src/cli.js +415 -0
package/dist/src/cli.js.map +1 -0
package/dist/src/code-intelligence/codegraph-engine.d.ts +55 -0
package/dist/src/code-intelligence/codegraph-engine.js +593 -0
package/dist/src/code-intelligence/codegraph-engine.js.map +1 -0
package/dist/src/code-intelligence/hub.d.ts +37 -0
package/dist/src/code-intelligence/hub.js +65 -0
package/dist/src/code-intelligence/hub.js.map +1 -0
package/dist/src/config/config.d.ts +12 -0
package/dist/src/config/config.js +229 -0
package/dist/src/config/config.js.map +1 -0
package/dist/src/config/defaults.d.ts +2 -0
package/dist/src/config/defaults.js +44 -0
package/dist/src/config/defaults.js.map +1 -0
package/dist/src/config/secret-vault.d.ts +3 -0
package/dist/src/config/secret-vault.js +106 -0
package/dist/src/config/secret-vault.js.map +1 -0
package/dist/src/context/compressor.d.ts +33 -0
package/dist/src/context/compressor.js +501 -0
package/dist/src/context/compressor.js.map +1 -0
package/dist/src/context/prompt.d.ts +26 -0
package/dist/src/context/prompt.js +572 -0
package/dist/src/context/prompt.js.map +1 -0
package/dist/src/daemon/serve.d.ts +2 -0
package/dist/src/daemon/serve.js +11 -0
package/dist/src/daemon/serve.js.map +1 -0
package/dist/src/daemon/supervisor.d.ts +33 -0
package/dist/src/daemon/supervisor.js +252 -0
package/dist/src/daemon/supervisor.js.map +1 -0
package/dist/src/goals/state.d.ts +105 -0
package/dist/src/goals/state.js +736 -0
package/dist/src/goals/state.js.map +1 -0
package/dist/src/model/endpoint-signals.d.ts +15 -0
package/dist/src/model/endpoint-signals.js +186 -0
package/dist/src/model/endpoint-signals.js.map +1 -0
package/dist/src/model/gateway.d.ts +11 -0
package/dist/src/model/gateway.js +455 -0
package/dist/src/model/gateway.js.map +1 -0
package/dist/src/plans/state.d.ts +28 -0
package/dist/src/plans/state.js +123 -0
package/dist/src/plans/state.js.map +1 -0
package/dist/src/runtime.d.ts +92 -0
package/dist/src/runtime.js +757 -0
package/dist/src/runtime.js.map +1 -0
package/dist/src/session/store.d.ts +84 -0
package/dist/src/session/store.js +593 -0
package/dist/src/session/store.js.map +1 -0
package/dist/src/session/workspace.d.ts +2 -0
package/dist/src/session/workspace.js +14 -0
package/dist/src/session/workspace.js.map +1 -0
package/dist/src/skills/registry.d.ts +24 -0
package/dist/src/skills/registry.js +203 -0
package/dist/src/skills/registry.js.map +1 -0
package/dist/src/tools/autoresearch-tools.d.ts +6 -0
package/dist/src/tools/autoresearch-tools.js +412 -0
package/dist/src/tools/autoresearch-tools.js.map +1 -0
package/dist/src/tools/clarify-tool.d.ts +3 -0
package/dist/src/tools/clarify-tool.js +107 -0
package/dist/src/tools/clarify-tool.js.map +1 -0
package/dist/src/tools/code-intelligence.d.ts +15 -0
package/dist/src/tools/code-intelligence.js +391 -0
package/dist/src/tools/code-intelligence.js.map +1 -0
package/dist/src/tools/context.d.ts +11 -0
package/dist/src/tools/context.js +2 -0
package/dist/src/tools/context.js.map +1 -0
package/dist/src/tools/goal-tools.d.ts +3 -0
package/dist/src/tools/goal-tools.js +279 -0
package/dist/src/tools/goal-tools.js.map +1 -0
package/dist/src/tools/omni-tools.d.ts +8 -0
package/dist/src/tools/omni-tools.js +349 -0
package/dist/src/tools/omni-tools.js.map +1 -0
package/dist/src/tools/permissions.d.ts +11 -0
package/dist/src/tools/permissions.js +74 -0
package/dist/src/tools/permissions.js.map +1 -0
package/dist/src/tools/plan-tools.d.ts +3 -0
package/dist/src/tools/plan-tools.js +314 -0
package/dist/src/tools/plan-tools.js.map +1 -0
package/dist/src/tools/process-tools.d.ts +6 -0
package/dist/src/tools/process-tools.js +199 -0
package/dist/src/tools/process-tools.js.map +1 -0
package/dist/src/tools/registry.d.ts +20 -0
package/dist/src/tools/registry.js +187 -0
package/dist/src/tools/registry.js.map +1 -0
package/dist/src/tools/schemas.d.ts +3 -0
package/dist/src/tools/schemas.js +500 -0
package/dist/src/tools/schemas.js.map +1 -0
package/dist/src/tools/skill-tools.d.ts +6 -0
package/dist/src/tools/skill-tools.js +124 -0
package/dist/src/tools/skill-tools.js.map +1 -0
package/dist/src/tools/text-args.d.ts +5 -0
package/dist/src/tools/text-args.js +22 -0
package/dist/src/tools/text-args.js.map +1 -0
package/dist/src/tools/web-search.d.ts +5 -0
package/dist/src/tools/web-search.js +602 -0
package/dist/src/tools/web-search.js.map +1 -0
package/dist/src/tools/workspace-tools.d.ts +17 -0
package/dist/src/tools/workspace-tools.js +561 -0
package/dist/src/tools/workspace-tools.js.map +1 -0
package/dist/src/tui/activity.d.ts +11 -0
package/dist/src/tui/activity.js +75 -0
package/dist/src/tui/activity.js.map +1 -0
package/dist/src/tui/ansi.d.ts +24 -0
package/dist/src/tui/ansi.js +131 -0
package/dist/src/tui/ansi.js.map +1 -0
package/dist/src/tui/app.d.ts +163 -0
package/dist/src/tui/app.js +4204 -0
package/dist/src/tui/app.js.map +1 -0
package/dist/src/tui/cache-footer.d.ts +21 -0
package/dist/src/tui/cache-footer.js +75 -0
package/dist/src/tui/cache-footer.js.map +1 -0
package/dist/src/tui/clarify.d.ts +14 -0
package/dist/src/tui/clarify.js +187 -0
package/dist/src/tui/clarify.js.map +1 -0
package/dist/src/tui/composer.d.ts +79 -0
package/dist/src/tui/composer.js +592 -0
package/dist/src/tui/composer.js.map +1 -0
package/dist/src/tui/event-view.d.ts +5 -0
package/dist/src/tui/event-view.js +392 -0
package/dist/src/tui/event-view.js.map +1 -0
package/dist/src/tui/home.d.ts +7 -0
package/dist/src/tui/home.js +92 -0
package/dist/src/tui/home.js.map +1 -0
package/dist/src/tui/markdown.d.ts +18 -0
package/dist/src/tui/markdown.js +271 -0
package/dist/src/tui/markdown.js.map +1 -0
package/dist/src/tui/mode-footer.d.ts +9 -0
package/dist/src/tui/mode-footer.js +62 -0
package/dist/src/tui/mode-footer.js.map +1 -0
package/dist/src/tui/plan-view.d.ts +8 -0
package/dist/src/tui/plan-view.js +45 -0
package/dist/src/tui/plan-view.js.map +1 -0
package/dist/src/tui/prompt-queue.d.ts +18 -0
package/dist/src/tui/prompt-queue.js +27 -0
package/dist/src/tui/prompt-queue.js.map +1 -0
package/dist/src/tui/resize.d.ts +7 -0
package/dist/src/tui/resize.js +15 -0
package/dist/src/tui/resize.js.map +1 -0
package/dist/src/tui/session-picker.d.ts +10 -0
package/dist/src/tui/session-picker.js +17 -0
package/dist/src/tui/session-picker.js.map +1 -0
package/dist/src/tui/session-transcript.d.ts +2 -0
package/dist/src/tui/session-transcript.js +44 -0
package/dist/src/tui/session-transcript.js.map +1 -0
package/dist/src/tui/slash-notice.d.ts +2 -0
package/dist/src/tui/slash-notice.js +9 -0
package/dist/src/tui/slash-notice.js.map +1 -0
package/dist/src/tui/slash.d.ts +21 -0
package/dist/src/tui/slash.js +103 -0
package/dist/src/tui/slash.js.map +1 -0
package/dist/src/tui/splash.d.ts +4 -0
package/dist/src/tui/splash.js +64 -0
package/dist/src/tui/splash.js.map +1 -0
package/dist/src/tui/tool-renderer.d.ts +6 -0
package/dist/src/tui/tool-renderer.js +1024 -0
package/dist/src/tui/tool-renderer.js.map +1 -0
package/dist/src/tui/transcript-spacing.d.ts +1 -0
package/dist/src/tui/transcript-spacing.js +4 -0
package/dist/src/tui/transcript-spacing.js.map +1 -0
package/dist/src/types.d.ts +220 -0
package/dist/src/types.js +2 -0
package/dist/src/types.js.map +1 -0
package/dist/src/util/abort.d.ts +3 -0
package/dist/src/util/abort.js +19 -0
package/dist/src/util/abort.js.map +1 -0
package/dist/src/util/clock.d.ts +2 -0
package/dist/src/util/clock.js +7 -0
package/dist/src/util/clock.js.map +1 -0
package/dist/src/util/fs.d.ts +13 -0
package/dist/src/util/fs.js +75 -0
package/dist/src/util/fs.js.map +1 -0
package/dist/src/util/hash.d.ts +6 -0
package/dist/src/util/hash.js +50 -0
package/dist/src/util/hash.js.map +1 -0
package/dist/src/util/limit.d.ts +11 -0
package/dist/src/util/limit.js +29 -0
package/dist/src/util/limit.js.map +1 -0
package/dist/src/util/types.d.ts +22 -0
package/dist/src/util/types.js +33 -0
package/dist/src/util/types.js.map +1 -0
package/dist/src/validation/acceptance.d.ts +12 -0
package/dist/src/validation/acceptance.js +251 -0
package/dist/src/validation/acceptance.js.map +1 -0
package/dist/src/validation/milestone.d.ts +2 -0
package/dist/src/validation/milestone.js +141 -0
package/dist/src/validation/milestone.js.map +1 -0
package/docs/final-acceptance-task.md +193 -0
package/docs/public-source-hygiene.md +21 -0
package/docs/roadmap.md +265 -0
package/docs/tui-product-design.md +270 -0
package/package.json +67 -0
package/skills/coding-workflow/SKILL.md +16 -0

package/docs/final-acceptance-task.md ADDED Viewed

@@ -0,0 +1,193 @@
+# Final Acceptance Task
+Inferoa is not considered complete until it passes a real end-to-end task
+with actual model endpoints.
+Unit tests, mock endpoints, and isolated smoke tests are necessary but not
+sufficient. The final acceptance task must prove that the implemented agent can
+use its built-in tools, manage context, and call vLLM ecosystem endpoints in one
+durable coding session.
+## Required Environment
+The final task should use real configured endpoints:
+- direct vLLM Engine endpoint for the coding model;
+- vLLM Semantic Router `auto` endpoint when available;
+- vLLM-Omni endpoint for multimodal tools;
+- external OpenAI-compatible provider profile for required compatibility
+  validation. The primary acceptance path should still prove vLLM ecosystem
+  endpoints unless a specific run is intentionally testing an external
+  provider.
+The planned AMD validation hosts are:
+- `165.245.131.56`
+- `134.199.199.149`
+One host should run or expose direct vLLM Engine. The other should run or expose
+vLLM-Omni. The exact host assignment can change, but the final report must
+record endpoint addresses, model names, server flags, and any unavailable
+capabilities.
+For project acceptance, these AMD endpoints are not assumed to already exist.
+The acceptance work includes gaining SSH/deployment access, installing or
+starting the required runtime stack, choosing models that fit the node GPU
+memory, exposing OpenAI-compatible endpoints, and recording deployment evidence.
+The Inferoa product should still treat those services as configured
+endpoints rather than embedding a general deployment controller.
+The AMD validation hosts are disposable for this project validation. Existing
+containers, model processes, ports, and partial deployments may be stopped and
+replaced during deployment. The final report should record what was cleaned,
+but the implementation does not need to preserve host state for backwards
+compatibility.
+The external provider path is also required. At minimum, setup and validation
+must prove one OpenAI-compatible external provider by entering credentials,
+probing `/v1/models`, selecting a model, and running a chat request through
+Inferoa. One current validation target exposes `tke/deepseek-v4-flash` in
+its model list. Raw API keys must not be committed to docs, config, progress
+logs, or evidence artifacts.
+## Required Task Shape
+Use a real coding task against a non-trivial local repository. The task must
+force the agent to use the core coding workflow:
+1. inspect the repository;
+2. use `file_search`;
+3. read files;
+4. use code-intelligence where supported;
+5. edit files;
+6. run shell commands or tests;
+7. maintain a task/evidence ledger;
+8. handle at least one long-running or background process record;
+9. produce a final explanation with evidence.
+The task should be large enough to make context optimization meaningful. It must
+trigger context compression either naturally or through a controlled test setup.
+The final report must show:
+- when compression was triggered;
+- what was preserved;
+- what was moved into managed resources;
+- prompt/token counts when available;
+- cached-token evidence when direct vLLM exposes it.
+## Required Multimodal Coverage
+The same acceptance run, or a linked continuation in the same durable session,
+must exercise endpoint-backed Omni tools:
+- image understanding;
+- image generation;
+- video generation.
+If the deployed Omni endpoint also supports video understanding, include it.
+If it does not, record the missing capability as an endpoint limitation rather
+than a passed test.
+Generated media should be stored as managed resources or artifacts, with stable
+references in the session log. The agent should not paste large binary or media
+payloads into the prompt.
+## Required Session And Supervisor Coverage
+The final acceptance task must prove long-horizon behavior:
+- session creation and resume;
+- durable event log replay;
+- single-writer lock behavior;
+- background process event records;
+- context compression and continued work after compression.
+After roadmap milestone T9 (Long-Horizon Supervisor TUI), the same task must also prove `inferoa daemon` behavior:
+- start a supervised run;
+- detach the terminal;
+- keep a long-running process or agent run alive;
+- reattach and inspect status/logs;
+- cancel or complete the supervised run;
+- suspend and resume safely if a permission prompt occurs.
+Before T9, daemon behavior can be recorded as not implemented, but the
+event/process schema must already be compatible with it.
+## Pass Criteria
+The final task passes only if all of these are true:
+- the coding task is completed by Inferoa using a real model endpoint;
+- built-in tools are used successfully, not only listed or mocked;
+- context compression occurs and work continues after compression;
+- image understanding works through the configured multimodal endpoint;
+- image generation works through the configured multimodal endpoint;
+- video generation works through the configured multimodal endpoint;
+- session events, resources, prompt hashes, and endpoint evidence are persisted;
+- direct vLLM cached-token evidence is recorded when the endpoint exposes it;
+- failures are limited to explicitly unavailable endpoint capabilities and are
+  recorded with concrete endpoint/model details.
+The project is not complete if the final evidence only shows unit tests, mock
+servers, or manual calls outside the agent.
+## Runner
+The prototype includes a real-endpoint acceptance runner:
+```bash
+node dist/src/cli.js debug acceptance --daemon
+```
+The runner checks configuration first and refuses to pass without:
+- `model_setup.base_url`;
+- `model_setup.model`;
+- Omni `vision`, `image_generation`, and `video_generation` endpoint
+  `base_url` plus `model` values.
+When configured, the acceptance workflow creates a durable session, forces
+compression, asks the model to complete a real repository edit using built-in
+tools, runs Omni multimodal tools through the agent tool loop, records endpoint
+evidence, and validates daemon attach/detach/status/cancel behavior.
+The final product acceptance must be driven from the TUI. The current CLI
+runner can remain as an automation scaffold, but it does not by itself satisfy
+final acceptance.
+The TUI acceptance run must show per-turn cache evidence after each chat turn.
+For direct vLLM this means cached prompt tokens, total prompt tokens, cache hit
+rate, output tokens, endpoint mode, model, and request id when the endpoint
+exposes those fields.
+The runner verifies persisted evidence rather than trusting the prompt alone.
+It checks for:
+- required tool calls by category: `file_search`, read, edit,
+  shell/background process, git, todo, evidence, code intelligence, and Omni;
+- background process start and stop/cancel events;
+- context compression followed by later model or tool work;
+- session resume evidence in the same durable session;
+- managed resources;
+- prompt hash and tool schema hash records;
+- endpoint evidence and cached-token fields when the endpoint exposes them;
+- daemon job status, attach, detach, and cancel records on the same session.
+## Final Report Requirements
+The final report must include:
+- repository and task description;
+- configured provider, direct vLLM, SR, and Omni endpoints;
+- model names;
+- vLLM engine flags relevant to prefix caching, prompt token details, request
+  ids, chunked prefill, and tool calling;
+- tool calls used by category;
+- files changed;
+- tests or commands run;
+- context compression evidence;
+- multimodal artifacts and resource ids;
+- session id and resume evidence;
+- daemon attach/detach evidence after T9;
+- remaining endpoint limitations or blockers.

package/docs/public-source-hygiene.md ADDED Viewed

@@ -0,0 +1,21 @@
+# Public Source Hygiene
+Public Inferoa documents and source should describe Inferoa on its own
+terms. Design research can inform private implementation work, but public
+materials must avoid naming unrelated products as inspirations, competitors, or
+implementation sources.
+Allowed in this repository:
+- Independent product positioning.
+- Generalized terminal-agent design pressures.
+- vLLM ecosystem-specific decisions.
+- Original module contracts and roadmap.
+Avoid in this repository:
+- Naming unrelated coding agents as sources for UX or implementation choices.
+- Copying prompts, UI language, tool schemas, command names, or file names from
+  unrelated products.
+- Recording third-party implementation details that are not necessary for
+  Inferoa's own design.

package/docs/roadmap.md ADDED Viewed

@@ -0,0 +1,265 @@
+# Roadmap
+This roadmap supersedes the earlier CLI-first M0-M8 implementation labels.
+The existing backend prototype is useful as scaffolding, but it does not satisfy
+the product goal until the user workflow is TUI-first end to end.
+## Product Contract
+Inferoa is a branded terminal application, not a collection of CLI
+subcommands with a small readline fallback.
+- `inferoa` launches the TUI by default.
+- `inferoa "prompt"` launches the TUI and submits the initial prompt in the
+  new or resumed session.
+- `inferoa setup` opens the TUI setup wizard.
+- `inferoa --print "prompt"` is the explicit non-interactive path.
+- This is a fast-development product, so there is no compatibility requirement
+  for the current CLI-first scaffold. Any command, flag, output format, or
+  workflow that conflicts with the TUI-first product contract should be removed
+  instead of preserved.
+- JSON and narrow debug commands may exist only when they support tests or
+  acceptance automation. They should not shape the user workflow.
+- The chat `/` command registry is a first-class TUI surface with its own
+  product-specific command set. It must not be a mirror of legacy CLI
+  subcommands.
+- The user-facing identity stays simple: current directory plus session
+  id/title. Internal workspace, run, client, prompt epoch, and cache salt ids
+  remain implementation details.
+## T0: Goal Reset And UI Direction
+- mark the earlier CLI-first prototype as scaffolding, not complete product;
+- lock the TUI-first entrypoint contract;
+- use `docs/tui-product-design.md` as the UI product contract;
+- define the Inferoa brand language for the terminal UI: inference-native,
+  fast, technical, cache-aware, and visually distinct;
+- define core scenes: welcome, setup, chat, sessions, tools, endpoints, daemon,
+  and acceptance;
+- define terminal animation rules for smooth streaming, tool progress, endpoint
+  probing, compression, and artifact creation;
+- define the canonical TUI slash command registry and delete incompatible CLI
+  subcommands or chat commands from the active user path;
+- update public docs after validation.
+Validation:
+- `inferoa --help` documents TUI-first behavior;
+- roadmap and README no longer present CLI-first commands as the main path;
+- no legacy command is retained solely for backwards compatibility.
+## T1: TUI Application Shell
+- implement a real terminal app shell with transcript, input editor, status
+  line, overlays, selector lists, notifications, and keyboard bindings;
+- add branded Inferoa welcome screen with workspace, endpoint, model,
+  session, git, context, and daemon status;
+- add slash command palette for setup, status, sessions, tools, endpoints,
+  daemon, and acceptance views;
+- add responsive terminal layout that works in narrow and wide panes;
+- keep rendering deterministic and testable through snapshot or ANSI output
+  checks.
+Validation:
+- `inferoa` opens the TUI;
+- slash command palette opens and can select a command;
+- terminal resize does not corrupt the layout.
+## T2: TUI Setup Wizard
+- move provider setup into TUI scenes, not plain CLI output;
+- support direct vLLM setup with endpoint URL, vault-backed API key, `/v1/models`
+  probing, and model selection;
+- support external OpenAI-compatible setup with endpoint URL, masked vault
+  secret entry, `/v1/models` probing, and model selection;
+- support `auto` setup through vLLM Semantic Router with `/v1/models` probing
+  when available;
+- support Omni endpoint setup for vision, image generation, video
+  understanding, video generation, audio understanding, and audio generation;
+- after the user enters a key or endpoint, actively probe the endpoint and show
+  a model picker instead of asking the user to type model ids manually;
+- write config only after a final review screen;
+- never persist raw pasted API keys in config; setup stores secrets in the
+  local encrypted vault and writes only `api_key_ref`.
+Validation:
+- setup can configure the provided OpenAI-compatible provider and list
+  `tke/deepseek-v4-flash`;
+- setup can configure direct vLLM and Omni endpoints from the AMD validation
+  deployment;
+- invalid endpoints produce actionable TUI errors.
+## T3: Chat And Tool Interaction TUI
+- render streaming assistant output in the transcript;
+- render tool calls as cards with status, duration, bounded output, and
+  expandable managed resources;
+- animate pending tools with smooth but bounded redraw cadence;
+- render file edits with diff previews and approval controls where policy
+  requires approval;
+- stabilize streaming edit previews so partial removals do not jitter before
+  matching additions arrive;
+- render line-numbered diffs with added/removed colors, indentation markers,
+  syntax-highlighted context, and intra-line changed-token emphasis;
+- render shell and background process tools with live output, stop controls,
+  and bounded buffers;
+- render git, todo, evidence, and code-intelligence results in compact
+  workflow cards;
+- support image and video artifacts as first-class transcript resources.
+Validation:
+- a real coding task uses file search, read, edit, shell/process, git, todo,
+  evidence, and code intelligence through the TUI;
+- permission prompts are handled inside the TUI;
+- file diff and shell/process output are visually inspectable without raw JSON.
+## T4: Sessions And Workspace UX
+- add TUI session picker with title, id, status, last updated time, and
+  workspace path;
+- add resume, archive, rename, and new-session flows;
+- support multiple independent sessions per workspace with a single active
+  writer lock per session;
+- show lock conflicts and stale lock recovery in the TUI;
+- keep internal workspace ids and client ids out of normal user output.
+Validation:
+- a session can be resumed from the TUI and continues the same event log;
+- concurrent terminals show clear session ownership state.
+## T5: Endpoint Evidence And vLLM Optimization
+- record direct vLLM cached-token usage when exposed;
+- record prompt hashes, tool schema hashes, endpoint request ids, response ids,
+  model ids, and usage metadata;
+- record `/tokenize` availability as optional endpoint evidence when available,
+  but do not require it for workflow token budgeting;
+- show endpoint capability status in the TUI without assuming direct access to
+  serving metrics;
+- after every assistant turn, render a compact cache/usage footer with prompt
+  tokens, cached prompt tokens, cache hit rate, output tokens, endpoint mode,
+  model, and request id when available;
+- expose a `/cache` or equivalent TUI view for recent turns and aggregate cache
+  evidence;
+- keep stable prompt sections and deterministic tool schema order within each
+  prompt epoch.
+Validation:
+- endpoint evidence is persisted and visible from the TUI;
+- direct vLLM cache evidence is recorded when the endpoint exposes it;
+- turns without provider cache fields omit cache-hit fields entirely; cache
+  hit rate is shown only when the endpoint exposes cached prompt tokens.
+## T6: Context Compression UX
+- estimate prompt size against configured context windows;
+- compact older middle context at the configured threshold;
+- mechanically prune large raw tool outputs into managed resources before
+  model summarization;
+- render compression events in the transcript with what was preserved, moved,
+  and summarized;
+- continue work after compression in the same session.
+Validation:
+- a controlled long task triggers compression;
+- the agent continues after compression, surfaces compression status in the
+  TUI transcript, and persists resume/compression evidence.
+## T7: AMD Endpoint Deployment And Validation
+Product code must not become a deployment controller, but the project
+acceptance environment must be deployed and validated by the project team.
+Planned AMD validation hosts:
+- `165.245.131.56`
+- `134.199.199.149`
+Required deployment shape:
+- one host exposes a direct vLLM Engine OpenAI-compatible endpoint for the
+  coding model;
+- one host exposes vLLM-Omni OpenAI-compatible endpoints for multimodal
+  tools;
+- deployed models must fit the host GPU memory and be supported by the
+  node's GPU/runtime stack;
+- existing containers, model processes, and occupied ports on the validation
+  hosts may be cleaned during deployment. The runbook should record what was
+  stopped or replaced, but it does not need to preserve pre-existing services;
+- the final report records endpoint URLs, model names, server flags, and
+  unavailable capabilities.
+Validation:
+- direct vLLM `/v1/models`, chat, tool calling, streaming, token usage, and
+  cached-token evidence work when exposed;
+- Omni image understanding, image generation, and video generation work through
+  Inferoa tools;
+- SSH/deployment access to both hosts is documented before this milestone can
+  pass.
+## T8: Auto Mode Through vLLM Semantic Router
+- configure `auto` mode through the TUI;
+- connect to vLLM Semantic Router as an endpoint, not as an owned deployment;
+- pass stable session identity headers;
+- preserve tool-loop continuity from the agent side;
+- record router-visible model selection metadata when available.
+Validation:
+- TUI setup can configure SR;
+- a coding session runs through SR and persists router evidence.
+## T9: Long-Horizon Supervisor TUI
+- add daemon job view with queued, running, detached, cancelled, failed, and
+  complete states;
+- support attach, detach, status, logs, and cancel from the TUI;
+- keep long-running processes alive after terminal detach where possible;
+- suspend safely when approval is required and resume after attach;
+- transfer session writer ownership to the daemon while a supervised run is
+  active.
+Validation:
+- daemon attach, detach, status, and cancel work from the TUI on the same final
+  acceptance task.
+## T10: Final Real-Endpoint Acceptance
+The project is complete only when the TUI-driven product completes a real
+end-to-end coding task with actual configured endpoints.
+Required coverage:
+- complete a real coding task using a real model endpoint;
+- use built-in tools: file search, read, edit, shell/process, git, todo,
+  evidence, and code intelligence where supported;
+- trigger context compression and continue after compression;
+- run image understanding through the configured Omni endpoint;
+- run image generation through the configured Omni endpoint;
+- run video generation through the configured Omni endpoint;
+- persist session events, resources, prompt hashes, endpoint evidence, and
+  resume evidence;
+- record direct vLLM cached-token evidence when exposed;
+- validate daemon attach, detach, status, and cancel behavior on the same final
+  task.
+## Later
+- local HTTP API;
+- local web dashboard;
+- standalone binary packaging;
+- richer codegraph index layer;
+- expanded multimodal workflows beyond endpoint-backed built-ins;
+- Responses API continuation support;
+- richer Semantic Router replay integration;
+- remote or multi-machine long-horizon supervision;
+- endpoint capability discovery for scheduler hints and cache diagnostics.