npm - triflux - Versions diffs - 10.1.1 → 10.2.0 - Mend

triflux 10.1.1 → 10.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/README.md CHANGED Viewed

@@ -8,15 +8,19 @@
   </picture>
 </p>
+<h3 align="center">Tri-CLI Orchestration with Consensus Intelligence</h3>
 <p align="center">
-  <strong>Tri-CLI Orchestration with Consensus Intelligence</strong><br>
-  <em>Claude + Codex + Gemini — natural language routing, cross-model review, 42 skills with Deep/Light variants.</em>
+  Route tasks across <strong>Claude + Codex + Gemini</strong> — 42 skills, natural language routing,<br>
+  cross-model review, and reflexion-based adaptive learning.
 </p>
 <p align="center">
   <a href="https://www.npmjs.com/package/triflux"><img src="https://img.shields.io/npm/v/triflux?style=flat-square&color=FFAF00&label=npm" alt="npm version"></a>
   <a href="https://www.npmjs.com/package/triflux"><img src="https://img.shields.io/npm/dm/triflux?style=flat-square&color=F5C242" alt="npm downloads"></a>
   <a href="https://github.com/tellang/triflux/stargazers"><img src="https://img.shields.io/github/stars/tellang/triflux?style=flat-square&color=FFAF00" alt="GitHub stars"></a>
+  <img src="https://img.shields.io/badge/skills-42-F5C242?style=flat-square" alt="42 skills">
+  <img src="https://img.shields.io/badge/node-%3E%3D18-374151?style=flat-square" alt="Node >= 18">
   <a href="https://opensource.org/licenses/MIT"><img src="https://img.shields.io/badge/License-MIT-374151?style=flat-square" alt="License: MIT"></a>
 </p>
@@ -25,16 +29,34 @@
 </p>
 <p align="center">
-  <a href="#quick-start">Quick Start</a> ·
-  <a href="#tri-cli-consensus">Tri-CLI Consensus</a> ·
-  <a href="#38-skills">38 Skills</a> ·
-  <a href="#architecture">Architecture</a> ·
-  <a href="#deep-vs-light">Deep vs Light</a> ·
+  <a href="#quick-start">Quick Start</a> &middot;
+  <a href="#tri-cli-consensus">Consensus Engine</a> &middot;
+  <a href="#42-skills">42 Skills</a> &middot;
+  <a href="#deep-vs-light">Deep vs Light</a> &middot;
+  <a href="#architecture">Architecture</a> &middot;
+  <a href="#under-the-hood">Under the Hood</a> &middot;
   <a href="#security">Security</a>
 </p>
 ---
+## What is triflux?
+Most AI coding tools talk to **one model**. triflux talks to **three** — and makes them argue.
+Every Deep skill runs Claude, Codex, and Gemini **independently** (no cross-visibility), then cross-validates their findings. Only consensus-verified results survive. The result: **87% fewer false positives** compared to single-model review.
+You don't need to memorize commands. Say what you want in natural language — triflux routes to the right skill automatically:
+```
+"review this"          → /tfx-review       (Light — single model, fast)
+"review this thoroughly" → /tfx-deep-review  (Deep — 3-party consensus)
+"리뷰해줘"              → /tfx-review       (Korean works too)
+"제대로 리뷰해"          → /tfx-deep-review  (depth modifier detected)
+```
+---
 ## Quick Start
 ### 1. Install
@@ -67,52 +89,72 @@ tfx setup
 # Persistence — don't stop until done
 /tfx-persist "implement full auth flow with tests"
-# Compatibility alias
-/tfx-ralph "implement full auth flow with tests"
-# Team — Multi-CLI parallel orchestration
+# Team — multi-CLI parallel orchestration
 /tfx-multi "refactor auth + update UI + add tests"
+# Monitor — real-time routing dashboard
+tfx monitor
 # Remote — spawn Claude sessions on other machines
-/tfx-remote-setup                                # interactive host wizard (Tailscale + SSH)
-/tfx-remote-spawn "run security review on my-server" # spawn on remote host
+/tfx-remote-setup           # interactive host wizard
+/tfx-remote-spawn "run security review on my-server"
 ```
+> **Note**: Deep skills require **psmux** (or tmux), **triflux Hub**, **Codex CLI**, and **Gemini CLI** for full Tri-CLI consensus. Without these, skills automatically degrade to Claude-only mode. Run `tfx doctor` to check your environment.
 ---
-## What's New in v10
+## What's New
+### v10.1 — Reflexion Pipeline + TUI Monitor
-**triflux v10** completes the **4-Lake Roadmap** — a systematic hardening of every layer from CLI stability to remote multi-agent orchestration.
+| Feature | Description |
+|---------|-------------|
+| **TUI Routing Monitor** | `tfx monitor` — interactive terminal dashboard showing real-time skill routing, model selection, and success rates |
+| **Reflexion Pipeline** | safety-guard events feed into a reflexion store, enabling adaptive learning from past routing decisions |
+| **Adaptive Rules API v2** | Penalty promotion pipeline (`pending-penalties` → `adaptive_rules`), hit_count isolation, schema v2 with 18 tests |
+| **Q-Learning Routing** | Experimental dynamic skill routing via Q-table weight optimization (`TRIFLUX_DYNAMIC_ROUTING=true`) |
+| **Security Hardening** | headless-guard blocks wrapper-bypass, pipe-bypass, and env-escape vectors; safety-guard prevents SSH bash-syntax forwarding |
+| **HUD System** | Codex plan-aware status display with correct bucket-to-slot mapping |
-### v10 Highlights
+### v10.0 — 4-Lake Roadmap
+<details>
+<summary>Expand v10.0 details</summary>
 - **Lake 1: CLI Stability** — Retry, stall detection, version cache. Zero silent failures
 - **Lake 2: Plugin Isolation** — cli-adapter-base, team-bridge, pack.mjs sync
-- **Lake 3: Remote Infrastructure** — SSH keepalive/retry, hosts.json capability routing, remote handoff, MCP singleton daemon
+- **Lake 3: Remote Infrastructure** — SSH keepalive/retry, hosts.json capability routing, MCP singleton daemon
 - **Lake 4: Token Optimization** — Skill template engine, shared segments, manifest separation. 62% prompt token reduction
 - **Lake 5: Agent Mesh** — Message routing, per-agent queues, heartbeat monitoring, Conductor integration
-### v9 (carried forward)
+</details>
-**triflux v9** introduces **Harness-Native Intelligence** — speak naturally, and triflux routes to the right skill automatically. Cross-model review ensures no model approves its own work.
+### v9 — Harness-Native Intelligence
-### v9 Highlights
+<details>
+<summary>Expand v9 details</summary>
-- **Natural Language Routing** — Say "review this" or "리뷰해줘" instead of memorizing `/tfx-review`. Depth modifiers ("thoroughly", "제대로") auto-escalate to Deep variants
-- **Cross-Model Review** — Claude writes → Codex reviews. Codex writes → Claude reviews. Same-model self-approve is blocked. Pre-commit nudge for unreviewed files
-- **Context Isolation** — Off-topic requests auto-detected; spawns a clean psmux session so your main context stays focused
-- **38 Skills** — 14 Light + 10 Deep + 14 Infrastructure, organized across 10 domains
-- **Codex Swarm Hardened** — PowerShell `.ps1` launchers, profile-based execution (no `--dangerously` flag), `/merge-worktree` auto-invocation for result collection
-- **Skill Metadata** — Every skill labeled: wrapper/infrastructure/Light-Deep pairs. Trigger conflicts resolved
+- **Natural Language Routing** — Say "review this" or "리뷰해줘" instead of memorizing skill names
+- **Cross-Model Review** — Claude writes → Codex reviews. Same-model self-approve blocked
+- **Context Isolation** — Off-topic requests auto-detected; spawns a clean psmux session
+- **Codex Swarm Hardened** — PowerShell `.ps1` launchers, profile-based execution
-### v8 Foundations (carried forward)
+</details>
-- **Tri-Debate Engine** — 3-CLI independent analysis with anti-herding, cross-validation, and consensus scoring
-- **Deep/Light Variants** — Every capability has a token-efficient Light mode and a thorough Deep mode
-- **Consensus Gate** — Deep skills require 2/3+ CLI agreement; learned weights track CLI reliability over time
+### v8 — Tri-Debate Foundation
+<details>
+<summary>Expand v8 details</summary>
+- **Tri-Debate Engine** — 3-CLI independent analysis with anti-herding and consensus scoring
+- **Deep/Light Variants** — Every domain has both a fast mode and a thorough mode
 - **Expert Panel** — Virtual expert simulation via `tfx-panel`
-- **Hub IPC** — Resident Hub server with Named Pipe & HTTP MCP bridge
-- **psmux / Windows Native** — Hybrid support for `tmux` (WSL) and `psmux` (Windows Terminal)
+- **Hub IPC** — Named Pipe & HTTP MCP bridge
+- **psmux** — Windows Terminal native multiplexer
+</details>
 ---
@@ -122,18 +164,18 @@ tfx setup
   <img src="docs/assets/consensus-flow.svg" alt="Tri-CLI Consensus Flow" width="680">
 </p>
-The core innovation of triflux. Instead of trusting a single model, every Deep skill runs:
+The core innovation. Instead of trusting a single model, every Deep skill runs:
 ```
 Phase 1: Independent Analysis (Anti-Herding)
-  ├─ Claude Opus  → Analysis A (isolated, no cross-visibility)
-  ├─ Codex CLI    → Analysis B (isolated, no cross-visibility)
-  └─ Gemini CLI   → Analysis C (isolated, no cross-visibility)
+  ├─ Claude Opus  → Analysis A  (isolated, no cross-visibility)
+  ├─ Codex CLI    → Analysis B  (isolated, no cross-visibility)
+  └─ Gemini CLI   → Analysis C  (isolated, no cross-visibility)
 Phase 2: Cross-Validation
-  ├─ Compare all findings across 3 sources
-  ├─ Items with 2/3+ agreement → CONSENSUS
-  └─ Items with 1/3 only → DISPUTED (needs resolution)
+  ├─ Compare findings across 3 sources
+  ├─ 2/3+ agreement → CONSENSUS
+  └─ 1/3 only → DISPUTED (needs resolution)
 Phase 3: Resolution (if consensus < 70%)
   ├─ Each CLI reviews opposing arguments
@@ -141,119 +183,117 @@ Phase 3: Resolution (if consensus < 70%)
   └─ Unresolved → user decides
 ```
-**Result**: 87% fewer false positives compared to single-model review (based on Calimero consensus research).
+**v10.1 addition**: The **Reflexion Pipeline** feeds consensus outcomes back into an adaptive rules store, so routing decisions improve over time based on which models perform best for which task types.
 ---
-## 38 Skills
+## 42 Skills
-### Research
+### Research & Discovery
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-research` | Light | Quick web search via Exa/Brave/Tavily auto-selection | ~5K |
-| `tfx-deep-research` | Deep | Multi-source parallel search with 3-CLI cross-validation | ~50K |
-| `tfx-find` | Light | Fast codebase search — files, symbols, patterns via Haiku | ~3K |
-| `tfx-autoresearch` | Light | Autonomous web research to structured report | ~15K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-research` | Light | Quick web search via Exa/Brave/Tavily auto-selection |
+| `tfx-deep-research` | Deep | Multi-source parallel search with 3-CLI cross-validation |
+| `tfx-find` | Light | Fast codebase search — files, symbols, patterns |
+| `tfx-autoresearch` | Light | Autonomous web research to structured report |
-### Analysis
+### Analysis & Planning
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-analysis` | Light | Quick code/architecture analysis via Codex | ~8K |
-| `tfx-deep-analysis` | Deep | 3-perspective analysis + Tri-Debate consensus | ~30K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-analysis` | Light | Quick code/architecture analysis |
+| `tfx-deep-analysis` | Deep | 3-perspective analysis with Tri-Debate consensus |
+| `tfx-plan` | Light | Quick implementation plan |
+| `tfx-deep-plan` | Deep | Planner + Architect + Critic consensus planning |
+| `tfx-interview` | Light | Socratic requirements exploration |
+| `tfx-deep-interview` | Deep | Deep interview with mathematical ambiguity gating |
 ### Execution
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-autopilot` | Light | Simple autonomous task execution (single file, <5min) | ~10K |
-| `tfx-fullcycle` | Deep | Full pipeline: Design → Plan → Execute → QA → Verify | ~80K |
-| `tfx-auto` | — | Unified CLI orchestrator with command shortcuts + auto-triage | varies |
-### QA & Verification
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-qa` | Light | Test → Fix → Retest cycle (max 3 rounds) | ~5K |
-| `tfx-deep-qa` | Deep | 3-CLI independent verification with consensus scoring | ~25K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-auto` | Router | Unified CLI orchestrator — auto-triage + command shortcuts |
+| `tfx-autopilot` | Light | Single-file autonomous execution (<5min tasks) |
+| `tfx-fullcycle` | Deep | Full pipeline: Design → Plan → Execute → QA → Verify |
-### Planning
+### Review & QA
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-plan` | Light | Quick implementation plan via Opus | ~8K |
-| `tfx-deep-plan` | Deep | Planner + Architect + Critic consensus planning | ~20K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-review` | Light | Quick code review |
+| `tfx-deep-review` | Deep | 3-CLI independent review, consensus-only reporting |
+| `tfx-qa` | Light | Test → Fix → Retest cycle (max 3 rounds) |
+| `tfx-deep-qa` | Deep | 3-CLI independent verification with consensus scoring |
-### Review
+### Debate & Decision
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-review` | Light | Quick code review via Codex | ~8K |
-| `tfx-deep-review` | Deep | 3-CLI independent review, consensus-only reporting | ~25K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-debate` | Deep | Structured 3-party debate on any topic |
+| `tfx-panel` | Deep | Virtual expert panel simulation |
-### Debate & Panel
+### Persistence & Routing
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-debate` | Deep | Structured 3-party debate on any topic | ~20K |
-| `tfx-panel` | Deep | Virtual expert panel simulation | ~30K |
+| Skill | Type | Description |
+|-------|------|-------------|
+| `tfx-persist` | Deep | 3-party verified loop until task completion |
+| `tfx-ralph` | — | Alias for `tfx-persist` |
+| `tfx-autoroute` | Light | Auto model escalation on failure |
+| `tfx-auto-codex` | — | Codex-lead orchestrator |
-### Persistence
+### Orchestration & Infrastructure
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-persist` | Deep | 3-party verified persistence loop until done | varies |
-| `tfx-ralph` | — | Alias for `tfx-persist` | varies |
-| `tfx-autoroute` | Light | Auto-routing with model escalation on failure | varies |
+| Skill | Description |
+|-------|-------------|
+| `tfx-consensus` | Core consensus engine (used by all Deep skills) |
+| `tfx-hub` | MCP message bus — Named Pipe & HTTP bridge |
+| `tfx-multi` | Multi-CLI team orchestration (2+ parallel tasks) |
+| `tfx-codex-swarm` | Parallel Codex sessions via worktree + psmux |
+| `tfx-swarm` | Unified swarm orchestration |
+| `tfx-codex` | Codex-only orchestrator |
+| `tfx-gemini` | Gemini-only orchestrator |
-### Meta & Utility
+### Remote
-| Skill | Type | Description | Tokens |
-|-------|------|-------------|--------|
-| `tfx-index` | Light | 94% token reduction via project indexing (58K→3K) | ~2K |
-| `tfx-forge` | Light | Create new skills interactively | ~10K |
-| `tfx-interview` | Light | Socratic requirements exploration | ~15K |
-| `tfx-deep-interview` | Deep | Socratic deep interview with ambiguity gating | ~25K |
-| `tfx-prune` | Light | AI slop removal — dead code, over-abstraction cleanup | ~10K |
+| Skill | Description |
+|-------|-------------|
+| `tfx-remote-spawn` | Spawn Claude sessions on remote machines via SSH |
+| `tfx-remote-setup` | Interactive host wizard (Tailscale + SSH discovery) |
-### Infrastructure
+### Meta & Tooling
 | Skill | Description |
 |-------|-------------|
-| `tfx-consensus` | Core consensus engine (internal, used by all Deep skills) |
-| `tfx-hub` | MCP message bus management |
-| `tfx-multi` | Multi-CLI team orchestration |
-| `tfx-codex-swarm` | Parallel Codex sessions via worktree + psmux |
-| `tfx-swarm` | Unified swarm orchestration |
+| `tfx-index` | Project indexing — 94% token reduction (58K → 3K) |
+| `tfx-forge` | Create new skills interactively |
+| `tfx-prune` | AI slop removal — dead code, over-abstraction cleanup |
 | `tfx-setup` | Initial setup wizard |
 | `tfx-doctor` | Diagnostics and auto-repair |
 | `tfx-hooks` | Claude Code hook priority manager |
 | `tfx-profile` | Codex/Gemini CLI profile management |
-| `tfx-codex` | Codex-only orchestrator |
-| `tfx-gemini` | Gemini-only orchestrator |
-| `tfx-auto-codex` | Codex-lead orchestrator |
-| `tfx-remote-spawn` | Remote session management via psmux + SSH |
-| `tfx-remote-setup` | Remote host setup wizard (Tailscale + SSH) |
+| `tfx-psmux-rules` | psmux command generation rules |
+| `merge-worktree` | Worktree merge helper for swarm results |
+| `star-prompt` | GitHub star prompt for postinstall |
 ---
 ## Deep vs Light
-Every domain offers both modes:
 <p align="center">
   <img src="docs/assets/deep-vs-light.svg" alt="Deep vs Light comparison" width="680">
 </p>
+Every domain offers both modes. Depth modifiers in natural language auto-escalate:
 | Dimension | Light | Deep |
 |-----------|-------|------|
-| **CLIs** | Single (usually Codex) | 3-party (Claude + Codex + Gemini) |
-| **Tokens** | 3K-15K | 20K-80K |
+| **Models** | Single (usually Codex) | 3-party (Claude + Codex + Gemini) |
+| **Tokens** | 3K–15K | 20K–80K |
 | **Speed** | Seconds | Minutes |
 | **Accuracy** | Good (single perspective) | Excellent (consensus-verified) |
 | **Bias** | Possible | Eliminated via anti-herding |
-| **Use when** | Quick tasks, known patterns | Critical decisions, unknown territory |
+| **Trigger** | Default, "quick", "fast" | "thoroughly", "carefully", "제대로" |
 ---
@@ -264,11 +304,11 @@ Every domain offers both modes:
 </p>
 <details>
-<summary>Interactive diagram (GitHub only)</summary>
+<summary>Interactive diagram</summary>
 ```mermaid
 graph TD
-    User([User / Claude Code]) <-->|Skills & Slash Commands| TFX[tfx Skills Layer]
+    User([User / Claude Code]) <-->|"Skills & Natural Language"| TFX[tfx Skills Layer]
     TFX <-->|Consensus Engine| CONSENSUS[tfx-consensus]
     subgraph "Tri-CLI Consensus"
@@ -284,14 +324,16 @@ graph TD
         RESOLVE --> MERGE
     end
-    TFX <-->|Named Pipe / HTTP| HUB[triflux Hub Server]
+    TFX <-->|Named Pipe / HTTP| HUB[triflux Hub]
-    subgraph "Orchestration Hub"
+    subgraph "Hub Services"
         HUB <--> STORE[(SQLite Store)]
-        HUB <--> DASH[QoS Dashboard]
-        HUB <--> DELEGATOR[Delegator Service]
+        HUB <--> REFLEXION[Reflexion Engine]
+        HUB <--> ADAPTIVE[Adaptive Rules]
+        HUB <--> MONITOR[TUI Monitor]
     end
+    REFLEXION -->|"Feedback Loop"| TFX
     HUB -.->|MCP Bridge| External[External MCP Clients]
 ```
@@ -299,95 +341,154 @@ graph TD
 ---
-## Quick Start
+## Under the Hood
-### 1. Install
+### Singleton MCP Hub with Dual-Protocol IPC
+triflux Hub runs as a **singleton daemon** per machine. A filesystem lock prevents duplicate instances.
-```bash
-npm install -g triflux
+```
+Local agents ──→ Named Pipe (NDJSON, sub-ms latency) ──→ Hub
+Remote/Dashboard ──→ HTTP/REST ──────────────────────→ Hub
 ```
-### 2. Setup
+The bridge client tries Named Pipe first and falls back to HTTP automatically. Sessions auto-expire after 30 minutes, and the Hub self-terminates when idle. Run `tfx hub ensure` to guarantee the Hub is alive from any context.
-```bash
-tfx setup
+### Reflexion Adaptive Learning
+Errors become knowledge automatically. The Reflexion Engine runs a closed-loop learning pipeline:
+```
+safety-guard blocks command
+  → error normalized (paths, timestamps, UUIDs stripped)
+  → pattern stored in pending-penalties
+  → promoted to adaptive rule (Bayesian confidence scoring)
+  → injected into CLAUDE.md when confidence > threshold
+Three-tier memory:
+  Tier 1 (Session)   → cleared on session end
+  Tier 2 (Project)   → decays -0.2 confidence per 5 unobserved sessions
+  Tier 3 (Permanent) → auto-injected into CLAUDE.md as machine-readable rules
 ```
-### 3. Usage
+A blocked command in Session 1 becomes a proactive warning in Session 2 and, once its confidence is high enough, a permanent instruction — so your AI agent gets smarter over time.
-```bash
-# Light — Quick single-model execution
-/tfx-research "React 19 Server Actions best practices"
-/tfx-review
-/tfx-plan "add JWT auth middleware"
+### Pipeline Quality Gates
-# Deep — 3-party consensus for critical work
-/tfx-deep-research "microservice architecture comparison 2026"
-/tfx-deep-review
-/tfx-deep-plan "migrate REST to GraphQL"
+Every Deep task runs through a **10-phase state machine** with quality gates:
-# Debate — Get 3 independent opinions
-/tfx-debate "Redis vs PostgreSQL LISTEN/NOTIFY for real-time events"
+```
+plan → PRD → confidence gate → execute → deslop → verify → selfcheck → complete
+                                                              ↓
+                                                          fix (max 3) → retry
+```
-# Persistence — Don't stop until done
-/tfx-persist "implement full auth flow with tests"  # /tfx-ralph also works
+- **Confidence Gate** (pre-execution): 5 weighted criteria must score >= 90% before execution starts
+- **Hallucination Detection** (post-execution): 7 regex patterns catch AI claims without evidence:
+  - "tests pass" without test output
+  - "performance improved" without benchmarks
+  - "backward compatible" without verification
+  - "no changes needed" when diff exists
+- **Bounded loops**: Fix attempts capped at 3, ralph iterations at 10. State persists in SQLite for crash recovery.
-# Team — Multi-CLI parallel orchestration
-/tfx-multi "refactor auth + update UI + add tests"
+### 5-Tier Adaptive HUD
+The Claude Code status bar auto-adapts to any terminal width:
+```
+ full (120+ cols)  ██████░░░░ claude 52%  ██████░░░░ codex 48%  savings: $2.40
+ compact (80 cols) c:52% x:48% g:Free  sv:$2.40  CTX:67%
+ minimal (60 cols) c:52% x:48% sv:$2.40
+ micro (<60 cols)  c52 x48 sv$2
+ nano (<40 cols)   c:52%/x:48%
 ```
-> **Note**: Deep skills (`/tfx-deep-*`, `/tfx-persist`, `/tfx-ralph`) require **psmux** (or tmux), **triflux Hub**, **Codex CLI**, and **Gemini CLI** for full Tri-CLI consensus (Tier 1). Without these prerequisites, skills automatically degrade to Tier 3 (Claude-only, single-model) mode. Run `tfx doctor` to check your environment.
->
-> **Serena note**: Serena MCP is stateful. Share one Serena instance only across agents working on the **same project**. For parallel work across different projects, prefer separate Serena instances. If Serena reports `No active project`, check your Codex Serena config for `--project-from-cwd` (or `--project <path>`) and rerun `tfx doctor`.
+Zero config. Open a vertical split pane and the HUD auto-collapses. Close it and it expands back. When `tfx-multi` is active, a live worker row appears showing per-CLI progress: `x✓ g⋯ c✗` (completed/running/failed).
+Context token attribution tracks usage by skill, file, and tool call, with warnings at 60%/80%/90% context fill.
+### Windows Terminal Orchestration
+triflux doesn't just run in a terminal — it **orchestrates** it. The WT Manager API provides:
+- **Tab creation** with PID-tracked lifecycle (temp file polling for readiness)
+- **Split-pane layouts** via `applySplitLayout()` for multi-agent dashboards
+- **Dead tab pruning** using cross-platform PID liveness detection
+- **Base64 PowerShell encoding** eliminating all quoting/escaping issues
+Every direct `wt.exe` call is blocked by safety-guard. Agents can only use the managed API path, preventing uncontrolled terminal sprawl.
 ---
-## Research Foundation
+## TUI Routing Monitor
-The v8 skill suite was inspired by patterns and ideas from across the Claude Code ecosystem:
+**New in v10.1** — `tfx monitor` launches an interactive terminal dashboard:
-| Project | Stars | Inspiration |
-|---------|-------|-------------------|
-| everything-claude-code | 114K | Instinct-based learning patterns |
-| Superpowers | 93K | TDD enforcement, composable skills |
-| oh-my-openagent | 44K | Category routing, Hashline edits |
-| SuperClaude | 22K | index-repo 94% token reduction, expert panels |
-| oh-my-claudecode | 15K | Ralph persistence, CCG tri-model |
-| ruflo | 28K | 60+ agent orchestration |
-| Exa MCP | 3.7K | Neural search, highlight extraction |
-| Brave Search MCP | — | Independent index, Goggles re-ranking |
-| Tavily MCP | — | Deep research pipeline |
+```
+┌─ Routing Monitor ─────────────────────────────────────────┐
+│                                                           │
+│  Active Skills    Success Rate    Avg Latency    Model    │
+│  ─────────────    ────────────    ───────────    ─────    │
+│  tfx-review       94.2%           3.2s           codex    │
+│  tfx-auto         87.1%           5.8s           mixed    │
+│  tfx-research     91.0%           4.1s           claude   │
+│                                                           │
+│  Reflexion Store: 142 rules  │  Adaptive: 28 promoted     │
+│  Q-Table entries: 89         │  Pending penalties: 3      │
+│                                                           │
+└───────────────────────────────────────────────────────────┘
+```
-5-language research (EN/CN/RU/JP/UA) uncovered unique patterns: WeChat integration (CN), Discord mobile bridges (JP), GigaCode domestic alternatives (RU), and community-driven localization efforts.
+The monitor visualizes:
+- Real-time skill routing decisions and model selection
+- Success/failure rates per skill and per model
+- Reflexion store growth and adaptive rule promotions
+- Q-Learning weight evolution (when `TRIFLUX_DYNAMIC_ROUTING=true`)
 ---
 ## Security
-- **Hub Token Auth** — Secure IPC using `TFX_HUB_TOKEN` (Bearer Auth)
-- **Localhost Only** — Default Hub binding to `127.0.0.1`
-- **CORS Lockdown** — Strict origin checking for QoS Dashboard
-- **Injection Protection** — Sanitized shell execution in `psmux` and `tmux`
-- **Consensus Verification** — Deep skills prevent single-model hallucination via 3-party consensus
+| Layer | Protection |
+|-------|-----------|
+| **Hub Token Auth** | Secure IPC via `TFX_HUB_TOKEN` (Bearer Auth) |
+| **Localhost Binding** | Hub defaults to `127.0.0.1` only |
+| **CORS Lockdown** | Strict origin checking for QoS Dashboard |
+| **headless-guard** | Blocks direct `codex exec` / `gemini -y` calls outside tfx skills; wrapper-bypass, pipe-bypass, and env-escape vectors are all covered |
+| **safety-guard** | SSH bash-syntax forwarding prevention, injection-safe shell execution |
+| **Consensus Verification** | Deep skills prevent single-model hallucination via 3-party consensus |
+| **Reflexion Feedback** | Security events feed adaptive rules for continuous improvement |
 ---
 ## Platform Support
-- **Linux / macOS**: Native `tmux` integration
-- **Windows**: **psmux** (PowerShell Multiplexer) + Windows Terminal native
+| Platform | Multiplexer | Status |
+|----------|-------------|--------|
+| **Windows** | psmux (PowerShell) + Windows Terminal | Full support (CP949 encoding handled) |
+| **Linux** | tmux | Full support |
+| **macOS** | tmux | Full support |
 ---
-## QoS Dashboard
+## Research Foundation
+The triflux skill suite was shaped by patterns from across the Claude Code ecosystem:
-Monitor orchestration health via the built-in QoS Dashboard (run `tfx doctor` for URL).
+| Project | Inspiration |
+|---------|-------------|
+| everything-claude-code | Instinct-based learning patterns |
+| Superpowers | TDD enforcement, composable skills |
+| oh-my-openagent | Category routing, Hashline edits |
+| SuperClaude | index-repo 94% token reduction, expert panels |
+| oh-my-claudecode | Ralph persistence, CCG tri-model |
+| ruflo | 60+ agent orchestration |
+| Exa / Brave / Tavily MCP | Neural search, deep research pipeline |
-- **AIMD Batch Sizing** — Auto-scales parallel tasks based on success rates
-- **Token Savings** — Real-time tracking of Claude tokens saved
-- **Consensus Metrics** — Track agreement rates across CLIs
+5-language research (EN/CN/RU/JP/UA) uncovered unique patterns: WeChat integration (CN), Discord mobile bridges (JP), GigaCode alternatives (RU), and community-driven localization efforts.
 ---
 <p align="center">
-  <sub>MIT License · Made by <a href="https://github.com/tellang">tellang</a></sub>
+  <sub>MIT License &middot; Made by <a href="https://github.com/tellang">tellang</a></sub>
 </p>

package/bin/triflux.mjs CHANGED Viewed

@@ -171,11 +171,12 @@ const CLI_COMMAND_SCHEMAS = Object.freeze({
     },
   },
   hub: {
-    usage: "tfx hub <start|stop|status> [--port N] [--json]",
+    usage: "tfx hub <start|stop|status|ensure> [--port N] [--json]",
     description: "tfx-hub 프로세스 제어",
     subcommands: {
       start: { usage: "tfx hub start [--port N]" },
       stop: { usage: "tfx hub stop" },
+      ensure: { usage: "tfx hub ensure [--port N] [--json]", description: "헬스체크 + 자동 시작 (idempotent)" },
       status: {
         usage: "tfx hub status [--json]",
         options: [{ name: "--json", type: "boolean", description: "허브 상태를 JSON으로 출력" }],
@@ -3840,12 +3841,93 @@ async function cmdHub(args = [], options = {}) {
       break;
     }
+    case "ensure": {
+      // 사일런트 idempotent 보장 — 스킬 환경 프로브용.
+      // Hub 살아있으면 즉시 종료, 죽어있으면 자동 시작 + ready 대기.
+      const portArg = args.indexOf("--port");
+      const ensurePort = portArg !== -1 ? args[portArg + 1] : (process.env.TFX_HUB_PORT || "27888");
+      // 1. 이미 healthy?
+      const ensureProbed = await probeHubStatus("127.0.0.1", Number(ensurePort), 1500);
+      if (ensureProbed?.hub?.state === "healthy") {
+        if (json) printJson({ status: "ok", pid: ensureProbed.pid, port: Number(ensurePort) });
+        else process.stdout.write("hub: ok\n");
+        return;
+      }
+      // 2. PID 파일 있는데 프로세스 죽었으면 정리
+      if (existsSync(HUB_PID_FILE)) {
+        try {
+          const staleInfo = JSON.parse(readFileSync(HUB_PID_FILE, "utf8"));
+          process.kill(staleInfo.pid, 0);
+          // 프로세스 살아있지만 healthy가 아님 — 잠시 더 대기
+          const retryDeadline = Date.now() + 3000;
+          while (Date.now() < retryDeadline) {
+            await new Promise((r) => setTimeout(r, 250));
+            const retry = await probeHubStatus("127.0.0.1", Number(ensurePort), 1000);
+            if (retry?.hub?.state === "healthy") {
+              if (json) printJson({ status: "ok", pid: retry.pid, port: Number(ensurePort) });
+              else process.stdout.write("hub: ok\n");
+              return;
+            }
+          }
+        } catch {
+          try { unlinkSync(HUB_PID_FILE); } catch {}
+        }
+      }
+      // 3. 시작
+      const serverPath = join(PKG_ROOT, "hub", "server.mjs");
+      if (!existsSync(serverPath)) {
+        if (json) printJson({ status: "error", reason: "server_missing" });
+        else process.stderr.write("hub: server.mjs not found\n");
+        process.exitCode = 1;
+        return;
+      }
+      if (process.platform === "win32") {
+        const child = spawn("cmd.exe", ["/c", "start", "/b", "", process.execPath, serverPath], {
+          env: { ...process.env, TFX_HUB_PORT: String(ensurePort) },
+          stdio: "ignore",
+          windowsHide: true,
+        });
+        child.unref();
+      } else {
+        const child = spawn(process.execPath, [serverPath], {
+          env: { ...process.env, TFX_HUB_PORT: String(ensurePort) },
+          detached: true,
+          stdio: "ignore",
+        });
+        child.unref();
+      }
+      // 4. ready 대기 (최대 5초)
+      const readyDeadline = Date.now() + 5000;
+      while (Date.now() < readyDeadline) {
+        await new Promise((r) => setTimeout(r, 250));
+        if (existsSync(HUB_PID_FILE)) {
+          const readyProbe = await probeHubStatus("127.0.0.1", Number(ensurePort), 1000);
+          if (readyProbe?.hub?.state === "healthy") {
+            if (json) printJson({ status: "ok", pid: readyProbe.pid, port: Number(ensurePort), started: true });
+            else process.stdout.write("hub: started\n");
+            return;
+          }
+        }
+      }
+      // 5. 타임아웃이지만 프로세스는 기동 중일 수 있음
+      if (json) printJson({ status: "starting", port: Number(ensurePort) });
+      else process.stdout.write("hub: starting\n");
+      break;
+    }
     default:
       console.log(`\n  ${AMBER}${BOLD}⬡ tfx-hub${RESET}\n`);
-      console.log(`    ${WHITE_BRIGHT}tfx hub start${RESET}   ${GRAY}허브 데몬 시작${RESET}`);
-      console.log(`    ${DIM}  --port N${RESET}      ${GRAY}포트 지정 (기본 27888)${RESET}`);
-      console.log(`    ${WHITE_BRIGHT}tfx hub stop${RESET}    ${GRAY}허브 중지${RESET}`);
-      console.log(`    ${WHITE_BRIGHT}tfx hub status${RESET}  ${GRAY}상태 확인${RESET}\n`);
+      console.log(`    ${WHITE_BRIGHT}tfx hub start${RESET}    ${GRAY}허브 데몬 시작${RESET}`);
+      console.log(`    ${DIM}  --port N${RESET}       ${GRAY}포트 지정 (기본 27888)${RESET}`);
+      console.log(`    ${WHITE_BRIGHT}tfx hub stop${RESET}     ${GRAY}허브 중지${RESET}`);
+      console.log(`    ${WHITE_BRIGHT}tfx hub status${RESET}   ${GRAY}상태 확인${RESET}`);
+      console.log(`    ${WHITE_BRIGHT}tfx hub ensure${RESET}   ${GRAY}헬스체크 + 자동 시작 (스킬 프로브용)${RESET}\n`);
   }
 }
@@ -3886,7 +3968,7 @@ async function main() {
       cmdHandoff(cmdArgs, { json: JSON_OUTPUT });
       return;
     case "hub":
-      await cmdHub(cmdArgs, { json: JSON_OUTPUT && (cmdArgs[0] || "status") === "status" });
+      await cmdHub(cmdArgs, { json: JSON_OUTPUT && ["status", "ensure"].includes(cmdArgs[0] || "status") });
       return;
     case "monitor": {
       const { createMonitor } = await import("../tui/monitor.mjs");

package/hub/team/ansi.mjs CHANGED Viewed

@@ -128,9 +128,28 @@ function renderBorderChar(glyph, row, col, highlightCell, borderSeq, highlightSe
 export function box(lines, width, borderColor = "", options = {}) {
   const isFn = typeof borderColor === "function";
   const totalRows = lines.length + 2;
+  const highlightCell = borderHighlightCell(width, totalRows, options.highlightPos);
+  // Fast path: static border, no highlight — batch border chars (~13x less output)
+  if (!highlightCell && !isFn) {
+    const bc = borderColor || "";
+    const rst = bc ? RESET : "";
+    const hLine = BOX.h.repeat(Math.max(0, width - 2));
+    const top = `${bc}${BOX.tl}${hLine}${BOX.tr}${rst}`;
+    const bot = `${bc}${BOX.bl}${hLine}${BOX.br}${rst}`;
+    const mid = `${bc}${BOX.ml}${hLine}${BOX.mr}${rst}`;
+    const body = lines.map((l, i) => {
+      const content = options.titleFlashBg && i === 0
+        ? reapplyBackground(padRight(l, width - 4), options.titleFlashBg)
+        : padRight(l, width - 4);
+      return `${bc}${BOX.v}${rst} ${content} ${bc}${BOX.v}${rst}`;
+    });
+    return { top, body, bot, mid };
+  }
+  // Slow path: per-character rendering for highlight animation
   const bc = isFn ? (row) => borderColor(row, totalRows) : () => borderColor;
   const rst = (isFn || borderColor) ? RESET : "";
-  const highlightCell = borderHighlightCell(width, totalRows, options.highlightPos);
   const highlightSeq = options.highlightColor
     || (() => {
       const parsed = parseRgbSeq(typeof borderColor === "string" ? borderColor : "");

package/hub/team/tui-lite.mjs CHANGED Viewed

@@ -1,4 +1,4 @@
-import { altScreenOff, altScreenOn, BG, bold, box, clearScreen, clearToEnd, color, cursorHide, cursorHome, cursorShow, dim, eraseBelow, FG, MOCHA, padRight, progressBar, statusBadge, stripAnsi, truncate, wcswidth } from "./ansi.mjs";
+import { altScreenOff, altScreenOn, BG, bold, box, clearScreen, clearToEnd, color, cursorHide, cursorHome, cursorShow, dim, eraseBelow, FG, MOCHA, moveTo, padRight, progressBar, statusBadge, stripAnsi, truncate, wcswidth } from "./ansi.mjs";
 const FALLBACK_COLUMNS = 100, FALLBACK_ROWS = 24;
 const VALID_TABS = new Set(["log", "detail", "files"]);
@@ -209,6 +209,7 @@ export function createLiteDashboard(opts = {}) {
   let detailExpanded = true;
   let focusTab = "log";
   let helpVisible = false;
+  let prevFrame = [];
   let inputAttached = false;
   let rawModeEnabled = false;
@@ -297,7 +298,7 @@ export function createLiteDashboard(opts = {}) {
   function attachInput() {
     if (inputAttached) return;
-    if (!isTTY || !input?.isTTY || typeof input?.on !== "function") return;
+    if (!input?.isTTY || typeof input?.on !== "function") return;
     inputAttached = true;
     if (typeof input.setRawMode === "function") {
       input.setRawMode(true);
@@ -337,8 +338,19 @@ export function createLiteDashboard(opts = {}) {
     const rowsOut = buildRows();
     if (isTTY) {
       const width = viewportColumns();
-      const padded = rowsOut.map((line) => padRight(String(line ?? ""), width) + clearToEnd);
-      write(cursorHome + padded.join("\n") + eraseBelow);
+      const padded = rowsOut.map((line) => padRight(String(line ?? ""), width));
+      // Diff-based rendering: only rewrite lines that actually changed
+      let buf = "";
+      for (let i = 0; i < padded.length; i++) {
+        if (padded[i] !== prevFrame[i]) {
+          buf += moveTo(i + 1, 1) + padded[i] + clearToEnd;
+        }
+      }
+      if (prevFrame.length > padded.length) {
+        buf += moveTo(padded.length + 1, 1) + eraseBelow;
+      }
+      if (buf) write(buf);
+      prevFrame = padded;
     } else write(`${rowsOut.join("\n")}\n`);
   }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "triflux",
-  "version": "10.1.1",
+  "version": "10.2.0",
   "description": "CLI-first multi-model orchestrator for Claude Code — route tasks to Codex, Gemini, and Claude",
   "type": "module",
   "bin": {