npm - claude-flow - Versions diffs - 3.7.0-alpha.3 → 3.7.0-alpha.5 - Mend

claude-flow 3.7.0-alpha.3 → 3.7.0-alpha.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/README.md +9 -7
package/package.json +1 -1
package/v3/@claude-flow/cli/README.md +9 -7
package/v3/@claude-flow/cli/dist/src/mcp-tools/neural-tools.js +13 -1
package/v3/@claude-flow/cli/dist/src/memory/intelligence.js +28 -3
package/v3/@claude-flow/cli/dist/src/ruvector/model-router.d.ts +22 -1
package/v3/@claude-flow/cli/dist/src/ruvector/model-router.js +125 -5
package/v3/@claude-flow/cli/package.json +1 -1

package/README.md CHANGED Viewed

@@ -2,13 +2,15 @@
 [![Ruflo Banner](ruflo/assets/ruflo-small.jpeg)](https://flo.ruv.io/)
-[![✨ Try the UI Beta — flo.ruv.io](https://img.shields.io/badge/✨_Try_the_UI_Beta-flo.ruv.io-6366f1?style=for-the-badge&logoColor=white&logo=svelte)](https://flo.ruv.io/)
-[![🎯 Goal Planner — goal.ruv.io](https://img.shields.io/badge/🎯_Goal_Planner-goal.ruv.io-8b5cf6?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/)
-[![🤖 Live Agents — goal.ruv.io/agents](https://img.shields.io/badge/🤖_Live_Agents-goal.ruv.io%2Fagents-10b981?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/agents)
+[![Try the UI Beta — flo.ruv.io](https://img.shields.io/badge/_Try_the_UI_Beta-flo.ruv.io-6366f1?style=for-the-badge&logoColor=white&logo=svelte)](https://flo.ruv.io/)
+[![Goal Planner — goal.ruv.io](https://img.shields.io/badge/_Goal_Planner-goal.ruv.io-8b5cf6?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/)
+[![Live Agents — goal.ruv.io/agents](https://img.shields.io/badge/_Live_Agents-goal.ruv.io%2Fagents-10b981?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/agents)
 [![Star on GitHub](https://img.shields.io/github/stars/ruvnet/claude-flow?style=for-the-badge&logo=github&color=gold)](https://github.com/ruvnet/claude-flow)
 [![MIT License](https://img.shields.io/badge/License-MIT-yellow?style=for-the-badge)](https://opensource.org/licenses/MIT)
-[![Claude Code](https://img.shields.io/badge/Claude%20Code-Plugin-green?style=for-the-badge&logo=anthropic)](https://github.com/ruvnet/claude-flow)
+[![Claude Code](https://img.shields.io/badge/Claude%20Code-Plugin-D97757?style=for-the-badge&logoColor=white&logo=anthropic)](https://github.com/ruvnet/claude-flow)
+[![Codex Plugin](https://img.shields.io/badge/Codex-Plugin-412991?style=for-the-badge&logoColor=white&logo=data%3Aimage%2Fsvg%2Bxml%3Bbase64%2CPHN2ZyB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHZpZXdCb3g9IjAgMCAyNCAyNCI%2BPHBhdGggZmlsbD0id2hpdGUiIGQ9Ik0yMi4yODIgOS44MjFhNS45ODUgNS45ODUgMCAwIDAtLjUxNi00LjkxIDYuMDQ2IDYuMDQ2IDAgMCAwLTYuNTEtMi45QTYuMDY1IDYuMDY1IDAgMCAwIDQuOTgxIDQuMThhNS45ODUgNS45ODUgMCAwIDAtMy45OTggMi45IDYuMDQ2IDYuMDQ2IDAgMCAwIC43NDMgNy4wOTcgNS45OCA1Ljk4IDAgMCAwIC41MSA0LjkxMSA2LjA1MSA2LjA1MSAwIDAgMCA2LjUxNSAyLjlBNS45ODUgNS45ODUgMCAwIDAgMTMuMjYgMjRhNi4wNTYgNi4wNTYgMCAwIDAgNS43NzItNC4yMDYgNS45OSA1Ljk5IDAgMCAwIDMuOTk4LTIuOSA2LjA1NiA2LjA1NiAwIDAgMC0uNzQ3LTcuMDczek0xMy4yNiAyMi40M2E0LjQ3NiA0LjQ3NiAwIDAgMS0yLjg3Ni0xLjA0bC4xNDItLjA4IDQuNzc4LTIuNzU4YS43OTUuNzk1IDAgMCAwIC4zOTMtLjY4MXYtNi43MzdsMi4wMiAxLjE2OGEuMDcxLjA3MSAwIDAgMSAuMDM4LjA1MnY1LjU4M2E0LjUwNCA0LjUwNCAwIDAgMS00LjQ5NSA0LjQ5NHpNMy42IDE4LjMwNGE0LjQ3IDQuNDcgMCAwIDEtLjUzNS0zLjAxNGwuMTQyLjA4NSA0Ljc4MyAyLjc1OWEuNzcxLjc3MSAwIDAgMCAuNzgxIDBsNS44NDMtMy4zNjl2Mi4zMzJhLjA4LjA4IDAgMCAxLS4wMzMuMDYyTDkuNzQgMTkuOTVhNC41IDQuNSAwIDAgMS02LjE0LTEuNjQ2ek0yLjM0IDcuODk2YTQuNDg1IDQuNDg1IDAgMCAxIDIuMzY2LTEuOTczVjExLjZhLjc2Ni43NjYgMCAwIDAgLjM4OC42NzdsNS44MTUgMy4zNTQtMi4wMiAxLjE2OGEuMDc2LjA3NiAwIDAgMS0uMDcyIDBsLTQuODMtMi43ODZBNC41MDQgNC41MDQgMCAwIDEgMi4zNCA3Ljg3MnptMTYuNTk3IDMuODU1LTUuODMzLTMuMzg3IDIuMDE2LTEuMTY1YS4wNzYuMDc2IDAgMCAxIC4wNzEgMGw0LjgzIDIuNzkxYTQuNDk0IDQuNDk0IDAgMCAxLS42NzYgOC4xMDR2LTUuNjc3YS43OS43OSAwIDAgMC0uNDA3LS42Njd6bTIuMDEtMy4wMjMtLjE0MS0uMDg1LTQuNzc0LTIuNzgyYS43NzYuNzc2IDAgMCAwLS43ODUgMEw5LjQwOSA5LjIzVjYuODk3YS4wNjYuMDY2IDAgMCAxIC4wMjgtLjA2Mmw0LjgzLTIuNzg3YTQuNDk5IDQuNDk5IDAgMCAxIDYuNjggNC42NnpNOC4zMDcgMTIuODYzbC0yLjAyLTEuMTY0YS4wOC4wOCAwIDAgMS0uMDM4LS4wNTdWNi4wNzRhNC40OTkgNC40OTkgMCAwIDEgNy4zNzYtMy40NTRsLS4xNDIuMDgtNC43NzggMi43NThhLjc5NS43OTUgMCAwIDAtLjM5My42ODJ6bTEuMDk3LTIuMzY2IDIuNjAyLTEuNSAyLjYwNyAxLjV2Mi45OTlsLTIuNTk3IDEuNS0yLjYwNy0xLjVaIi8%2BPC9zdmc%2B)](https://www.npmjs.com/package/@claude-flow/code
x)
+[![🕸️ RuVector Graph Ai](https://img.shields.io/badge/RuVector_Agentic-DB-06b6d4?style=for-the-badge&logoColor=white&logo=graphql)](https://github.com/ruvnet/ruvector)
 # Ruflo
@@ -20,12 +22,12 @@ Orchestrate 100+ specialized AI agents across machines, teams, and trust boundar
 ### Why Ruflo?
-> Claude Flow is now Ruflo — named by rUv, who loves Rust, flow states, and building things that feel inevitable. The "Ru" is the Ruv. The "flo" is the flow. Underneath, WASM kernels written in Rust power the policy engine, embeddings, and proof system.
+> Claude Flow is now Ruflo — named by [`rUv`](https://ruv.io), who loves Rust, flow states, and building things that feel inevitable. The "Ru" is the rUv. The "flo" is working until 3am. Underneath, powered by [`Cognitum.One`](https://cognitum.one/?RuFlo) agentic architecture, running a supercharged Rust based AI engine, embeddings, memory, and plugin system.
 ### What Ruflo Does
-One `init` gives Claude Code a nervous system: agents self-organize into swarms, learn from every task, remember across sessions, and — with federation — securely talk to agents on other machines without leaking data. You keep writing code. Ruflo handles the coordination.
+One `npx ruvflo init` gives Claude Code a nervous system: agents self-organize into swarms, learn from every task, remember across sessions, and — with federation — securely talk to agents on other machines without leaking data. You keep writing code. Ruflo handles the coordination.
 ```
 Self-Learning / Self-Optimizing Agent Architecture
@@ -69,7 +71,7 @@ There are **two different install paths** with very different surface areas. Pic
 This adds slash commands and agent definitions only. The Ruflo MCP server is NOT registered, so `memory_store`, `swarm_init`, `agent_spawn`, etc. won't be callable from Claude. For the full loop, use Path B below.
 <details>
-<summary><strong>All 32 plugins</strong></summary>
+<summary><strong>🔌 All 32 plugins</strong></summary>
 #### Core & Orchestration

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "claude-flow",
-  "version": "3.7.0-alpha.3",
+  "version": "3.7.0-alpha.5",
   "description": "Ruflo - Enterprise AI agent orchestration for Claude Code. Deploy 60+ specialized agents in coordinated swarms with self-learning, fault-tolerant consensus, vector memory, and MCP integration",
   "main": "dist/index.js",
   "type": "module",

package/v3/@claude-flow/cli/README.md CHANGED Viewed

@@ -2,13 +2,15 @@
 [![Ruflo Banner](ruflo/assets/ruflo-small.jpeg)](https://flo.ruv.io/)
-[![✨ Try the UI Beta — flo.ruv.io](https://img.shields.io/badge/✨_Try_the_UI_Beta-flo.ruv.io-6366f1?style=for-the-badge&logoColor=white&logo=svelte)](https://flo.ruv.io/)
-[![🎯 Goal Planner — goal.ruv.io](https://img.shields.io/badge/🎯_Goal_Planner-goal.ruv.io-8b5cf6?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/)
-[![🤖 Live Agents — goal.ruv.io/agents](https://img.shields.io/badge/🤖_Live_Agents-goal.ruv.io%2Fagents-10b981?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/agents)
+[![Try the UI Beta — flo.ruv.io](https://img.shields.io/badge/_Try_the_UI_Beta-flo.ruv.io-6366f1?style=for-the-badge&logoColor=white&logo=svelte)](https://flo.ruv.io/)
+[![Goal Planner — goal.ruv.io](https://img.shields.io/badge/_Goal_Planner-goal.ruv.io-8b5cf6?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/)
+[![Live Agents — goal.ruv.io/agents](https://img.shields.io/badge/_Live_Agents-goal.ruv.io%2Fagents-10b981?style=for-the-badge&logoColor=white&logo=react)](https://goal.ruv.io/agents)
 [![Star on GitHub](https://img.shields.io/github/stars/ruvnet/claude-flow?style=for-the-badge&logo=github&color=gold)](https://github.com/ruvnet/claude-flow)
 [![MIT License](https://img.shields.io/badge/License-MIT-yellow?style=for-the-badge)](https://opensource.org/licenses/MIT)
-[![Claude Code](https://img.shields.io/badge/Claude%20Code-Plugin-green?style=for-the-badge&logo=anthropic)](https://github.com/ruvnet/claude-flow)
+[![Claude Code](https://img.shields.io/badge/Claude%20Code-Plugin-D97757?style=for-the-badge&logoColor=white&logo=anthropic)](https://github.com/ruvnet/claude-flow)
+[![Codex Plugin](https://img.shields.io/badge/Codex-Plugin-412991?style=for-the-badge&logoColor=white&logo=data%3Aimage%2Fsvg%2Bxml%3Bbase64%2CPHN2ZyB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHZpZXdCb3g9IjAgMCAyNCAyNCI%2BPHBhdGggZmlsbD0id2hpdGUiIGQ9Ik0yMi4yODIgOS44MjFhNS45ODUgNS45ODUgMCAwIDAtLjUxNi00LjkxIDYuMDQ2IDYuMDQ2IDAgMCAwLTYuNTEtMi45QTYuMDY1IDYuMDY1IDAgMCAwIDQuOTgxIDQuMThhNS45ODUgNS45ODUgMCAwIDAtMy45OTggMi45IDYuMDQ2IDYuMDQ2IDAgMCAwIC43NDMgNy4wOTcgNS45OCA1Ljk4IDAgMCAwIC41MSA0LjkxMSA2LjA1MSA2LjA1MSAwIDAgMCA2LjUxNSAyLjlBNS45ODUgNS45ODUgMCAwIDAgMTMuMjYgMjRhNi4wNTYgNi4wNTYgMCAwIDAgNS43NzItNC4yMDYgNS45OSA1Ljk5IDAgMCAwIDMuOTk4LTIuOSA2LjA1NiA2LjA1NiAwIDAgMC0uNzQ3LTcuMDczek0xMy4yNiAyMi40M2E0LjQ3NiA0LjQ3NiAwIDAgMS0yLjg3Ni0xLjA0bC4xNDItLjA4IDQuNzc4LTIuNzU4YS43OTUuNzk1IDAgMCAwIC4zOTMtLjY4MXYtNi43MzdsMi4wMiAxLjE2OGEuMDcxLjA3MSAwIDAgMSAuMDM4LjA1MnY1LjU4M2E0LjUwNCA0LjUwNCAwIDAgMS00LjQ5NSA0LjQ5NHpNMy42IDE4LjMwNGE0LjQ3IDQuNDcgMCAwIDEtLjUzNS0zLjAxNGwuMTQyLjA4NSA0Ljc4MyAyLjc1OWEuNzcxLjc3MSAwIDAgMCAuNzgxIDBsNS44NDMtMy4zNjl2Mi4zMzJhLjA4LjA4IDAgMCAxLS4wMzMuMDYyTDkuNzQgMTkuOTVhNC41IDQuNSAwIDAgMS02LjE0LTEuNjQ2ek0yLjM0IDcuODk2YTQuNDg1IDQuNDg1IDAgMCAxIDIuMzY2LTEuOTczVjExLjZhLjc2Ni43NjYgMCAwIDAgLjM4OC42NzdsNS44MTUgMy4zNTQtMi4wMiAxLjE2OGEuMDc2LjA3NiAwIDAgMS0uMDcyIDBsLTQuODMtMi43ODZBNC41MDQgNC41MDQgMCAwIDEgMi4zNCA3Ljg3MnptMTYuNTk3IDMuODU1LTUuODMzLTMuMzg3IDIuMDE2LTEuMTY1YS4wNzYuMDc2IDAgMCAxIC4wNzEgMGw0LjgzIDIuNzkxYTQuNDk0IDQuNDk0IDAgMCAxLS42NzYgOC4xMDR2LTUuNjc3YS43OS43OSAwIDAgMC0uNDA3LS42Njd6bTIuMDEtMy4wMjMtLjE0MS0uMDg1LTQuNzc0LTIuNzgyYS43NzYuNzc2IDAgMCAwLS43ODUgMEw5LjQwOSA5LjIzVjYuODk3YS4wNjYuMDY2IDAgMCAxIC4wMjgtLjA2Mmw0LjgzLTIuNzg3YTQuNDk5IDQuNDk5IDAgMCAxIDYuNjggNC42NnpNOC4zMDcgMTIuODYzbC0yLjAyLTEuMTY0YS4wOC4wOCAwIDAgMS0uMDM4LS4wNTdWNi4wNzRhNC40OTkgNC40OTkgMCAwIDEgNy4zNzYtMy40NTRsLS4xNDIuMDgtNC43NzggMi43NThhLjc5NS43OTUgMCAwIDAtLjM5My42ODJ6bTEuMDk3LTIuMzY2IDIuNjAyLTEuNSAyLjYwNyAxLjV2Mi45OTlsLTIuNTk3IDEuNS0yLjYwNy0xLjVaIi8%2BPC9zdmc%2B)](https://www.npmjs.com/package/@claude-flow/code
x)
+[![🕸️ RuVector Graph Ai](https://img.shields.io/badge/RuVector_Agentic-DB-06b6d4?style=for-the-badge&logoColor=white&logo=graphql)](https://github.com/ruvnet/ruvector)
 # Ruflo
@@ -20,12 +22,12 @@ Orchestrate 100+ specialized AI agents across machines, teams, and trust boundar
 ### Why Ruflo?
-> Claude Flow is now Ruflo — named by rUv, who loves Rust, flow states, and building things that feel inevitable. The "Ru" is the Ruv. The "flo" is the flow. Underneath, WASM kernels written in Rust power the policy engine, embeddings, and proof system.
+> Claude Flow is now Ruflo — named by [`rUv`](https://ruv.io), who loves Rust, flow states, and building things that feel inevitable. The "Ru" is the rUv. The "flo" is working until 3am. Underneath, powered by [`Cognitum.One`](https://cognitum.one/?RuFlo) agentic architecture, running a supercharged Rust based AI engine, embeddings, memory, and plugin system.
 ### What Ruflo Does
-One `init` gives Claude Code a nervous system: agents self-organize into swarms, learn from every task, remember across sessions, and — with federation — securely talk to agents on other machines without leaking data. You keep writing code. Ruflo handles the coordination.
+One `npx ruvflo init` gives Claude Code a nervous system: agents self-organize into swarms, learn from every task, remember across sessions, and — with federation — securely talk to agents on other machines without leaking data. You keep writing code. Ruflo handles the coordination.
 ```
 Self-Learning / Self-Optimizing Agent Architecture
@@ -69,7 +71,7 @@ There are **two different install paths** with very different surface areas. Pic
 This adds slash commands and agent definitions only. The Ruflo MCP server is NOT registered, so `memory_store`, `swarm_init`, `agent_spawn`, etc. won't be callable from Claude. For the full loop, use Path B below.
 <details>
-<summary><strong>All 32 plugins</strong></summary>
+<summary><strong>🔌 All 32 plugins</strong></summary>
 #### Core & Orchestration

package/v3/@claude-flow/cli/dist/src/mcp-tools/neural-tools.js CHANGED Viewed

@@ -662,7 +662,19 @@ export const neuralTools = [
                 features: {
                     hnsw: true,
                     quantization: true,
-                    flashAttention: false,
+                    // #1770: probe the real loader instead of returning a literal false.
+                    // Was hardcoded false, which contradicted hooks_intelligence_stats's
+                    // simultaneous claim of `implementation: real-flash-attention`.
+                    // The two surfaces now agree on a single source of truth.
+                    flashAttention: await (async () => {
+                        try {
+                            const { getFlashAttention } = await import('../ruvector/flash-attention.js');
+                            return getFlashAttention() !== null;
+                        }
+                        catch {
+                            return false;
+                        }
+                    })(),
                     reasoningBank: true,
                 },
             };

package/v3/@claude-flow/cli/dist/src/memory/intelligence.js CHANGED Viewed

@@ -12,6 +12,7 @@
  */
 import { existsSync, mkdirSync, readFileSync, writeFileSync } from 'node:fs';
 import { homedir } from 'node:os';
+import { createRequire } from 'node:module';
 import { join } from 'node:path';
 // ============================================================================
 // Persistence Configuration
@@ -563,21 +564,37 @@ class LocalReasoningBank {
 // ============================================================================
 let ruvllmCoordinator = null;
 let ruvllmLoaded = false;
-async function loadRuvllmCoordinator() {
+/**
+ * Synchronously load the @ruvector/ruvllm SonaCoordinator. Used both by the
+ * async init path (initializeIntelligence) and by sync stat readers like
+ * getIntelligenceStats — the dashboard would otherwise report "unavailable"
+ * when stats are queried before any async init has fired (#1770).
+ */
+function loadRuvllmCoordinatorSync() {
     if (ruvllmLoaded)
         return ruvllmCoordinator;
     ruvllmLoaded = true;
     try {
-        const { createRequire } = await import('module');
         const requireCjs = createRequire(import.meta.url);
         const ruvllm = requireCjs('@ruvector/ruvllm');
         ruvllmCoordinator = new ruvllm.SonaCoordinator(ruvllm.DEFAULT_SONA_CONFIG);
         return ruvllmCoordinator;
     }
-    catch {
+    catch (err) {
+        // Surface the reason on debug builds so future regressions of #1770 don't
+        // disappear silently. Stays quiet by default to avoid noise on the cli's
+        // hot path (e.g., npx invocations).
+        if (process.env.CLAUDE_FLOW_DEBUG) {
+            // eslint-disable-next-line no-console
+            console.error('[ruvllm] SonaCoordinator load failed, falling back to JS:', err.message);
+        }
+        ruvllmCoordinator = null;
         return null;
     }
 }
+async function loadRuvllmCoordinator() {
+    return loadRuvllmCoordinatorSync();
+}
 // ============================================================================
 // Module State
 // ============================================================================
@@ -879,6 +896,14 @@ export async function findSimilarPatterns(query, options) {
 export function getIntelligenceStats() {
     const sonaStats = sonaCoordinator?.stats();
     const bankStats = reasoningBank?.stats();
+    // Lazy-init the ruvllm coordinator if it hasn't been loaded yet. The MCP
+    // dashboard (`hooks_intelligence_stats`) hits this path before any
+    // initializeIntelligence() call has fired, so the coordinator field would
+    // otherwise stay null and the dashboard would report "unavailable" even
+    // when @ruvector/ruvllm is fully resolvable. Sync require — cheap, idempotent.
+    if (!ruvllmLoaded) {
+        loadRuvllmCoordinatorSync();
+    }
     const ruvllmStats = ruvllmCoordinator?.stats?.() || null;
     // Fetch cross-module stats for unified reporting
     let contrastiveTrainer = 'unavailable';

package/v3/@claude-flow/cli/dist/src/ruvector/model-router.d.ts CHANGED Viewed

@@ -104,6 +104,15 @@ export interface ComplexityAnalysis {
         uncertaintyLevel: number;
     };
 }
+/**
+ * Beta(α, β) prior for Thompson sampling. Each model carries one of these so the
+ * router can auto-balance cost/quality without manual threshold tuning. Outcomes add
+ * a reward r to α and 1 − r to β, so both are fractional pseudo-counts. See ADR-101.
+ */
+export interface BetaPrior {
+    alpha: number; // accumulated reward mass (success-weighted)
+    beta: number; // accumulated 1 − reward mass (failure-weighted)
+}
 /**
  * Intelligent Model Router using complexity-based routing
  */
@@ -146,7 +155,13 @@ export declare class ModelRouter {
      */
     private applyCircuitBreaker;
     /**
-     * Select the best model from scores
+     * Select the best model from scores. Uses Thompson sampling (#1772):
+     * each model's deterministic complexity score is multiplied by a draw
+     * θ_m ~ Beta(α_m, β_m) from its bandit prior. Models with strong empirical
+     * track records get sampled higher; models with poor outcomes get sampled
+     * lower; the system auto-corrects against tier overuse without manual
+     * threshold tuning. Beta(1,1) = uniform on cold start, so each score is scaled
+     * by an independent Uniform(0,1) draw and early selections are randomized.
      */
     private selectModel;
     /**
@@ -184,6 +199,12 @@ export declare class ModelRouter {
      * Reset router state
      */
     reset(): void;
+    /**
+     * Public read-only accessor for the bandit priors. Useful for tests,
+     * dashboards, and the pending hooks_intelligence_stats integration that
+     * surfaces convergence in the dashboard. Returns a copy.
+     */
+    getBanditPriors(): Record<ClaudeModel, BetaPrior>;
 }
 /**
  * Get or create the singleton ModelRouter instance

package/v3/@claude-flow/cli/dist/src/ruvector/model-router.js CHANGED Viewed

@@ -67,6 +67,84 @@ export const COMPLEXITY_INDICATORS = {
         'delete', 'documentation', 'readme', 'config', 'version', 'bump',
     ],
 };
+/**
+ * Cost-adjusted rewards in [0, 1] for Thompson sampling updates, keyed by
+ * model and then by outcome. Cheaper tiers earn more for a success — Haiku >
+ * Sonnet > Opus — because an Opus success on a simple task is wasteful even when
+ * the answer is correct. Escalations get partial credit at best (Sonnet: 0.1) or
+ * zero (Haiku/Opus/inherit) since they signal the initial choice was wrong.
+ */
+const BANDIT_REWARDS = {
+    haiku: { success: 1.0, failure: 0.0, escalated: 0.0 },
+    sonnet: { success: 0.7, failure: 0.0, escalated: 0.1 },
+    opus: { success: 0.4, failure: 0.0, escalated: 0.0 }, // NOTE(review): bounds Opus's long-run posterior mean at ~0.4 even if every call succeeds — confirm intended
+    inherit: { success: 0.5, failure: 0.0, escalated: 0.0 },
+};
+// ============================================================================
+// Beta Sampling for Thompson Sampling Bandit
+// ============================================================================
+/**
+ * One N(0, 1) draw via Box-Muller (cosine branch; the paired sine value is not
+ * computed). Kept module-local to avoid a heavy stats dep; used by sampleGamma.
+ */
+function sampleStandardNormal() {
+    const u1 = Math.random() || 1e-12; // Math.random() may return 0; substitute 1e-12 to avoid log(0)
+    const u2 = Math.random();
+    return Math.sqrt(-2 * Math.log(u1)) * Math.cos(2 * Math.PI * u2);
+}
+/**
+ * Sample from Gamma(shape α, scale=1) using Marsaglia & Tsang (2000). Shapes
+ * below 1 are drawn as Gamma(α+1) · U^(1/α). Expected O(1) for finite α > 0.
+ * α is not validated here; sampleBeta rejects α ≤ 0 before calling.
+ */
+function sampleGamma(alpha) {
+    if (alpha < 1) {
+        const u = Math.random() || 1e-12; // keep U strictly positive
+        return sampleGamma(alpha + 1) * Math.pow(u, 1 / alpha);
+    }
+    const d = alpha - 1 / 3;
+    const c = 1 / Math.sqrt(9 * d);
+    while (true) {
+        let x;
+        let v;
+        do {
+            x = sampleStandardNormal();
+            v = 1 + c * x;
+        } while (v <= 0); // redraw until 1 + c·x is positive
+        v = v * v * v;
+        const u = Math.random();
+        const xx = x * x;
+        if (u < 1 - 0.0331 * xx * xx) // cheap squeeze test: accept without evaluating logs
+            return d * v;
+        if (Math.log(u) < 0.5 * xx + d * (1 - v + Math.log(v))) // exact acceptance test
+            return d * v;
+    }
+}
+/**
+ * Sample θ ~ Beta(α, β) via the identity Beta(α,β) = X / (X+Y) where
+ * X ~ Gamma(α), Y ~ Gamma(β). Returns the neutral value 0.5 when α ≤ 0 or
+ * β ≤ 0, and also when X+Y is not a positive number (defensive fallbacks).
+ */
+function sampleBeta(alpha, beta) {
+    if (alpha <= 0 || beta <= 0)
+        return 0.5;
+    const x = sampleGamma(alpha);
+    const y = sampleGamma(beta);
+    const denom = x + y;
+    return denom > 0 ? x / denom : 0.5; // also catches a NaN denominator, since NaN > 0 is false
+}
+/**
+ * Build default Beta(1,1) priors — uniform over [0,1], i.e. no prior knowledge —
+ * for every model key. Returns a new object on each call, so callers may mutate it.
+ */
+function defaultBanditPriors() {
+    return {
+        haiku: { alpha: 1, beta: 1 },
+        sonnet: { alpha: 1, beta: 1 },
+        opus: { alpha: 1, beta: 1 },
+        inherit: { alpha: 1, beta: 1 },
+    };
+}
 // ============================================================================
 // Default Configuration
 // ============================================================================
@@ -263,15 +341,29 @@ export class ModelRouter {
         return adjusted;
     }
     /**
-     * Select the best model from scores
+     * Select the best model from scores. Uses Thompson sampling (#1772):
+     * each model's deterministic complexity score is multiplied by a draw
+     * θ_m ~ Beta(α_m, β_m) from its bandit prior. Models with strong empirical
+     * track records get sampled higher; models with poor outcomes get sampled
+     * lower; the system auto-corrects against tier overuse without manual
+     * threshold tuning. Beta(1,1) = uniform on cold start, so each score is scaled
+     * by an independent Uniform(0,1) draw and early selections are randomized.
      */
     selectModel(scores, complexityScore) {
-        // Get sorted models by score
-        const sorted = Object.entries(scores)
+        // Thompson sampling: combine deterministic score with bandit posterior
+        const priors = this.state.priors ?? defaultBanditPriors();
+        const sampledScores = {
+            haiku: scores.haiku * sampleBeta(priors.haiku.alpha, priors.haiku.beta),
+            sonnet: scores.sonnet * sampleBeta(priors.sonnet.alpha, priors.sonnet.beta),
+            opus: scores.opus * sampleBeta(priors.opus.alpha, priors.opus.beta),
+            inherit: scores.inherit, // not bandit-controlled
+        };
+        // Get sorted models by sampled score (drops 'inherit' from selection)
+        const sorted = Object.entries(sampledScores)
             .filter(([m]) => m !== 'inherit')
             .sort((a, b) => b[1] - a[1]);
         const [bestModel, bestScore] = sorted[0];
-        const [secondModel, secondScore] = sorted[1] || ['sonnet', 0];
+        const [, secondScore] = sorted[1] || ['sonnet', 0];
         // Confidence is how much better the best is vs second
         const confidence = bestScore > 0 ? Math.min(1, bestScore / (bestScore + secondScore + 0.01)) : 0.5;
         // Uncertainty based on score spread and complexity
@@ -346,6 +438,14 @@ export class ModelRouter {
         if (outcome === 'failure') {
             this.state.circuitBreakerTrips++;
         }
+        // Thompson sampling update (#1772): cost-adjusted reward r in [0, 1],
+        // applied as α += r, β += 1 − r. Haiku-success > Sonnet-success > Opus-success
+        // (Opus on simple tasks is wasteful even when correct). Failure/escalation add ≥ 0.9 to β.
+        if (!this.state.priors)
+            this.state.priors = defaultBanditPriors();
+        const reward = BANDIT_REWARDS[model]?.[outcome] ?? 0.5;
+        this.state.priors[model].alpha += reward;
+        this.state.priors[model].beta += 1 - reward;
         this.saveState();
     }
     /**
@@ -373,12 +473,17 @@ export class ModelRouter {
             circuitBreakerTrips: 0,
             lastUpdated: new Date().toISOString(),
             learningHistory: [],
+            priors: defaultBanditPriors(),
         };
         try {
             const fullPath = join(process.cwd(), this.config.statePath);
             if (existsSync(fullPath)) {
                 const data = readFileSync(fullPath, 'utf-8');
-                return { ...defaultState, ...JSON.parse(data) };
+                const loaded = JSON.parse(data);
+                // Backfill priors for state files written by pre-bandit cli versions.
+                if (!loaded.priors)
+                    loaded.priors = defaultBanditPriors();
+                return { ...defaultState, ...loaded };
             }
         }
         catch {
@@ -415,11 +520,26 @@ export class ModelRouter {
             circuitBreakerTrips: 0,
             lastUpdated: new Date().toISOString(),
             learningHistory: [],
+            priors: defaultBanditPriors(),
         };
         this.consecutiveFailures = { haiku: 0, sonnet: 0, opus: 0, inherit: 0 };
         this.decisionCount = 0;
         this.saveState();
     }
+    /**
+     * Public read-only accessor for the bandit priors, for tests, dashboards, and the
+     * pending hooks_intelligence_stats integration. Returns per-model copies, so mutating
+     * the result does not touch router state; uses Beta(1,1) defaults if none are stored.
+     */
+    getBanditPriors() {
+        const p = this.state.priors ?? defaultBanditPriors();
+        return {
+            haiku: { ...p.haiku },
+            sonnet: { ...p.sonnet },
+            opus: { ...p.opus },
+            inherit: { ...p.inherit },
+        };
+    }
 }
 // ============================================================================
 // Singleton & Factory Functions

package/v3/@claude-flow/cli/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@claude-flow/cli",
-  "version": "3.7.0-alpha.3",
+  "version": "3.7.0-alpha.5",
   "type": "module",
   "description": "Ruflo CLI - Enterprise AI agent orchestration with 60+ specialized agents, swarm coordination, MCP server, self-learning hooks, and vector memory for Claude Code",
   "main": "dist/src/index.js",