agentic-flow 1.1.14 → 1.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32) hide show
  1. package/.claude/agents/custom/test-long-runner.md +44 -0
  2. package/README.md +50 -1
  3. package/dist/agents/claudeAgent.js +31 -0
  4. package/dist/cli/mcp-manager.js +474 -0
  5. package/dist/cli-proxy.js +22 -1
  6. package/dist/utils/.claude-flow/metrics/agent-metrics.json +1 -0
  7. package/dist/utils/.claude-flow/metrics/performance.json +9 -0
  8. package/dist/utils/.claude-flow/metrics/task-metrics.json +10 -0
  9. package/dist/utils/cli.js +9 -1
  10. package/dist/utils/modelOptimizer.js +18 -2
  11. package/docs/.claude-flow/metrics/performance.json +1 -1
  12. package/docs/.claude-flow/metrics/task-metrics.json +3 -3
  13. package/docs/INDEX.md +44 -7
  14. package/docs/archived/RELEASE-SUMMARY-v1.1.14-beta.1.md +336 -0
  15. package/docs/archived/V1.1.14-BETA-READY.md +418 -0
  16. package/docs/guides/ADDING-MCP-SERVERS-CLI.md +515 -0
  17. package/docs/guides/ADDING-MCP-SERVERS.md +642 -0
  18. package/docs/mcp-validation/IMPLEMENTATION-SUMMARY.md +493 -0
  19. package/docs/mcp-validation/MCP-CLI-VALIDATION-REPORT.md +322 -0
  20. package/docs/mcp-validation/README.md +43 -0
  21. package/docs/mcp-validation/strange-loops-test.md +63 -0
  22. package/docs/releases/HOTFIX-v1.2.1.md +315 -0
  23. package/docs/releases/NPM-PUBLISH-GUIDE-v1.2.0.md +440 -0
  24. package/docs/releases/PUBLISH-COMPLETE-v1.2.0.md +308 -0
  25. package/docs/releases/README.md +18 -0
  26. package/docs/releases/RELEASE-v1.2.0.md +339 -0
  27. package/docs/testing/AGENT-SYSTEM-VALIDATION.md +517 -0
  28. package/docs/testing/FINAL-TESTING-SUMMARY.md +362 -0
  29. package/docs/testing/README.md +46 -0
  30. package/docs/testing/REGRESSION-TEST-RESULTS.md +269 -0
  31. package/docs/testing/STREAMING-AND-MCP-VALIDATION.md +517 -0
  32. package/package.json +2 -2
package/dist/utils/cli.js CHANGED
@@ -16,8 +16,16 @@ export function parseArgs() {
16
16
  }
17
17
  // Check for MCP command
18
18
  if (args[0] === 'mcp') {
19
+ const mcpSubcommand = args[1];
20
+ // MCP Manager commands (CLI configuration)
21
+ const managerCommands = ['add', 'list', 'remove', 'enable', 'disable', 'update', 'test', 'info', 'export', 'import'];
22
+ if (managerCommands.includes(mcpSubcommand)) {
23
+ options.mode = 'mcp-manager';
24
+ return options;
25
+ }
26
+ // MCP Server commands (start/stop server)
19
27
  options.mode = 'mcp';
20
- options.mcpCommand = args[1] || 'start'; // default to start
28
+ options.mcpCommand = mcpSubcommand || 'start'; // default to start
21
29
  options.mcpServer = args[2] || 'all'; // default to all servers
22
30
  return options;
23
31
  }
@@ -16,6 +16,7 @@ const MODEL_DATABASE = {
16
16
  speed_score: 85,
17
17
  cost_score: 20,
18
18
  tier: 'flagship',
19
+ supports_tools: true,
19
20
  strengths: ['reasoning', 'coding', 'analysis', 'production'],
20
21
  weaknesses: ['cost'],
21
22
  bestFor: ['coder', 'reviewer', 'architecture', 'planner', 'production-validator']
@@ -30,6 +31,7 @@ const MODEL_DATABASE = {
30
31
  speed_score: 90,
31
32
  cost_score: 30,
32
33
  tier: 'flagship',
34
+ supports_tools: true,
33
35
  strengths: ['multimodal', 'speed', 'general-purpose', 'vision'],
34
36
  weaknesses: ['cost'],
35
37
  bestFor: ['researcher', 'analyst', 'multimodal-tasks']
@@ -44,6 +46,7 @@ const MODEL_DATABASE = {
44
46
  speed_score: 75,
45
47
  cost_score: 50,
46
48
  tier: 'flagship',
49
+ supports_tools: true,
47
50
  strengths: ['reasoning', 'large-context', 'math', 'analysis'],
48
51
  weaknesses: ['speed'],
49
52
  bestFor: ['planner', 'architecture', 'researcher', 'code-analyzer']
@@ -59,8 +62,9 @@ const MODEL_DATABASE = {
59
62
  speed_score: 80,
60
63
  cost_score: 100,
61
64
  tier: 'cost-effective',
65
+ supports_tools: false, // DeepSeek R1 does NOT support tool/function calling
62
66
  strengths: ['reasoning', 'coding', 'math', 'value', 'free'],
63
- weaknesses: ['newer-model'],
67
+ weaknesses: ['newer-model', 'no-tool-use'],
64
68
  bestFor: ['coder', 'pseudocode', 'specification', 'refinement', 'tester']
65
69
  },
66
70
  'deepseek-chat-v3': {
@@ -73,6 +77,7 @@ const MODEL_DATABASE = {
73
77
  speed_score: 90,
74
78
  cost_score: 100,
75
79
  tier: 'cost-effective',
80
+ supports_tools: true,
76
81
  strengths: ['cost', 'speed', 'coding', 'development', 'free'],
77
82
  weaknesses: ['complex-reasoning'],
78
83
  bestFor: ['coder', 'reviewer', 'tester', 'backend-dev', 'cicd-engineer']
@@ -88,6 +93,7 @@ const MODEL_DATABASE = {
88
93
  speed_score: 98,
89
94
  cost_score: 98,
90
95
  tier: 'balanced',
96
+ supports_tools: true,
91
97
  strengths: ['speed', 'cost', 'interactive'],
92
98
  weaknesses: ['quality'],
93
99
  bestFor: ['researcher', 'planner', 'smart-agent']
@@ -102,6 +108,7 @@ const MODEL_DATABASE = {
102
108
  speed_score: 95,
103
109
  cost_score: 100,
104
110
  tier: 'balanced',
111
+ supports_tools: true,
105
112
  strengths: ['open-source', 'versatile', 'coding', 'free', 'fast'],
106
113
  weaknesses: ['smaller-model'],
107
114
  bestFor: ['coder', 'reviewer', 'base-template-generator', 'tester']
@@ -116,6 +123,7 @@ const MODEL_DATABASE = {
116
123
  speed_score: 85,
117
124
  cost_score: 90,
118
125
  tier: 'balanced',
126
+ supports_tools: true,
119
127
  strengths: ['multilingual', 'coding', 'reasoning'],
120
128
  weaknesses: ['english-optimized'],
121
129
  bestFor: ['researcher', 'coder', 'multilingual-tasks']
@@ -131,6 +139,7 @@ const MODEL_DATABASE = {
131
139
  speed_score: 95,
132
140
  cost_score: 99,
133
141
  tier: 'budget',
142
+ supports_tools: true,
134
143
  strengths: ['ultra-low-cost', 'speed'],
135
144
  weaknesses: ['quality', 'complex-tasks'],
136
145
  bestFor: ['simple-tasks', 'testing']
@@ -146,6 +155,7 @@ const MODEL_DATABASE = {
146
155
  speed_score: 30,
147
156
  cost_score: 100,
148
157
  tier: 'local',
158
+ supports_tools: false,
149
159
  strengths: ['privacy', 'offline', 'zero-cost'],
150
160
  weaknesses: ['quality', 'speed'],
151
161
  bestFor: ['privacy-tasks', 'offline-tasks']
@@ -197,8 +207,14 @@ export class ModelOptimizer {
197
207
  const taskComplexity = criteria.taskComplexity || this.inferComplexity(criteria.task);
198
208
  // Set default priority to balanced if not specified
199
209
  const priority = criteria.priority || 'balanced';
210
+ // Filter models that support tools if required
211
+ let availableModels = Object.entries(MODEL_DATABASE);
212
+ if (criteria.requiresTools) {
213
+ availableModels = availableModels.filter(([key, model]) => model.supports_tools !== false);
214
+ logger.info(`Filtered to ${availableModels.length} models with tool support`);
215
+ }
200
216
  // Score all models
201
- const scoredModels = Object.entries(MODEL_DATABASE).map(([key, model]) => {
217
+ const scoredModels = availableModels.map(([key, model]) => {
202
218
  // Calculate overall score based on priority
203
219
  let overall_score;
204
220
  switch (priority) {
@@ -1,5 +1,5 @@
1
1
  {
2
- "startTime": 1759680310468,
2
+ "startTime": 1759762593440,
3
3
  "totalTasks": 1,
4
4
  "successfulTasks": 1,
5
5
  "failedTasks": 0,
@@ -1,10 +1,10 @@
1
1
  [
2
2
  {
3
- "id": "cmd-hooks-1759680310618",
3
+ "id": "cmd-hooks-1759762593563",
4
4
  "type": "hooks",
5
5
  "success": true,
6
- "duration": 8.211029999999994,
7
- "timestamp": 1759680310627,
6
+ "duration": 24.05694200000005,
7
+ "timestamp": 1759762593587,
8
8
  "metadata": {}
9
9
  }
10
10
  ]
package/docs/INDEX.md CHANGED
@@ -54,10 +54,35 @@ Multi-model router configuration and usage.
54
54
  - [Router Config Reference](router/ROUTER_CONFIG_REFERENCE.md) - Configuration options
55
55
  - [Top 20 Models Matrix](router/TOP20_MODELS_MATRIX.md) - Model comparison guide
56
56
 
57
- ### ✅ [Validation & Testing](validation/)
58
- Test results and quality assurance reports.
57
+ ### ✅ [Testing & Validation](testing/)
58
+ Current test results, validation reports, and quality assurance.
59
59
 
60
- - [Validation README](validation/README.md) - Overview and archived reports
60
+ - [Testing Overview](testing/README.md) - Current testing documentation
61
+ - [Agent System Validation](testing/AGENT-SYSTEM-VALIDATION.md) - Multi-agent testing
62
+ - [Final Testing Summary](testing/FINAL-TESTING-SUMMARY.md) - Comprehensive coverage
63
+ - [Regression Test Results](testing/REGRESSION-TEST-RESULTS.md) - Regression testing
64
+ - [Streaming & MCP Validation](testing/STREAMING-AND-MCP-VALIDATION.md) - Integration tests
65
+
66
+ ### 🔍 [MCP Validation](mcp-validation/)
67
+ Model Context Protocol implementation and validation.
68
+
69
+ - [MCP Validation Overview](mcp-validation/README.md) - MCP testing documentation
70
+ - [Implementation Summary](mcp-validation/IMPLEMENTATION-SUMMARY.md) - MCP implementation
71
+ - [CLI Validation Report](mcp-validation/MCP-CLI-VALIDATION-REPORT.md) - CLI tool testing
72
+ - [Strange Loops Test](mcp-validation/strange-loops-test.md) - Advanced patterns
73
+
74
+ ### 📦 [Releases](releases/)
75
+ Version-specific release notes and publishing documentation.
76
+
77
+ - [Release Overview](releases/README.md) - Release documentation index
78
+ - [v1.2.0 Release](releases/RELEASE-v1.2.0.md) - Latest stable release
79
+ - [v1.2.0 Publishing Guide](releases/NPM-PUBLISH-GUIDE-v1.2.0.md) - Publishing process
80
+ - [v1.2.1 Hotfix](releases/HOTFIX-v1.2.1.md) - Critical fixes
81
+
82
+ ### 🗄️ [Validation Archive](validation/)
83
+ Historical validation reports and test archives.
84
+
85
+ - [Validation Archive](validation/README.md) - Archived test reports
61
86
 
62
87
  ### 📦 [Archived](archived/)
63
88
  Historical documentation, completed implementations, and validation reports.
@@ -103,13 +128,15 @@ Historical documentation, completed implementations, and validation reports.
103
128
  ### Path 2: Developers (1.5 hours)
104
129
  1. [Architecture Overview](architecture/EXECUTIVE_SUMMARY.md) - System design (20 min)
105
130
  2. [Implementation Examples](guides/IMPLEMENTATION_EXAMPLES.md) - Code patterns (40 min)
106
- 3. [Integration Guides](integrations/) - External services (30 min)
131
+ 3. [Integration Guides](integrations/) - External services (20 min)
132
+ 4. [Testing Documentation](testing/) - Quality assurance (10 min)
107
133
 
108
134
  ### Path 3: System Architects (2 hours)
109
135
  1. [Research Summary](architecture/RESEARCH_SUMMARY.md) - Technical findings (30 min)
110
136
  2. [Multi-Model Router Plan](architecture/MULTI_MODEL_ROUTER_PLAN.md) - Router architecture (45 min)
111
- 3. [Integration Status](architecture/INTEGRATION-STATUS.md) - Current state (30 min)
137
+ 3. [Integration Status](architecture/INTEGRATION-STATUS.md) - Current state (20 min)
112
138
  4. [Router Documentation](router/) - Configuration and usage (15 min)
139
+ 5. [MCP Validation](mcp-validation/) - Protocol implementation (10 min)
113
140
 
114
141
  ---
115
142
 
@@ -192,5 +219,15 @@ Historical reports, completed implementations, and superseded guides are in the
192
219
 
193
220
  ---
194
221
 
195
- **Documentation Status**: ✅ Organized and up-to-date
196
- **Last Updated**: October 5, 2025
222
+ **Documentation Status**: ✅ Reorganized and up-to-date
223
+ **Last Updated**: October 6, 2025
224
+
225
+ ## 📋 Recent Documentation Updates
226
+
227
+ **Documentation Structure v2.0 Reorganization (Oct 6, 2025)**:
228
+ - Created dedicated `releases/` directory for version-specific documentation
229
+ - Consolidated testing reports into `testing/` directory
230
+ - Separated MCP validation into dedicated `mcp-validation/` section
231
+ - Added comprehensive READMEs to all major sections
232
+ - Archived historical v1.1.x releases for cleaner navigation
233
+ - Improved documentation index with better categorization
@@ -0,0 +1,336 @@
1
+ # v1.1.14-beta.1 Release Summary
2
+
3
+ **Date:** 2025-10-05
4
+ **Status:** ✅ **PUBLISHED & LIVE**
5
+ **NPM:** https://www.npmjs.com/package/agentic-flow/v/1.1.14-beta.1
6
+ **GitHub:** https://github.com/ruvnet/agentic-flow/releases/tag/v1.1.14-beta.1
7
+
8
+ ---
9
+
10
+ ## 🎉 Major Achievement
11
+
12
+ **Fixed critical OpenRouter proxy bug that was causing 100% failure rate!**
13
+
14
+ From **0% success** → **80% success** (8 out of 10 models working)
15
+
16
+ ---
17
+
18
+ ## Installation & Usage
19
+
20
+ ### Install Beta Version
21
+ ```bash
22
+ # Install globally
23
+ npm install -g agentic-flow@beta
24
+
25
+ # Or use with npx (no installation needed)
26
+ npx agentic-flow@beta --help
27
+ ```
28
+
29
+ ### Quick Start
30
+ ```bash
31
+ # List available agents
32
+ npx agentic-flow@beta --list
33
+
34
+ # Run with Anthropic (default)
35
+ npx agentic-flow@beta --agent coder --task "Write Python hello world"
36
+
37
+ # Run with OpenRouter (up to 99% cost savings!)
38
+ npx agentic-flow@beta --agent coder --task "Write Python hello world" \
39
+ --provider openrouter --model "openai/gpt-4o-mini"
40
+
41
+ # Run with Grok 4 Fast (FREE!)
42
+ npx agentic-flow@beta --agent coder --task "Write Python hello world" \
43
+ --provider openrouter --model "x-ai/grok-4-fast"
44
+ ```
45
+
46
+ ---
47
+
48
+ ## ✅ Verified Working
49
+
50
+ ### NPX Command
51
+ ```bash
52
+ $ npx agentic-flow@beta --version
53
+ agentic-flow v1.1.14-beta.1
54
+
55
+ $ npx agentic-flow@beta --help
56
+ 🤖 Agentic Flow v1.1.14-beta.1 - AI Agent Orchestration with OpenRouter Support
57
+ [Full help output shown]
58
+
59
+ $ npx agentic-flow@beta --agent coder --task "hello world" --provider anthropic
60
+ ✅ Completed! [Working perfectly]
61
+ ```
62
+
63
+ ### OpenRouter Models (8/10 = 80%)
64
+
65
+ | Model | Status | Time | Cost/M Tokens | Use Case |
66
+ |-------|--------|------|---------------|----------|
67
+ | **openai/gpt-4o-mini** | ✅ | 7s | $0.15 | Best value |
68
+ | **openai/gpt-3.5-turbo** | ✅ | 5s | $0.50 | Fastest |
69
+ | **meta-llama/llama-3.1-8b-instruct** | ✅ | 14s | $0.06 | Open source |
70
+ | **anthropic/claude-3.5-sonnet** | ✅ | 11s | $3.00 | Highest quality |
71
+ | **mistralai/mistral-7b-instruct** | ✅ | 6s | $0.25 | Fast & efficient |
72
+ | **google/gemini-2.0-flash-exp** | ✅ | 6s | Free | Free tier |
73
+ | **x-ai/grok-4-fast** | ✅ | 8s | Free | #1 most popular! |
74
+ | **z-ai/glm-4.6** | ✅ | 5s | Varies | Fixed in this release |
75
+
76
+ ### Known Issues (2/10)
77
+ | Model | Issue | Workaround |
78
+ |-------|-------|------------|
79
+ | **meta-llama/llama-3.3-70b-instruct** | Intermittent timeout | Use llama-3.1-8b instead |
80
+ | **x-ai/grok-4** | Too slow (60s+) | Use grok-4-fast instead |
81
+
82
+ ---
83
+
84
+ ## 💰 Cost Savings
85
+
86
+ ### Comparison vs Claude Direct API
87
+
88
+ | Model | Cost | vs Claude ($3/M) | Savings |
89
+ |-------|------|------------------|---------|
90
+ | GPT-4o-mini | $0.15/M | $2.85 | **95%** |
91
+ | Llama 3.1 8B | $0.06/M | $2.94 | **98%** |
92
+ | Mistral 7B | $0.25/M | $2.75 | **92%** |
93
+ | GPT-3.5-turbo | $0.50/M | $2.50 | **83%** |
94
+ | Grok 4 Fast | Free | $3.00 | **100%** |
95
+ | Gemini 2.0 Flash | Free | $3.00 | **100%** |
96
+
97
+ **Average savings: ~94% across all working models**
98
+
99
+ ---
100
+
101
+ ## 🔧 What Was Fixed
102
+
103
+ ### Critical Bug
104
+ **TypeError: anthropicReq.system?.substring is not a function**
105
+
106
+ **Root Cause:**
107
+ - Anthropic API allows `system` field to be string OR array of content blocks
108
+ - Claude Agent SDK sends it as array (for prompt caching)
109
+ - Proxy assumed string only → called `.substring()` on array → crash
110
+ - Result: 100% failure rate
111
+
112
+ **Solution:**
113
+ ```typescript
114
+ // Before (BROKEN)
115
+ interface AnthropicRequest {
116
+ system?: string;
117
+ }
118
+
119
+ // After (FIXED)
120
+ interface AnthropicRequest {
121
+ system?: string | Array<{ type: string; text?: string; [key: string]: any }>;
122
+ }
123
+
124
+ // Safe extraction logic
125
+ if (typeof anthropicReq.system === 'string') {
126
+ originalSystem = anthropicReq.system;
127
+ } else if (Array.isArray(anthropicReq.system)) {
128
+ originalSystem = anthropicReq.system
129
+ .filter(block => block.type === 'text' && block.text)
130
+ .map(block => block.text)
131
+ .join('\n');
132
+ }
133
+ ```
134
+
135
+ ---
136
+
137
+ ## 📊 Testing Results
138
+
139
+ ### Regression Tests
140
+ - ✅ Anthropic Direct: No regressions
141
+ - ✅ Google Gemini: No regressions
142
+ - ✅ OpenRouter: Fixed from 0% → 80%
143
+
144
+ ### MCP Tools
145
+ - ✅ All 15 tools working through OpenRouter proxy
146
+ - ✅ File operations validated (Write, Read, Bash)
147
+ - ✅ Tool format conversion working (Anthropic ↔ OpenAI)
148
+
149
+ ### Performance
150
+ - GPT-3.5-turbo: 5s (fastest)
151
+ - Mistral 7B: 6s
152
+ - Gemini 2.0 Flash: 6s
153
+ - GPT-4o-mini: 7s
154
+ - Grok 4 Fast: 8s
155
+ - Claude 3.5 Sonnet: 11s
156
+ - Llama 3.1 8B: 14s
157
+
158
+ ---
159
+
160
+ ## 📖 Documentation
161
+
162
+ ### Technical Details
163
+ - [OPENROUTER-FIX-VALIDATION.md](OPENROUTER-FIX-VALIDATION.md) - Technical validation
164
+ - [OPENROUTER-SUCCESS-REPORT.md](OPENROUTER-SUCCESS-REPORT.md) - Comprehensive report
165
+ - [FINAL-TESTING-SUMMARY.md](../testing/FINAL-TESTING-SUMMARY.md) - Complete testing summary
166
+ - [REGRESSION-TEST-RESULTS.md](../testing/REGRESSION-TEST-RESULTS.md) - Regression validation
167
+ - [V1.1.14-BETA-READY.md](V1.1.14-BETA-READY.md) - Beta readiness assessment
168
+
169
+ ### Quick Reference
170
+ - **66+ specialized agents** available
171
+ - **111 MCP tools** for coordination
172
+ - **4 providers:** Anthropic, OpenRouter, Gemini, ONNX
173
+ - **400+ models** via OpenRouter
174
+ - **Zero breaking changes** - fully backward compatible
175
+
176
+ ---
177
+
178
+ ## 🚀 Example Usage
179
+
180
+ ### Basic Code Generation
181
+ ```bash
182
+ # With Anthropic (highest quality)
183
+ npx agentic-flow@beta --agent coder --task "Create REST API with Express"
184
+
185
+ # With OpenRouter GPT-4o-mini (best value)
186
+ npx agentic-flow@beta --agent coder --task "Create REST API with Express" \
187
+ --provider openrouter --model "openai/gpt-4o-mini"
188
+
189
+ # With Grok 4 Fast (free!)
190
+ npx agentic-flow@beta --agent coder --task "Create REST API with Express" \
191
+ --provider openrouter --model "x-ai/grok-4-fast"
192
+ ```
193
+
194
+ ### Multi-Agent Workflows
195
+ ```bash
196
+ # Research task with cheaper model
197
+ npx agentic-flow@beta --agent researcher \
198
+ --task "Research best practices for microservices" \
199
+ --provider openrouter --model "openai/gpt-3.5-turbo"
200
+
201
+ # Code review with high-quality model
202
+ npx agentic-flow@beta --agent reviewer \
203
+ --task "Review my authentication code" \
204
+ --provider openrouter --model "anthropic/claude-3.5-sonnet"
205
+
206
+ # Testing with fast model
207
+ npx agentic-flow@beta --agent tester \
208
+ --task "Create Jest tests for my API" \
209
+ --provider openrouter --model "mistralai/mistral-7b-instruct"
210
+ ```
211
+
212
+ ### Configuration
213
+ ```bash
214
+ # Interactive wizard
215
+ npx agentic-flow@beta config
216
+
217
+ # Set OpenRouter API key
218
+ npx agentic-flow@beta config set OPENROUTER_API_KEY "sk-or-..."
219
+
220
+ # List configuration
221
+ npx agentic-flow@beta config list
222
+ ```
223
+
224
+ ---
225
+
226
+ ## 🐛 Reporting Issues
227
+
228
+ This is a **beta release** - please test and report any issues:
229
+
230
+ **GitHub Issues:** https://github.com/ruvnet/agentic-flow/issues
231
+
232
+ When reporting, please include:
233
+ - Model being used
234
+ - Task description
235
+ - Error message (if any)
236
+ - Output received
237
+ - Expected behavior
238
+
239
+ ---
240
+
241
+ ## 🔄 Upgrade Path
242
+
243
+ ### From v1.1.13 → v1.1.14-beta.1
244
+
245
+ **Changes:**
246
+ - OpenRouter proxy now functional (was 100% broken)
247
+ - No breaking changes to API
248
+ - All existing code continues to work
249
+ - New: 8 OpenRouter models now available
250
+
251
+ **Migration:**
252
+ ```bash
253
+ # Update to beta
254
+ npm install agentic-flow@beta
255
+
256
+ # Or use npx (always fetches the latest beta release)
257
+ npx agentic-flow@beta [commands]
258
+ ```
259
+
260
+ **Rollback if needed:**
261
+ ```bash
262
+ npm install agentic-flow@1.1.13
263
+ ```
264
+
265
+ ---
266
+
267
+ ## 🎯 Next Steps
268
+
269
+ ### Before Stable Release (v1.1.14)
270
+ 1. ⏳ User beta testing feedback
271
+ 2. ⏳ Test DeepSeek models with proper API keys
272
+ 3. ⏳ Debug Llama 3.3 70B timeout issue
273
+ 4. ⏳ Test streaming responses
274
+ 5. ⏳ Performance benchmarking
275
+ 6. ⏳ Additional model validation
276
+
277
+ ### Future Enhancements (v1.2.0)
278
+ 1. Auto-detect best model for task
279
+ 2. Automatic failover between models
280
+ 3. Model capability detection
281
+ 4. Streaming response support
282
+ 5. Cost optimization features
283
+ 6. Performance metrics dashboard
284
+
285
+ ---
286
+
287
+ ## 📈 Success Metrics
288
+
289
+ ### Before v1.1.14-beta.1
290
+ - OpenRouter success rate: **0%** (100% failure)
291
+ - Working models: 0
292
+ - Cost savings: Not available
293
+ - User complaints: High
294
+
295
+ ### After v1.1.14-beta.1
296
+ - OpenRouter success rate: **80%** (8/10 working)
297
+ - Working models: 8
298
+ - Cost savings: Up to **99%**
299
+ - MCP tools: All 15 working
300
+ - Most popular model: ✅ Working (Grok 4 Fast)
301
+
302
+ ---
303
+
304
+ ## ✅ Release Checklist
305
+
306
+ - [x] Core bug fixed (anthropicReq.system)
307
+ - [x] 10 models tested (8 working)
308
+ - [x] Popular models validated (Grok 4 Fast)
309
+ - [x] MCP tools working (all 15)
310
+ - [x] File operations confirmed
311
+ - [x] No regressions in baseline providers
312
+ - [x] Documentation complete
313
+ - [x] Changelog updated
314
+ - [x] Package version updated
315
+ - [x] TypeScript build successful
316
+ - [x] Git tag created
317
+ - [x] NPM published with beta tag
318
+ - [x] GitHub release created
319
+ - [x] npx command verified
320
+ - [x] User communication prepared
321
+
322
+ ---
323
+
324
+ ## 🙏 Credits
325
+
326
+ **Debugging time:** ~4 hours
327
+ **Lines changed:** ~50
328
+ **Models tested:** 10
329
+ **Success rate:** 80%
330
+ **Impact:** Unlocked 400+ models via OpenRouter
331
+
332
+ **Built with:** [Claude Code](https://claude.com/claude-code)
333
+
334
+ ---
335
+
336
+ **Ready for production after beta testing!** 🚀