agentic-flow 1.1.14 → 1.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/agents/custom/test-long-runner.md +44 -0
- package/README.md +50 -1
- package/dist/agents/claudeAgent.js +31 -0
- package/dist/cli/mcp-manager.js +474 -0
- package/dist/cli-proxy.js +22 -1
- package/dist/utils/.claude-flow/metrics/agent-metrics.json +1 -0
- package/dist/utils/.claude-flow/metrics/performance.json +9 -0
- package/dist/utils/.claude-flow/metrics/task-metrics.json +10 -0
- package/dist/utils/cli.js +9 -1
- package/dist/utils/modelOptimizer.js +18 -2
- package/docs/.claude-flow/metrics/performance.json +1 -1
- package/docs/.claude-flow/metrics/task-metrics.json +3 -3
- package/docs/INDEX.md +44 -7
- package/docs/archived/RELEASE-SUMMARY-v1.1.14-beta.1.md +336 -0
- package/docs/archived/V1.1.14-BETA-READY.md +418 -0
- package/docs/guides/ADDING-MCP-SERVERS-CLI.md +515 -0
- package/docs/guides/ADDING-MCP-SERVERS.md +642 -0
- package/docs/mcp-validation/IMPLEMENTATION-SUMMARY.md +493 -0
- package/docs/mcp-validation/MCP-CLI-VALIDATION-REPORT.md +322 -0
- package/docs/mcp-validation/README.md +43 -0
- package/docs/mcp-validation/strange-loops-test.md +63 -0
- package/docs/releases/HOTFIX-v1.2.1.md +315 -0
- package/docs/releases/NPM-PUBLISH-GUIDE-v1.2.0.md +440 -0
- package/docs/releases/PUBLISH-COMPLETE-v1.2.0.md +308 -0
- package/docs/releases/README.md +18 -0
- package/docs/releases/RELEASE-v1.2.0.md +339 -0
- package/docs/testing/AGENT-SYSTEM-VALIDATION.md +517 -0
- package/docs/testing/FINAL-TESTING-SUMMARY.md +362 -0
- package/docs/testing/README.md +46 -0
- package/docs/testing/REGRESSION-TEST-RESULTS.md +269 -0
- package/docs/testing/STREAMING-AND-MCP-VALIDATION.md +517 -0
- package/package.json +2 -2
package/dist/utils/cli.js
CHANGED
|
@@ -16,8 +16,16 @@ export function parseArgs() {
|
|
|
16
16
|
}
|
|
17
17
|
// Check for MCP command
|
|
18
18
|
if (args[0] === 'mcp') {
|
|
19
|
+
const mcpSubcommand = args[1];
|
|
20
|
+
// MCP Manager commands (CLI configuration)
|
|
21
|
+
const managerCommands = ['add', 'list', 'remove', 'enable', 'disable', 'update', 'test', 'info', 'export', 'import'];
|
|
22
|
+
if (managerCommands.includes(mcpSubcommand)) {
|
|
23
|
+
options.mode = 'mcp-manager';
|
|
24
|
+
return options;
|
|
25
|
+
}
|
|
26
|
+
// MCP Server commands (start/stop server)
|
|
19
27
|
options.mode = 'mcp';
|
|
20
|
-
options.mcpCommand =
|
|
28
|
+
options.mcpCommand = mcpSubcommand || 'start'; // default to start
|
|
21
29
|
options.mcpServer = args[2] || 'all'; // default to all servers
|
|
22
30
|
return options;
|
|
23
31
|
}
|
|
@@ -16,6 +16,7 @@ const MODEL_DATABASE = {
|
|
|
16
16
|
speed_score: 85,
|
|
17
17
|
cost_score: 20,
|
|
18
18
|
tier: 'flagship',
|
|
19
|
+
supports_tools: true,
|
|
19
20
|
strengths: ['reasoning', 'coding', 'analysis', 'production'],
|
|
20
21
|
weaknesses: ['cost'],
|
|
21
22
|
bestFor: ['coder', 'reviewer', 'architecture', 'planner', 'production-validator']
|
|
@@ -30,6 +31,7 @@ const MODEL_DATABASE = {
|
|
|
30
31
|
speed_score: 90,
|
|
31
32
|
cost_score: 30,
|
|
32
33
|
tier: 'flagship',
|
|
34
|
+
supports_tools: true,
|
|
33
35
|
strengths: ['multimodal', 'speed', 'general-purpose', 'vision'],
|
|
34
36
|
weaknesses: ['cost'],
|
|
35
37
|
bestFor: ['researcher', 'analyst', 'multimodal-tasks']
|
|
@@ -44,6 +46,7 @@ const MODEL_DATABASE = {
|
|
|
44
46
|
speed_score: 75,
|
|
45
47
|
cost_score: 50,
|
|
46
48
|
tier: 'flagship',
|
|
49
|
+
supports_tools: true,
|
|
47
50
|
strengths: ['reasoning', 'large-context', 'math', 'analysis'],
|
|
48
51
|
weaknesses: ['speed'],
|
|
49
52
|
bestFor: ['planner', 'architecture', 'researcher', 'code-analyzer']
|
|
@@ -59,8 +62,9 @@ const MODEL_DATABASE = {
|
|
|
59
62
|
speed_score: 80,
|
|
60
63
|
cost_score: 100,
|
|
61
64
|
tier: 'cost-effective',
|
|
65
|
+
supports_tools: false, // DeepSeek R1 does NOT support tool/function calling
|
|
62
66
|
strengths: ['reasoning', 'coding', 'math', 'value', 'free'],
|
|
63
|
-
weaknesses: ['newer-model'],
|
|
67
|
+
weaknesses: ['newer-model', 'no-tool-use'],
|
|
64
68
|
bestFor: ['coder', 'pseudocode', 'specification', 'refinement', 'tester']
|
|
65
69
|
},
|
|
66
70
|
'deepseek-chat-v3': {
|
|
@@ -73,6 +77,7 @@ const MODEL_DATABASE = {
|
|
|
73
77
|
speed_score: 90,
|
|
74
78
|
cost_score: 100,
|
|
75
79
|
tier: 'cost-effective',
|
|
80
|
+
supports_tools: true,
|
|
76
81
|
strengths: ['cost', 'speed', 'coding', 'development', 'free'],
|
|
77
82
|
weaknesses: ['complex-reasoning'],
|
|
78
83
|
bestFor: ['coder', 'reviewer', 'tester', 'backend-dev', 'cicd-engineer']
|
|
@@ -88,6 +93,7 @@ const MODEL_DATABASE = {
|
|
|
88
93
|
speed_score: 98,
|
|
89
94
|
cost_score: 98,
|
|
90
95
|
tier: 'balanced',
|
|
96
|
+
supports_tools: true,
|
|
91
97
|
strengths: ['speed', 'cost', 'interactive'],
|
|
92
98
|
weaknesses: ['quality'],
|
|
93
99
|
bestFor: ['researcher', 'planner', 'smart-agent']
|
|
@@ -102,6 +108,7 @@ const MODEL_DATABASE = {
|
|
|
102
108
|
speed_score: 95,
|
|
103
109
|
cost_score: 100,
|
|
104
110
|
tier: 'balanced',
|
|
111
|
+
supports_tools: true,
|
|
105
112
|
strengths: ['open-source', 'versatile', 'coding', 'free', 'fast'],
|
|
106
113
|
weaknesses: ['smaller-model'],
|
|
107
114
|
bestFor: ['coder', 'reviewer', 'base-template-generator', 'tester']
|
|
@@ -116,6 +123,7 @@ const MODEL_DATABASE = {
|
|
|
116
123
|
speed_score: 85,
|
|
117
124
|
cost_score: 90,
|
|
118
125
|
tier: 'balanced',
|
|
126
|
+
supports_tools: true,
|
|
119
127
|
strengths: ['multilingual', 'coding', 'reasoning'],
|
|
120
128
|
weaknesses: ['english-optimized'],
|
|
121
129
|
bestFor: ['researcher', 'coder', 'multilingual-tasks']
|
|
@@ -131,6 +139,7 @@ const MODEL_DATABASE = {
|
|
|
131
139
|
speed_score: 95,
|
|
132
140
|
cost_score: 99,
|
|
133
141
|
tier: 'budget',
|
|
142
|
+
supports_tools: true,
|
|
134
143
|
strengths: ['ultra-low-cost', 'speed'],
|
|
135
144
|
weaknesses: ['quality', 'complex-tasks'],
|
|
136
145
|
bestFor: ['simple-tasks', 'testing']
|
|
@@ -146,6 +155,7 @@ const MODEL_DATABASE = {
|
|
|
146
155
|
speed_score: 30,
|
|
147
156
|
cost_score: 100,
|
|
148
157
|
tier: 'local',
|
|
158
|
+
supports_tools: false,
|
|
149
159
|
strengths: ['privacy', 'offline', 'zero-cost'],
|
|
150
160
|
weaknesses: ['quality', 'speed'],
|
|
151
161
|
bestFor: ['privacy-tasks', 'offline-tasks']
|
|
@@ -197,8 +207,14 @@ export class ModelOptimizer {
|
|
|
197
207
|
const taskComplexity = criteria.taskComplexity || this.inferComplexity(criteria.task);
|
|
198
208
|
// Set default priority to balanced if not specified
|
|
199
209
|
const priority = criteria.priority || 'balanced';
|
|
210
|
+
// Filter models that support tools if required
|
|
211
|
+
let availableModels = Object.entries(MODEL_DATABASE);
|
|
212
|
+
if (criteria.requiresTools) {
|
|
213
|
+
availableModels = availableModels.filter(([key, model]) => model.supports_tools !== false);
|
|
214
|
+
logger.info(`Filtered to ${availableModels.length} models with tool support`);
|
|
215
|
+
}
|
|
200
216
|
// Score all models
|
|
201
|
-
const scoredModels =
|
|
217
|
+
const scoredModels = availableModels.map(([key, model]) => {
|
|
202
218
|
// Calculate overall score based on priority
|
|
203
219
|
let overall_score;
|
|
204
220
|
switch (priority) {
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
[
|
|
2
2
|
{
|
|
3
|
-
"id": "cmd-hooks-
|
|
3
|
+
"id": "cmd-hooks-1759762593563",
|
|
4
4
|
"type": "hooks",
|
|
5
5
|
"success": true,
|
|
6
|
-
"duration":
|
|
7
|
-
"timestamp":
|
|
6
|
+
"duration": 24.05694200000005,
|
|
7
|
+
"timestamp": 1759762593587,
|
|
8
8
|
"metadata": {}
|
|
9
9
|
}
|
|
10
10
|
]
|
package/docs/INDEX.md
CHANGED
|
@@ -54,10 +54,35 @@ Multi-model router configuration and usage.
|
|
|
54
54
|
- [Router Config Reference](router/ROUTER_CONFIG_REFERENCE.md) - Configuration options
|
|
55
55
|
- [Top 20 Models Matrix](router/TOP20_MODELS_MATRIX.md) - Model comparison guide
|
|
56
56
|
|
|
57
|
-
### ✅ [
|
|
58
|
-
|
|
57
|
+
### ✅ [Testing & Validation](testing/)
|
|
58
|
+
Current test results, validation reports, and quality assurance.
|
|
59
59
|
|
|
60
|
-
- [
|
|
60
|
+
- [Testing Overview](testing/README.md) - Current testing documentation
|
|
61
|
+
- [Agent System Validation](testing/AGENT-SYSTEM-VALIDATION.md) - Multi-agent testing
|
|
62
|
+
- [Final Testing Summary](testing/FINAL-TESTING-SUMMARY.md) - Comprehensive coverage
|
|
63
|
+
- [Regression Test Results](testing/REGRESSION-TEST-RESULTS.md) - Regression testing
|
|
64
|
+
- [Streaming & MCP Validation](testing/STREAMING-AND-MCP-VALIDATION.md) - Integration tests
|
|
65
|
+
|
|
66
|
+
### 🔍 [MCP Validation](mcp-validation/)
|
|
67
|
+
Model Context Protocol implementation and validation.
|
|
68
|
+
|
|
69
|
+
- [MCP Validation Overview](mcp-validation/README.md) - MCP testing documentation
|
|
70
|
+
- [Implementation Summary](mcp-validation/IMPLEMENTATION-SUMMARY.md) - MCP implementation
|
|
71
|
+
- [CLI Validation Report](mcp-validation/MCP-CLI-VALIDATION-REPORT.md) - CLI tool testing
|
|
72
|
+
- [Strange Loops Test](mcp-validation/strange-loops-test.md) - Advanced patterns
|
|
73
|
+
|
|
74
|
+
### 📦 [Releases](releases/)
|
|
75
|
+
Version-specific release notes and publishing documentation.
|
|
76
|
+
|
|
77
|
+
- [Release Overview](releases/README.md) - Release documentation index
|
|
78
|
+
- [v1.2.0 Release](releases/RELEASE-v1.2.0.md) - Stable feature release (see the v1.2.1 hotfix below for the latest fixes)
|
|
79
|
+
- [v1.2.0 Publishing Guide](releases/NPM-PUBLISH-GUIDE-v1.2.0.md) - Publishing process
|
|
80
|
+
- [v1.2.1 Hotfix](releases/HOTFIX-v1.2.1.md) - Critical fixes
|
|
81
|
+
|
|
82
|
+
### 🗄️ [Validation Archive](validation/)
|
|
83
|
+
Historical validation reports and test archives.
|
|
84
|
+
|
|
85
|
+
- [Validation Archive](validation/README.md) - Archived test reports
|
|
61
86
|
|
|
62
87
|
### 📦 [Archived](archived/)
|
|
63
88
|
Historical documentation, completed implementations, and validation reports.
|
|
@@ -103,13 +128,15 @@ Historical documentation, completed implementations, and validation reports.
|
|
|
103
128
|
### Path 2: Developers (1.5 hours)
|
|
104
129
|
1. [Architecture Overview](architecture/EXECUTIVE_SUMMARY.md) - System design (20 min)
|
|
105
130
|
2. [Implementation Examples](guides/IMPLEMENTATION_EXAMPLES.md) - Code patterns (40 min)
|
|
106
|
-
3. [Integration Guides](integrations/) - External services (
|
|
131
|
+
3. [Integration Guides](integrations/) - External services (20 min)
|
|
132
|
+
4. [Testing Documentation](testing/) - Quality assurance (10 min)
|
|
107
133
|
|
|
108
134
|
### Path 3: System Architects (2 hours)
|
|
109
135
|
1. [Research Summary](architecture/RESEARCH_SUMMARY.md) - Technical findings (30 min)
|
|
110
136
|
2. [Multi-Model Router Plan](architecture/MULTI_MODEL_ROUTER_PLAN.md) - Router architecture (45 min)
|
|
111
|
-
3. [Integration Status](architecture/INTEGRATION-STATUS.md) - Current state (
|
|
137
|
+
3. [Integration Status](architecture/INTEGRATION-STATUS.md) - Current state (20 min)
|
|
112
138
|
4. [Router Documentation](router/) - Configuration and usage (15 min)
|
|
139
|
+
5. [MCP Validation](mcp-validation/) - Protocol implementation (10 min)
|
|
113
140
|
|
|
114
141
|
---
|
|
115
142
|
|
|
@@ -192,5 +219,15 @@ Historical reports, completed implementations, and superseded guides are in the
|
|
|
192
219
|
|
|
193
220
|
---
|
|
194
221
|
|
|
195
|
-
**Documentation Status**: ✅
|
|
196
|
-
**Last Updated**: October
|
|
222
|
+
**Documentation Status**: ✅ Reorganized and up-to-date
|
|
223
|
+
**Last Updated**: October 6, 2025
|
|
224
|
+
|
|
225
|
+
## 📋 Recent Documentation Updates
|
|
226
|
+
|
|
227
|
+
**v2.0 Reorganization (Oct 6, 2025)**:
|
|
228
|
+
- Created dedicated `releases/` directory for version-specific documentation
|
|
229
|
+
- Consolidated testing reports into `testing/` directory
|
|
230
|
+
- Separated MCP validation into dedicated `mcp-validation/` section
|
|
231
|
+
- Added comprehensive READMEs to all major sections
|
|
232
|
+
- Archived historical v1.1.x releases for cleaner navigation
|
|
233
|
+
- Improved documentation index with better categorization
|
|
@@ -0,0 +1,336 @@
|
|
|
1
|
+
# v1.1.14-beta.1 Release Summary
|
|
2
|
+
|
|
3
|
+
**Date:** 2025-10-05
|
|
4
|
+
**Status:** ✅ **PUBLISHED & LIVE**
|
|
5
|
+
**NPM:** https://www.npmjs.com/package/agentic-flow/v/1.1.14-beta.1
|
|
6
|
+
**GitHub:** https://github.com/ruvnet/agentic-flow/releases/tag/v1.1.14-beta.1
|
|
7
|
+
|
|
8
|
+
---
|
|
9
|
+
|
|
10
|
+
## 🎉 Major Achievement
|
|
11
|
+
|
|
12
|
+
**Fixed a critical OpenRouter proxy bug that was causing a 100% failure rate!**
|
|
13
|
+
|
|
14
|
+
From **0% success** → **80% success** (8 out of 10 models working)
|
|
15
|
+
|
|
16
|
+
---
|
|
17
|
+
|
|
18
|
+
## Installation & Usage
|
|
19
|
+
|
|
20
|
+
### Install Beta Version
|
|
21
|
+
```bash
|
|
22
|
+
# Install globally
|
|
23
|
+
npm install -g agentic-flow@beta
|
|
24
|
+
|
|
25
|
+
# Or use with npx (no installation needed)
|
|
26
|
+
npx agentic-flow@beta --help
|
|
27
|
+
```
|
|
28
|
+
|
|
29
|
+
### Quick Start
|
|
30
|
+
```bash
|
|
31
|
+
# List available agents
|
|
32
|
+
npx agentic-flow@beta --list
|
|
33
|
+
|
|
34
|
+
# Run with Anthropic (default)
|
|
35
|
+
npx agentic-flow@beta --agent coder --task "Write Python hello world"
|
|
36
|
+
|
|
37
|
+
# Run with OpenRouter (up to 99% cost savings!)
|
|
38
|
+
npx agentic-flow@beta --agent coder --task "Write Python hello world" \
|
|
39
|
+
--provider openrouter --model "openai/gpt-4o-mini"
|
|
40
|
+
|
|
41
|
+
# Run with Grok 4 Fast (FREE!)
|
|
42
|
+
npx agentic-flow@beta --agent coder --task "Write Python hello world" \
|
|
43
|
+
--provider openrouter --model "x-ai/grok-4-fast"
|
|
44
|
+
```
|
|
45
|
+
|
|
46
|
+
---
|
|
47
|
+
|
|
48
|
+
## ✅ Verified Working
|
|
49
|
+
|
|
50
|
+
### NPX Command
|
|
51
|
+
```bash
|
|
52
|
+
$ npx agentic-flow@beta --version
|
|
53
|
+
agentic-flow v1.1.14-beta.1
|
|
54
|
+
|
|
55
|
+
$ npx agentic-flow@beta --help
|
|
56
|
+
🤖 Agentic Flow v1.1.14-beta.1 - AI Agent Orchestration with OpenRouter Support
|
|
57
|
+
[Full help output shown]
|
|
58
|
+
|
|
59
|
+
$ npx agentic-flow@beta --agent coder --task "hello world" --provider anthropic
|
|
60
|
+
✅ Completed! [Working perfectly]
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
### OpenRouter Models (8/10 = 80%)
|
|
64
|
+
|
|
65
|
+
| Model | Status | Time | Cost/M Tokens | Use Case |
|
|
66
|
+
|-------|--------|------|---------------|----------|
|
|
67
|
+
| **openai/gpt-4o-mini** | ✅ | 7s | $0.15 | Best value |
|
|
68
|
+
| **openai/gpt-3.5-turbo** | ✅ | 5s | $0.50 | Fastest |
|
|
69
|
+
| **meta-llama/llama-3.1-8b-instruct** | ✅ | 14s | $0.06 | Open source |
|
|
70
|
+
| **anthropic/claude-3.5-sonnet** | ✅ | 11s | $3.00 | Highest quality |
|
|
71
|
+
| **mistralai/mistral-7b-instruct** | ✅ | 6s | $0.25 | Fast & efficient |
|
|
72
|
+
| **google/gemini-2.0-flash-exp** | ✅ | 6s | Free | Free tier |
|
|
73
|
+
| **x-ai/grok-4-fast** | ✅ | 8s | Free | #1 most popular! |
|
|
74
|
+
| **z-ai/glm-4.6** | ✅ | 5s | Varies | Fixed in this release |
|
|
75
|
+
|
|
76
|
+
### Known Issues (2/10)
|
|
77
|
+
| Model | Issue | Workaround |
|
|
78
|
+
|-------|-------|------------|
|
|
79
|
+
| **meta-llama/llama-3.3-70b-instruct** | Intermittent timeout | Use llama-3.1-8b instead |
|
|
80
|
+
| **x-ai/grok-4** | Too slow (60s+) | Use grok-4-fast instead |
|
|
81
|
+
|
|
82
|
+
---
|
|
83
|
+
|
|
84
|
+
## 💰 Cost Savings
|
|
85
|
+
|
|
86
|
+
### Comparison vs Claude Direct API
|
|
87
|
+
|
|
88
|
+
| Model | Cost | vs Claude ($3/M) | Savings |
|
|
89
|
+
|-------|------|------------------|---------|
|
|
90
|
+
| GPT-4o-mini | $0.15/M | $2.85 | **95%** |
|
|
91
|
+
| Llama 3.1 8B | $0.06/M | $2.94 | **98%** |
|
|
92
|
+
| Mistral 7B | $0.25/M | $2.75 | **92%** |
|
|
93
|
+
| GPT-3.5-turbo | $0.50/M | $2.50 | **83%** |
|
|
94
|
+
| Grok 4 Fast | Free | $3.00 | **100%** |
|
|
95
|
+
| Gemini 2.0 Flash | Free | $3.00 | **100%** |
|
|
96
|
+
|
|
97
|
+
**Average savings: ~95% across the six models compared above**
|
|
98
|
+
|
|
99
|
+
---
|
|
100
|
+
|
|
101
|
+
## 🔧 What Was Fixed
|
|
102
|
+
|
|
103
|
+
### Critical Bug
|
|
104
|
+
**TypeError: anthropicReq.system?.substring is not a function**
|
|
105
|
+
|
|
106
|
+
**Root Cause:**
|
|
107
|
+
- The Anthropic API allows the `system` field to be a string OR an array of content blocks
|
|
108
|
+
- The Claude Agent SDK sends it as an array (for prompt caching)
|
|
109
|
+
- Proxy assumed string only → called `.substring()` on array → crash
|
|
110
|
+
- Result: 100% failure rate
|
|
111
|
+
|
|
112
|
+
**Solution:**
|
|
113
|
+
```typescript
|
|
114
|
+
// Before (BROKEN)
|
|
115
|
+
interface AnthropicRequest {
|
|
116
|
+
system?: string;
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
// After (FIXED)
|
|
120
|
+
interface AnthropicRequest {
|
|
121
|
+
system?: string | Array<{ type: string; text?: string; [key: string]: any }>;
|
|
122
|
+
}
|
|
123
|
+
|
|
124
|
+
// Safe extraction logic
|
|
125
|
+
if (typeof anthropicReq.system === 'string') {
|
|
126
|
+
originalSystem = anthropicReq.system;
|
|
127
|
+
} else if (Array.isArray(anthropicReq.system)) {
|
|
128
|
+
originalSystem = anthropicReq.system
|
|
129
|
+
.filter(block => block.type === 'text' && block.text)
|
|
130
|
+
.map(block => block.text)
|
|
131
|
+
.join('\n');
|
|
132
|
+
}
|
|
133
|
+
```
|
|
134
|
+
|
|
135
|
+
---
|
|
136
|
+
|
|
137
|
+
## 📊 Testing Results
|
|
138
|
+
|
|
139
|
+
### Regression Tests
|
|
140
|
+
- ✅ Anthropic Direct: No regressions
|
|
141
|
+
- ✅ Google Gemini: No regressions
|
|
142
|
+
- ✅ OpenRouter: Fixed from 0% → 80%
|
|
143
|
+
|
|
144
|
+
### MCP Tools
|
|
145
|
+
- ✅ All 15 tools working through OpenRouter proxy
|
|
146
|
+
- ✅ File operations validated (Write, Read, Bash)
|
|
147
|
+
- ✅ Tool format conversion working (Anthropic ↔ OpenAI)
|
|
148
|
+
|
|
149
|
+
### Performance
|
|
150
|
+
- GPT-3.5-turbo: 5s (fastest)
|
|
151
|
+
- Mistral 7B: 6s
|
|
152
|
+
- Gemini 2.0 Flash: 6s
|
|
153
|
+
- GPT-4o-mini: 7s
|
|
154
|
+
- Grok 4 Fast: 8s
|
|
155
|
+
- Claude 3.5 Sonnet: 11s
|
|
156
|
+
- Llama 3.1 8B: 14s
|
|
157
|
+
|
|
158
|
+
---
|
|
159
|
+
|
|
160
|
+
## 📖 Documentation
|
|
161
|
+
|
|
162
|
+
### Technical Details
|
|
163
|
+
- [OPENROUTER-FIX-VALIDATION.md](OPENROUTER-FIX-VALIDATION.md) - Technical validation
|
|
164
|
+
- [OPENROUTER-SUCCESS-REPORT.md](OPENROUTER-SUCCESS-REPORT.md) - Comprehensive report
|
|
165
|
+
- [FINAL-TESTING-SUMMARY.md](../testing/FINAL-TESTING-SUMMARY.md) - Complete testing summary
|
|
166
|
+
- [REGRESSION-TEST-RESULTS.md](../testing/REGRESSION-TEST-RESULTS.md) - Regression validation
|
|
167
|
+
- [V1.1.14-BETA-READY.md](V1.1.14-BETA-READY.md) - Beta readiness assessment
|
|
168
|
+
|
|
169
|
+
### Quick Reference
|
|
170
|
+
- **66+ specialized agents** available
|
|
171
|
+
- **111 MCP tools** for coordination
|
|
172
|
+
- **4 providers:** Anthropic, OpenRouter, Gemini, ONNX
|
|
173
|
+
- **400+ models** via OpenRouter
|
|
174
|
+
- **Zero breaking changes** - fully backward compatible
|
|
175
|
+
|
|
176
|
+
---
|
|
177
|
+
|
|
178
|
+
## 🚀 Example Usage
|
|
179
|
+
|
|
180
|
+
### Basic Code Generation
|
|
181
|
+
```bash
|
|
182
|
+
# With Anthropic (highest quality)
|
|
183
|
+
npx agentic-flow@beta --agent coder --task "Create REST API with Express"
|
|
184
|
+
|
|
185
|
+
# With OpenRouter GPT-4o-mini (best value)
|
|
186
|
+
npx agentic-flow@beta --agent coder --task "Create REST API with Express" \
|
|
187
|
+
--provider openrouter --model "openai/gpt-4o-mini"
|
|
188
|
+
|
|
189
|
+
# With Grok 4 Fast (free!)
|
|
190
|
+
npx agentic-flow@beta --agent coder --task "Create REST API with Express" \
|
|
191
|
+
--provider openrouter --model "x-ai/grok-4-fast"
|
|
192
|
+
```
|
|
193
|
+
|
|
194
|
+
### Multi-Agent Workflows
|
|
195
|
+
```bash
|
|
196
|
+
# Research task with cheaper model
|
|
197
|
+
npx agentic-flow@beta --agent researcher \
|
|
198
|
+
--task "Research best practices for microservices" \
|
|
199
|
+
--provider openrouter --model "openai/gpt-3.5-turbo"
|
|
200
|
+
|
|
201
|
+
# Code review with high-quality model
|
|
202
|
+
npx agentic-flow@beta --agent reviewer \
|
|
203
|
+
--task "Review my authentication code" \
|
|
204
|
+
--provider openrouter --model "anthropic/claude-3.5-sonnet"
|
|
205
|
+
|
|
206
|
+
# Testing with fast model
|
|
207
|
+
npx agentic-flow@beta --agent tester \
|
|
208
|
+
--task "Create Jest tests for my API" \
|
|
209
|
+
--provider openrouter --model "mistralai/mistral-7b-instruct"
|
|
210
|
+
```
|
|
211
|
+
|
|
212
|
+
### Configuration
|
|
213
|
+
```bash
|
|
214
|
+
# Interactive wizard
|
|
215
|
+
npx agentic-flow@beta config
|
|
216
|
+
|
|
217
|
+
# Set OpenRouter API key
|
|
218
|
+
npx agentic-flow@beta config set OPENROUTER_API_KEY "sk-or-..."
|
|
219
|
+
|
|
220
|
+
# List configuration
|
|
221
|
+
npx agentic-flow@beta config list
|
|
222
|
+
```
|
|
223
|
+
|
|
224
|
+
---
|
|
225
|
+
|
|
226
|
+
## 🐛 Reporting Issues
|
|
227
|
+
|
|
228
|
+
This is a **beta release** - please test and report any issues:
|
|
229
|
+
|
|
230
|
+
**GitHub Issues:** https://github.com/ruvnet/agentic-flow/issues
|
|
231
|
+
|
|
232
|
+
When reporting, please include:
|
|
233
|
+
- Model being used
|
|
234
|
+
- Task description
|
|
235
|
+
- Error message (if any)
|
|
236
|
+
- Output received
|
|
237
|
+
- Expected behavior
|
|
238
|
+
|
|
239
|
+
---
|
|
240
|
+
|
|
241
|
+
## 🔄 Upgrade Path
|
|
242
|
+
|
|
243
|
+
### From v1.1.13 → v1.1.14-beta.1
|
|
244
|
+
|
|
245
|
+
**Changes:**
|
|
246
|
+
- OpenRouter proxy now functional (was 100% broken)
|
|
247
|
+
- No breaking changes to API
|
|
248
|
+
- All existing code continues to work
|
|
249
|
+
- New: 8 OpenRouter models now available
|
|
250
|
+
|
|
251
|
+
**Migration:**
|
|
252
|
+
```bash
|
|
253
|
+
# Update to beta
|
|
254
|
+
npm install agentic-flow@beta
|
|
255
|
+
|
|
256
|
+
# Or use npx (always gets latest)
|
|
257
|
+
npx agentic-flow@beta [commands]
|
|
258
|
+
```
|
|
259
|
+
|
|
260
|
+
**Rollback if needed:**
|
|
261
|
+
```bash
|
|
262
|
+
npm install agentic-flow@1.1.13
|
|
263
|
+
```
|
|
264
|
+
|
|
265
|
+
---
|
|
266
|
+
|
|
267
|
+
## 🎯 Next Steps
|
|
268
|
+
|
|
269
|
+
### Before Stable Release (v1.1.14)
|
|
270
|
+
1. ⏳ User beta testing feedback
|
|
271
|
+
2. ⏳ Test DeepSeek models with proper API keys
|
|
272
|
+
3. ⏳ Debug Llama 3.3 70B timeout issue
|
|
273
|
+
4. ⏳ Test streaming responses
|
|
274
|
+
5. ⏳ Performance benchmarking
|
|
275
|
+
6. ⏳ Additional model validation
|
|
276
|
+
|
|
277
|
+
### Future Enhancements (v1.2.0)
|
|
278
|
+
1. Auto-detect best model for task
|
|
279
|
+
2. Automatic failover between models
|
|
280
|
+
3. Model capability detection
|
|
281
|
+
4. Streaming response support
|
|
282
|
+
5. Cost optimization features
|
|
283
|
+
6. Performance metrics dashboard
|
|
284
|
+
|
|
285
|
+
---
|
|
286
|
+
|
|
287
|
+
## 📈 Success Metrics
|
|
288
|
+
|
|
289
|
+
### Before v1.1.14-beta.1
|
|
290
|
+
- OpenRouter success rate: **0%** (100% failure)
|
|
291
|
+
- Working models: 0
|
|
292
|
+
- Cost savings: Not available
|
|
293
|
+
- User complaints: High
|
|
294
|
+
|
|
295
|
+
### After v1.1.14-beta.1
|
|
296
|
+
- OpenRouter success rate: **80%** (8/10 working)
|
|
297
|
+
- Working models: 8
|
|
298
|
+
- Cost savings: Up to **99%**
|
|
299
|
+
- MCP tools: All 15 working
|
|
300
|
+
- Most popular model: ✅ Working (Grok 4 Fast)
|
|
301
|
+
|
|
302
|
+
---
|
|
303
|
+
|
|
304
|
+
## ✅ Release Checklist
|
|
305
|
+
|
|
306
|
+
- [x] Core bug fixed (anthropicReq.system)
|
|
307
|
+
- [x] 10 models tested (8 working)
|
|
308
|
+
- [x] Popular models validated (Grok 4 Fast)
|
|
309
|
+
- [x] MCP tools working (all 15)
|
|
310
|
+
- [x] File operations confirmed
|
|
311
|
+
- [x] No regressions in baseline providers
|
|
312
|
+
- [x] Documentation complete
|
|
313
|
+
- [x] Changelog updated
|
|
314
|
+
- [x] Package version updated
|
|
315
|
+
- [x] TypeScript build successful
|
|
316
|
+
- [x] Git tag created
|
|
317
|
+
- [x] NPM published with beta tag
|
|
318
|
+
- [x] GitHub release created
|
|
319
|
+
- [x] npx command verified
|
|
320
|
+
- [x] User communication prepared
|
|
321
|
+
|
|
322
|
+
---
|
|
323
|
+
|
|
324
|
+
## 🙏 Credits
|
|
325
|
+
|
|
326
|
+
**Debugging time:** ~4 hours
|
|
327
|
+
**Lines changed:** ~50
|
|
328
|
+
**Models tested:** 10
|
|
329
|
+
**Success rate:** 80%
|
|
330
|
+
**Impact:** Unlocked 400+ models via OpenRouter
|
|
331
|
+
|
|
332
|
+
**Built with:** [Claude Code](https://claude.com/claude-code)
|
|
333
|
+
|
|
334
|
+
---
|
|
335
|
+
|
|
336
|
+
**Ready for production after beta testing!** 🚀
|