tachibot-mcp 2.0.5 → 2.0.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.env.example +5 -2
- package/dist/src/config/model-constants.js +85 -72
- package/dist/src/config/model-preferences.js +5 -4
- package/dist/src/config.js +2 -1
- package/dist/src/mcp-client.js +3 -3
- package/dist/src/modes/scout.js +2 -1
- package/dist/src/optimization/model-router.js +19 -16
- package/dist/src/orchestrator-instructions.js +1 -1
- package/dist/src/orchestrator-lite.js +1 -1
- package/dist/src/orchestrator.js +1 -1
- package/dist/src/profiles/balanced.js +1 -2
- package/dist/src/profiles/code_focus.js +1 -2
- package/dist/src/profiles/full.js +1 -2
- package/dist/src/profiles/minimal.js +1 -2
- package/dist/src/profiles/research_power.js +1 -2
- package/dist/src/server.js +13 -12
- package/dist/src/tools/gemini-tools.js +15 -16
- package/dist/src/tools/grok-enhanced.js +21 -17
- package/dist/src/tools/grok-tools.js +26 -20
- package/dist/src/tools/openai-tools.js +28 -61
- package/dist/src/tools/tool-router.js +53 -52
- package/dist/src/tools/unified-ai-provider.js +1 -1
- package/dist/src/tools/workflow-runner.js +16 -0
- package/dist/src/tools/workflow-validator-tool.js +1 -1
- package/dist/src/utils/api-keys.js +20 -0
- package/dist/src/validators/interpolation-validator.js +4 -0
- package/dist/src/validators/tool-registry-validator.js +1 -1
- package/dist/src/validators/tool-types.js +0 -1
- package/dist/src/workflows/custom-workflows.js +4 -3
- package/dist/src/workflows/engine/VariableInterpolator.js +30 -3
- package/dist/src/workflows/engine/WorkflowExecutionEngine.js +2 -2
- package/dist/src/workflows/engine/WorkflowOutputFormatter.js +27 -4
- package/dist/src/workflows/fallback-strategies.js +2 -2
- package/dist/src/workflows/model-router.js +30 -5
- package/dist/src/workflows/tool-mapper.js +41 -14
- package/docs/API_KEYS.md +10 -6
- package/docs/TOOLS_REFERENCE.md +7 -43
- package/package.json +1 -1
- package/profiles/balanced.json +1 -2
- package/profiles/code_focus.json +1 -2
- package/profiles/debug_intensive.json +0 -1
- package/profiles/full.json +2 -3
- package/profiles/minimal.json +1 -2
- package/profiles/research_power.json +1 -2
- package/profiles/workflow_builder.json +1 -2
- package/smithery.yaml +2 -2
- package/tools.config.json +15 -3
- package/workflows/code-architecture-review.yaml +5 -3
- package/workflows/creative-brainstorm-yaml.yaml +1 -1
- package/workflows/pingpong.yaml +5 -3
- package/workflows/system/README.md +1 -1
- package/workflows/system/verifier.yaml +8 -5
- package/workflows/ultra-creative-brainstorm.yaml +3 -3
|
@@ -2,12 +2,13 @@
|
|
|
2
2
|
* Tool Mapper - Maps workflow tool names to actual MCP tool implementations
|
|
3
3
|
* Enables workflows to call real tools instead of returning placeholders
|
|
4
4
|
*/
|
|
5
|
-
import { callGemini
|
|
5
|
+
import { callGemini } from "../tools/gemini-tools.js";
|
|
6
6
|
import { getAllPerplexityTools } from "../tools/perplexity-tools.js";
|
|
7
7
|
import { callOpenAI } from "../tools/openai-tools.js";
|
|
8
8
|
import { callGrok, GrokModel } from "../tools/grok-tools.js";
|
|
9
|
-
import { GPT51_MODELS, TOOL_DEFAULTS, } from "../config/model-constants.js";
|
|
9
|
+
import { GPT51_MODELS, TOOL_DEFAULTS, GEMINI_MODELS, } from "../config/model-constants.js";
|
|
10
10
|
import { validateToolInput } from "../utils/input-validator.js";
|
|
11
|
+
import { hasGrokApiKey } from "../utils/api-keys.js";
|
|
11
12
|
// Lazy load OpenRouter for Qwen models
|
|
12
13
|
let callOpenRouter = null;
|
|
13
14
|
let OpenRouterModel = null;
|
|
@@ -74,7 +75,8 @@ export async function executeWorkflowTool(toolName, input, options = {}) {
|
|
|
74
75
|
if (typeof input === "string")
|
|
75
76
|
return input;
|
|
76
77
|
// Try all common parameter names (order matters!)
|
|
77
|
-
return input.
|
|
78
|
+
return input.thought || // think tool reflection
|
|
79
|
+
input.requirements || // qwen_coder, task-specific
|
|
78
80
|
input.problem || // brainstorm, reasoning tools
|
|
79
81
|
input.query || // search/ask tools
|
|
80
82
|
input.topic || // research tools
|
|
@@ -144,7 +146,7 @@ export async function executeWorkflowTool(toolName, input, options = {}) {
|
|
|
144
146
|
case "gemini_brainstorm":
|
|
145
147
|
case "gemini_analyze_code":
|
|
146
148
|
case "gemini_analyze_text":
|
|
147
|
-
actualModel = model === "flash" ?
|
|
149
|
+
actualModel = model === "flash" ? GEMINI_MODELS.FLASH : GEMINI_MODELS.GEMINI_3_PRO;
|
|
148
150
|
return buildResult(await callGemini(prompt, actualModel, systemPrompt, temperature, options.skipValidation || false), actualModel);
|
|
149
151
|
// ============ PERPLEXITY TOOLS ============
|
|
150
152
|
case "perplexity_ask":
|
|
@@ -209,26 +211,51 @@ export async function executeWorkflowTool(toolName, input, options = {}) {
|
|
|
209
211
|
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), actualModel, temperature, maxTokens, "low", // reasoningEffort
|
|
210
212
|
false, // requireConfirmation
|
|
211
213
|
options.skipValidation || false), actualModel);
|
|
214
|
+
case "openai_reason":
|
|
215
|
+
// GPT-5 Pro with high reasoning effort for complex reasoning
|
|
216
|
+
actualModel = GPT51_MODELS.PRO;
|
|
217
|
+
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), actualModel, temperature, maxTokens, "high", // reasoningEffort
|
|
218
|
+
false, // requireConfirmation
|
|
219
|
+
options.skipValidation || false), actualModel);
|
|
220
|
+
case "openai_code_review":
|
|
221
|
+
// GPT-5.1 codex-mini for code review (medium reasoning)
|
|
222
|
+
actualModel = GPT51_MODELS.CODEX_MINI;
|
|
223
|
+
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt || "You are an expert code reviewer. Provide thorough code review with specific, actionable feedback."), actualModel, 0.3, // Low temperature for consistent code review
|
|
224
|
+
maxTokens, "medium", // reasoningEffort
|
|
225
|
+
false, options.skipValidation || false), actualModel);
|
|
226
|
+
case "openai_explain":
|
|
227
|
+
// GPT-5.1 codex-mini for explanations (low reasoning)
|
|
228
|
+
actualModel = GPT51_MODELS.CODEX_MINI;
|
|
229
|
+
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt || "You are an expert educator. Provide clear, engaging explanations."), actualModel, temperature, maxTokens, "low", // reasoningEffort
|
|
230
|
+
false, options.skipValidation || false), actualModel);
|
|
212
231
|
case "gpt5_analyze":
|
|
213
232
|
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), GPT51_MODELS.CODEX_MINI, 0.7, maxTokens), GPT51_MODELS.CODEX_MINI);
|
|
214
233
|
case "openai_reason":
|
|
215
234
|
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), GPT51_MODELS.CODEX_MINI, temperature, maxTokens), GPT51_MODELS.CODEX_MINI);
|
|
216
235
|
// ============ GPT-5 TOOLS ============
|
|
217
236
|
case "gpt5":
|
|
237
|
+
// Map to flagship gpt-5.1
|
|
238
|
+
const gpt5Full = GPT51_MODELS.FULL; // gpt-5.1 flagship
|
|
239
|
+
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), gpt5Full, 0.7, maxTokens, "medium"), gpt5Full);
|
|
218
240
|
case "gpt5_mini":
|
|
219
|
-
|
|
220
|
-
|
|
221
|
-
|
|
222
|
-
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), gpt51Model, 0.7, maxTokens, "low"), gpt51Model);
|
|
241
|
+
// Map to gpt-5.1-codex-mini for code tasks (most workflows use for code)
|
|
242
|
+
const gpt5CodexMini = GPT51_MODELS.CODEX_MINI; // gpt-5.1-codex-mini
|
|
243
|
+
return buildResult(await callOpenAI(toMessages(prompt, systemPrompt), gpt5CodexMini, 0.7, maxTokens, "low"), gpt5CodexMini);
|
|
223
244
|
// ============ GROK TOOLS ============
|
|
224
245
|
case "grok":
|
|
225
246
|
case "grok_reason":
|
|
226
|
-
case "grok_code":
|
|
227
|
-
case "grok_debug":
|
|
228
247
|
case "grok_brainstorm":
|
|
229
|
-
case "grok_heavy": // Grok Heavy is just grok-4-0709 with more backend resources
|
|
230
248
|
case "grok_search":
|
|
231
|
-
|
|
249
|
+
// Use reasoning model for reasoning/creative tasks
|
|
250
|
+
actualModel = GrokModel.GROK_4_1_FAST_REASONING; // Latest 4.1 (2M context, $0.20/$0.50)
|
|
251
|
+
return buildResult(await callGrok(toMessages(prompt, systemPrompt), actualModel, temperature, maxTokens), actualModel);
|
|
252
|
+
case "grok_code":
|
|
253
|
+
case "grok_debug":
|
|
254
|
+
// Use non-reasoning model for code/debug (tool-calling optimized)
|
|
255
|
+
actualModel = GrokModel.GROK_4_1_FAST; // Latest 4.1 non-reasoning (2M context, $0.20/$0.50)
|
|
256
|
+
return buildResult(await callGrok(toMessages(prompt, systemPrompt), actualModel, temperature, maxTokens), actualModel);
|
|
257
|
+
case "grok_heavy": // Grok Heavy is grok-4-0709 with extended context
|
|
258
|
+
actualModel = GrokModel.GROK_4_HEAVY; // Expensive $3/$15
|
|
232
259
|
return buildResult(await callGrok(toMessages(prompt, systemPrompt), actualModel, temperature, maxTokens), actualModel);
|
|
233
260
|
// ============ ADVANCED MODES ============
|
|
234
261
|
case "verifier":
|
|
@@ -381,9 +408,9 @@ export function getAvailableTools() {
|
|
|
381
408
|
tools.push("perplexity_ask", "perplexity_research", "perplexity_reason", "perplexity_code_search");
|
|
382
409
|
}
|
|
383
410
|
if (process.env.OPENAI_API_KEY) {
|
|
384
|
-
tools.push("openai_brainstorm", "gpt5_analyze", "openai_reason", "gpt5", "gpt5_mini"
|
|
411
|
+
tools.push("openai_brainstorm", "openai_reason", "openai_code_review", "openai_explain", "gpt5_analyze", "openai_reason", "gpt5", "gpt5_mini");
|
|
385
412
|
}
|
|
386
|
-
if (
|
|
413
|
+
if (hasGrokApiKey()) {
|
|
387
414
|
tools.push("grok", "grok_reason", "grok_code", "grok_debug", "grok_brainstorm", "grok_search");
|
|
388
415
|
}
|
|
389
416
|
// Add modes if available
|
package/docs/API_KEYS.md
CHANGED
|
@@ -48,7 +48,7 @@ TachiBot MCP works with multiple AI providers to offer diverse capabilities. You
|
|
|
48
48
|
|----------|--------------|----------------|
|
|
49
49
|
| **Perplexity** | Research, web search | `perplexity_ask`, `perplexity_research`, `perplexity_reason`, `scout` (default) |
|
|
50
50
|
| **Grok/xAI** | Live search, reasoning | `grok_search`, `grok_reason`, `grok_code`, `grok_debug`, `grok_architect`, `grok_brainstorm`, `scout` (with grok) |
|
|
51
|
-
| **OpenAI** | GPT-5 models | `openai_brainstorm`, `
|
|
51
|
+
| **OpenAI** | GPT-5 models | `openai_brainstorm`, `openai_reason`, `openai_code_review`, `openai_explain`, `focus` (some modes), `verifier`, `challenger` |
|
|
52
52
|
| **Google** | Gemini models | `gemini_brainstorm`, `gemini_analyze_code`, `gemini_analyze_text`, `verifier`, `scout` |
|
|
53
53
|
| **OpenRouter** | Qwen models | `qwen_coder`, `qwen_competitive` |
|
|
54
54
|
|
|
@@ -116,15 +116,19 @@ Grok (by xAI) provides live web search, reasoning, and code analysis.
|
|
|
116
116
|
|
|
117
117
|
#### Models Available
|
|
118
118
|
|
|
119
|
-
- **grok-4** - Latest reasoning
|
|
120
|
-
- **grok-4-
|
|
121
|
-
- **grok-4-
|
|
119
|
+
- **grok-4-1-fast-reasoning** - Latest (Nov 2025): Enhanced reasoning, creativity & emotional intelligence (2M context)
|
|
120
|
+
- **grok-4-1-fast-non-reasoning** - Tool-calling optimized: Fast inference, agentic workflows (2M context)
|
|
121
|
+
- **grok-4-fast-reasoning** - Previous reasoning model
|
|
122
|
+
- **grok-4-0709** - Heavy model (expensive, use sparingly)
|
|
123
|
+
- **grok-code-fast-1** - Coding specialist
|
|
122
124
|
|
|
123
125
|
#### Pricing
|
|
124
126
|
|
|
125
127
|
| Model | Input | Output | Notes |
|
|
126
128
|
|-------|-------|--------|-------|
|
|
127
|
-
| Grok-4 | $
|
|
129
|
+
| Grok-4.1 Fast (reasoning) | $0.20 / 1M tokens | $0.50 / 1M tokens | Latest & best! |
|
|
130
|
+
| Grok-4.1 Fast (non-reasoning) | $0.20 / 1M tokens | $0.50 / 1M tokens | Tool-calling optimized |
|
|
131
|
+
| Grok-4 | $5.00 / 1M tokens | $15.00 / 1M tokens | Previous version |
|
|
128
132
|
| Grok-4-heavy | $10.00 / 1M tokens | $30.00 / 1M tokens | 256k context |
|
|
129
133
|
| **Live Search** | **$5 / 1k sources** | - | Extra cost per search! |
|
|
130
134
|
|
|
@@ -203,7 +207,7 @@ OpenAI provides GPT-5 models for brainstorming, comparison, and reasoning.
|
|
|
203
207
|
|
|
204
208
|
- Single `openai_brainstorm` (gpt-5-mini): ~$0.01 - $0.03
|
|
205
209
|
- Single `openai_brainstorm` (gpt-5): ~$0.15 - $0.40
|
|
206
|
-
- Single `
|
|
210
|
+
- Single `openai_code_review`: ~$0.02 - $0.05
|
|
207
211
|
|
|
208
212
|
**Tip:** Use `model: "gpt-5-mini"` by default; reserve `gpt-5` for complex tasks.
|
|
209
213
|
|
package/docs/TOOLS_REFERENCE.md
CHANGED
|
@@ -22,9 +22,8 @@
|
|
|
22
22
|
- [grok_architect](#grok_architect)
|
|
23
23
|
- [grok_brainstorm](#grok_brainstorm)
|
|
24
24
|
- [OpenAI Suite](#openai-suite)
|
|
25
|
-
- [
|
|
25
|
+
- [openai_reason](#openai_reason)
|
|
26
26
|
- [openai_brainstorm](#openai_brainstorm)
|
|
27
|
-
- [openai_compare](#openai_compare)
|
|
28
27
|
- [openai_code_review](#openai_code_review)
|
|
29
28
|
- [openai_explain](#openai_explain)
|
|
30
29
|
- [Gemini Suite](#gemini-suite)
|
|
@@ -514,7 +513,7 @@ perplexity_reason({
|
|
|
514
513
|
|
|
515
514
|
### grok_search
|
|
516
515
|
|
|
517
|
-
Cost-optimized web search using Grok-4's live search with advanced filtering.
|
|
516
|
+
Cost-optimized web search using Grok-4.1's live search with advanced filtering and enhanced reasoning.
|
|
518
517
|
|
|
519
518
|
#### Schema
|
|
520
519
|
|
|
@@ -640,7 +639,7 @@ grok_search({
|
|
|
640
639
|
|
|
641
640
|
### grok_reason
|
|
642
641
|
|
|
643
|
-
Deep logical reasoning with Grok-4 using first principles.
|
|
642
|
+
Deep logical reasoning with Grok-4.1 using first principles and enhanced emotional intelligence.
|
|
644
643
|
|
|
645
644
|
#### Schema
|
|
646
645
|
|
|
@@ -686,7 +685,7 @@ grok_reason({
|
|
|
686
685
|
|
|
687
686
|
### grok_code
|
|
688
687
|
|
|
689
|
-
Code analysis and optimization with Grok-4.
|
|
688
|
+
Code analysis and optimization with Grok-4.1 Fast (tool-calling optimized).
|
|
690
689
|
|
|
691
690
|
#### Schema
|
|
692
691
|
|
|
@@ -738,7 +737,7 @@ grok_code({
|
|
|
738
737
|
|
|
739
738
|
### grok_debug
|
|
740
739
|
|
|
741
|
-
Deep debugging assistance with Grok-4.
|
|
740
|
+
Deep debugging assistance with Grok-4.1 Fast.
|
|
742
741
|
|
|
743
742
|
#### Schema
|
|
744
743
|
|
|
@@ -772,7 +771,7 @@ grok_debug({
|
|
|
772
771
|
|
|
773
772
|
### grok_architect
|
|
774
773
|
|
|
775
|
-
System architecture and design with Grok-4.
|
|
774
|
+
System architecture and design with Grok-4.1.
|
|
776
775
|
|
|
777
776
|
#### Schema
|
|
778
777
|
|
|
@@ -800,7 +799,7 @@ grok_architect({
|
|
|
800
799
|
|
|
801
800
|
### grok_brainstorm
|
|
802
801
|
|
|
803
|
-
Creative brainstorming using Grok-4
|
|
802
|
+
Creative brainstorming using Grok-4.1 with enhanced creativity and emotional intelligence.
|
|
804
803
|
|
|
805
804
|
#### Schema
|
|
806
805
|
|
|
@@ -928,41 +927,6 @@ openai_brainstorm({
|
|
|
928
927
|
|
|
929
928
|
---
|
|
930
929
|
|
|
931
|
-
### openai_compare
|
|
932
|
-
|
|
933
|
-
Multi-option consensus analysis with GPT-5.
|
|
934
|
-
|
|
935
|
-
#### Schema
|
|
936
|
-
|
|
937
|
-
```typescript
|
|
938
|
-
{
|
|
939
|
-
topic: string; // REQUIRED
|
|
940
|
-
options: string[]; // REQUIRED - Options to compare
|
|
941
|
-
criteria?: string[]; // Evaluation criteria
|
|
942
|
-
includeRecommendation?: boolean; // Default: true
|
|
943
|
-
}
|
|
944
|
-
```
|
|
945
|
-
|
|
946
|
-
#### Example Calls
|
|
947
|
-
|
|
948
|
-
**Compare frameworks:**
|
|
949
|
-
```typescript
|
|
950
|
-
openai_compare({
|
|
951
|
-
topic: "JavaScript framework selection",
|
|
952
|
-
options: ["React", "Vue", "Svelte", "Angular"],
|
|
953
|
-
criteria: [
|
|
954
|
-
"Learning curve",
|
|
955
|
-
"Performance",
|
|
956
|
-
"Community support",
|
|
957
|
-
"Ecosystem maturity",
|
|
958
|
-
"Job market demand"
|
|
959
|
-
],
|
|
960
|
-
includeRecommendation: true
|
|
961
|
-
})
|
|
962
|
-
```
|
|
963
|
-
|
|
964
|
-
---
|
|
965
|
-
|
|
966
930
|
## Gemini Suite
|
|
967
931
|
|
|
968
932
|
### gemini_brainstorm
|
package/package.json
CHANGED
package/profiles/balanced.json
CHANGED
package/profiles/code_focus.json
CHANGED
|
@@ -13,8 +13,7 @@
|
|
|
13
13
|
"grok_architect": false,
|
|
14
14
|
"grok_brainstorm": false,
|
|
15
15
|
"grok_search": false,
|
|
16
|
-
"
|
|
17
|
-
"openai_compare": false,
|
|
16
|
+
"openai_reason": false,
|
|
18
17
|
"openai_brainstorm": false,
|
|
19
18
|
"openai_code_review": true,
|
|
20
19
|
"openai_explain": false,
|
package/profiles/full.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
{
|
|
2
|
-
"description": "All tools enabled for maximum capability (~Xk tokens,
|
|
2
|
+
"description": "All tools enabled for maximum capability (~Xk tokens, 31 tools)",
|
|
3
3
|
"tools": {
|
|
4
4
|
"think": true,
|
|
5
5
|
"focus": true,
|
|
@@ -13,8 +13,7 @@
|
|
|
13
13
|
"grok_architect": true,
|
|
14
14
|
"grok_brainstorm": true,
|
|
15
15
|
"grok_search": true,
|
|
16
|
-
"
|
|
17
|
-
"openai_compare": true,
|
|
16
|
+
"openai_reason": true,
|
|
18
17
|
"openai_brainstorm": true,
|
|
19
18
|
"openai_code_review": true,
|
|
20
19
|
"openai_explain": true,
|
package/profiles/minimal.json
CHANGED
|
@@ -13,8 +13,7 @@
|
|
|
13
13
|
"grok_architect": false,
|
|
14
14
|
"grok_brainstorm": false,
|
|
15
15
|
"grok_search": false,
|
|
16
|
-
"
|
|
17
|
-
"openai_compare": false,
|
|
16
|
+
"openai_reason": false,
|
|
18
17
|
"openai_brainstorm": false,
|
|
19
18
|
"openai_code_review": false,
|
|
20
19
|
"openai_explain": false,
|
|
@@ -13,8 +13,7 @@
|
|
|
13
13
|
"grok_architect": false,
|
|
14
14
|
"grok_brainstorm": false,
|
|
15
15
|
"grok_search": false,
|
|
16
|
-
"
|
|
17
|
-
"openai_compare": false,
|
|
16
|
+
"openai_reason": false,
|
|
18
17
|
"openai_brainstorm": false,
|
|
19
18
|
"openai_code_review": false,
|
|
20
19
|
"openai_explain": false,
|
package/smithery.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
# Smithery configuration file: https://smithery.ai/docs/config#smitheryyaml
|
|
2
2
|
name: "tachibot-mcp"
|
|
3
|
-
description: "Multi-model AI orchestration platform with
|
|
4
|
-
version: "2.0.
|
|
3
|
+
description: "Multi-model AI orchestration platform with 31 tools across Perplexity, Grok, OpenAI GPT-5, Gemini, and Qwen. Features YAML workflows, 5 token-optimized profiles (4k-20k), smart routing, and cost controls. Build complex AI pipelines with variable passing and parallel execution."
|
|
4
|
+
version: "2.0.6"
|
|
5
5
|
|
|
6
6
|
startCommand:
|
|
7
7
|
type: stdio
|
package/tools.config.json
CHANGED
|
@@ -25,7 +25,7 @@
|
|
|
25
25
|
"grok_brainstorm",
|
|
26
26
|
"grok_search"
|
|
27
27
|
],
|
|
28
|
-
"openai": ["
|
|
28
|
+
"openai": ["openai_brainstorm", "openai_reason", "openai_code_review", "openai_explain"],
|
|
29
29
|
"gemini": [
|
|
30
30
|
"gemini_brainstorm",
|
|
31
31
|
"gemini_analyze_code",
|
|
@@ -38,7 +38,12 @@
|
|
|
38
38
|
"workflow",
|
|
39
39
|
"list_workflows",
|
|
40
40
|
"create_workflow",
|
|
41
|
-
"visualize_workflow"
|
|
41
|
+
"visualize_workflow",
|
|
42
|
+
"workflow_start",
|
|
43
|
+
"continue_workflow",
|
|
44
|
+
"workflow_status",
|
|
45
|
+
"validate_workflow",
|
|
46
|
+
"validate_workflow_file"
|
|
42
47
|
],
|
|
43
48
|
"collaborative": ["pingpong", "qwen_competitive"]
|
|
44
49
|
},
|
|
@@ -59,8 +64,10 @@
|
|
|
59
64
|
"grok_architect": true,
|
|
60
65
|
"grok_brainstorm": true,
|
|
61
66
|
"grok_search": true,
|
|
62
|
-
"openai_compare": true,
|
|
63
67
|
"openai_brainstorm": true,
|
|
68
|
+
"openai_reason": true,
|
|
69
|
+
"openai_code_review": true,
|
|
70
|
+
"openai_explain": true,
|
|
64
71
|
"gemini_brainstorm": true,
|
|
65
72
|
"gemini_analyze_code": true,
|
|
66
73
|
"gemini_analyze_text": true,
|
|
@@ -74,6 +81,11 @@
|
|
|
74
81
|
"list_workflows": true,
|
|
75
82
|
"create_workflow": true,
|
|
76
83
|
"visualize_workflow": true,
|
|
84
|
+
"workflow_start": true,
|
|
85
|
+
"continue_workflow": true,
|
|
86
|
+
"workflow_status": true,
|
|
87
|
+
"validate_workflow": true,
|
|
88
|
+
"validate_workflow_file": true,
|
|
77
89
|
"pingpong": true,
|
|
78
90
|
"qwen_competitive": false
|
|
79
91
|
}
|
|
@@ -176,10 +176,12 @@ steps:
|
|
|
176
176
|
# ═══════════════════════════════════════════════════════════════════════════
|
|
177
177
|
|
|
178
178
|
- name: consensus
|
|
179
|
-
tool:
|
|
179
|
+
tool: openai_brainstorm
|
|
180
180
|
input:
|
|
181
|
-
|
|
182
|
-
|
|
181
|
+
problem: |
|
|
182
|
+
Synthesize final architecture recommendations for: ${query}
|
|
183
|
+
|
|
184
|
+
Combine these expert analyses into actionable recommendations:
|
|
183
185
|
- "Grok's SOLID analysis: ${grok-solid-analysis.output}"
|
|
184
186
|
- "Gemini's pattern analysis: ${gemini-pattern-analysis.output}"
|
|
185
187
|
- "Qwen's CQRS evaluation: ${qwen-cqrs-evaluation.output}"
|
|
@@ -15,7 +15,7 @@ variables:
|
|
|
15
15
|
steps:
|
|
16
16
|
# Step 1: Claude Thinking - Problem Framing
|
|
17
17
|
- name: claude-thinking
|
|
18
|
-
tool:
|
|
18
|
+
tool: openai_reason # Using GPT-5 Pro (high reasoning effort) for structured thinking
|
|
19
19
|
input:
|
|
20
20
|
query: |
|
|
21
21
|
Analyze and structure the brainstorming request: ${query}
|
package/workflows/pingpong.yaml
CHANGED
|
@@ -121,10 +121,12 @@ steps:
|
|
|
121
121
|
# ═══════════════════════════════════════════════════════════════════════════
|
|
122
122
|
|
|
123
123
|
- name: consensus
|
|
124
|
-
tool:
|
|
124
|
+
tool: openai_brainstorm
|
|
125
125
|
input:
|
|
126
|
-
|
|
127
|
-
|
|
126
|
+
problem: |
|
|
127
|
+
Synthesize final consensus on: ${query}
|
|
128
|
+
|
|
129
|
+
Analyze these perspectives and provide a unified recommendation:
|
|
128
130
|
- "Grok's analysis: ${challenge-grok.output}"
|
|
129
131
|
- "Gemini's synthesis: ${challenge-gemini.output}"
|
|
130
132
|
- "Qwen's technical review: ${challenge-qwen.output}"
|
|
@@ -25,7 +25,7 @@ workflow verifier --query "Python is faster than JavaScript for all use cases"
|
|
|
25
25
|
```
|
|
26
26
|
|
|
27
27
|
**Models Used:**
|
|
28
|
-
1. GPT-5 Mini (
|
|
28
|
+
1. GPT-5 Mini (openai_brainstorm)
|
|
29
29
|
2. Gemini 2.5 (gemini_analyze_text)
|
|
30
30
|
3. Grok 4.1 Fast (grok_code)
|
|
31
31
|
4. Qwen Coder (qwen_coder)
|
|
@@ -10,12 +10,15 @@ steps:
|
|
|
10
10
|
# Each model gets 10k tokens, saved to disk
|
|
11
11
|
|
|
12
12
|
- name: verify_gpt5_mini
|
|
13
|
-
tool:
|
|
13
|
+
tool: openai_brainstorm
|
|
14
14
|
input:
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
15
|
+
problem: |
|
|
16
|
+
Verify the following claim or statement:
|
|
17
|
+
${query}
|
|
18
|
+
|
|
19
|
+
Provide verification analysis including accuracy assessment, evidence, and confidence level.
|
|
20
|
+
style: "systematic"
|
|
21
|
+
quantity: 3
|
|
19
22
|
saveToFile: true
|
|
20
23
|
maxTokens: 10000
|
|
21
24
|
output:
|
|
@@ -8,10 +8,10 @@ version: "3.0"
|
|
|
8
8
|
settings:
|
|
9
9
|
optimization:
|
|
10
10
|
enabled: true
|
|
11
|
-
smartRouting:
|
|
11
|
+
smartRouting: false # Disabled - was selecting invalid gpt-5-nano model
|
|
12
12
|
compressPrompts: false
|
|
13
13
|
autoSynthesis:
|
|
14
|
-
enabled:
|
|
14
|
+
enabled: false # Disabled for testing
|
|
15
15
|
tokenThreshold: 25000
|
|
16
16
|
checkpointInterval: 12000
|
|
17
17
|
synthesisTool: 'gemini_analyze_text'
|
|
@@ -195,7 +195,7 @@ steps:
|
|
|
195
195
|
input:
|
|
196
196
|
query: "${query} - explore creative applications across domains"
|
|
197
197
|
mode: "code-brainstorm"
|
|
198
|
-
models: ["gpt-5.1", "gemini-2.5", "grok-4-fast-reasoning"]
|
|
198
|
+
models: ["gpt-5.1", "gemini-2.5-flash", "grok-4-1-fast-reasoning"]
|
|
199
199
|
rounds: 3
|
|
200
200
|
context: "Research: ${research_findings}\nIdeas: ${innovative_solutions}\nPatterns: ${patterns}"
|
|
201
201
|
saveToFile: true
|