dual-brain 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68) hide show
  1. package/AGENTS.md +97 -0
  2. package/CLAUDE.md +147 -0
  3. package/LICENSE +21 -0
  4. package/README.md +197 -0
  5. package/agents/implementer.md +22 -0
  6. package/agents/researcher.md +25 -0
  7. package/agents/verifier.md +30 -0
  8. package/bin/dual-brain.mjs +2868 -0
  9. package/hooks/auto-update-wrapper.mjs +102 -0
  10. package/hooks/auto-update.sh +67 -0
  11. package/hooks/budget-balancer.mjs +679 -0
  12. package/hooks/control-panel.mjs +1195 -0
  13. package/hooks/cost-logger.mjs +286 -0
  14. package/hooks/cost-report.mjs +351 -0
  15. package/hooks/decision-ledger.mjs +299 -0
  16. package/hooks/dual-brain-review.mjs +404 -0
  17. package/hooks/dual-brain-think.mjs +393 -0
  18. package/hooks/enforce-tier.mjs +469 -0
  19. package/hooks/failure-detector.mjs +138 -0
  20. package/hooks/gpt-work-dispatcher.mjs +512 -0
  21. package/hooks/head-guard.mjs +105 -0
  22. package/hooks/health-check.mjs +444 -0
  23. package/hooks/install-git-hooks.mjs +106 -0
  24. package/hooks/model-registry.mjs +859 -0
  25. package/hooks/plan-generator.mjs +544 -0
  26. package/hooks/profiles.mjs +254 -0
  27. package/hooks/quality-gate.mjs +355 -0
  28. package/hooks/risk-classifier.mjs +41 -0
  29. package/hooks/session-report.mjs +514 -0
  30. package/hooks/setup-wizard.mjs +130 -0
  31. package/hooks/summary-checkpoint.mjs +432 -0
  32. package/hooks/task-classifier.mjs +328 -0
  33. package/hooks/test-orchestrator.mjs +1077 -0
  34. package/hooks/vibe-memory.mjs +463 -0
  35. package/hooks/vibe-router.mjs +387 -0
  36. package/hooks/wave-orchestrator.mjs +1397 -0
  37. package/install.mjs +1541 -0
  38. package/mcp-server/README.md +81 -0
  39. package/mcp-server/index.mjs +388 -0
  40. package/orchestrator.json +215 -0
  41. package/package.json +108 -0
  42. package/playbooks/debug.json +49 -0
  43. package/playbooks/refactor.json +57 -0
  44. package/playbooks/security-audit.json +57 -0
  45. package/playbooks/security.json +38 -0
  46. package/playbooks/test-gen.json +48 -0
  47. package/plugin.json +22 -0
  48. package/review-rules.md +17 -0
  49. package/shell-hook.sh +26 -0
  50. package/skills/go.md +22 -0
  51. package/skills/review.md +19 -0
  52. package/skills/status.md +13 -0
  53. package/skills/think.md +22 -0
  54. package/src/brief.mjs +266 -0
  55. package/src/decide.mjs +635 -0
  56. package/src/decompose.mjs +331 -0
  57. package/src/detect.mjs +345 -0
  58. package/src/dispatch.mjs +942 -0
  59. package/src/health.mjs +253 -0
  60. package/src/index.mjs +44 -0
  61. package/src/install-hooks.mjs +100 -0
  62. package/src/playbook.mjs +257 -0
  63. package/src/profile.mjs +990 -0
  64. package/src/redact.mjs +192 -0
  65. package/src/repo.mjs +292 -0
  66. package/src/session.mjs +1036 -0
  67. package/src/tui.mjs +197 -0
  68. package/src/update-check.mjs +35 -0
@@ -0,0 +1,328 @@
1
+ #!/usr/bin/env node
2
+ /**
3
+ * task-classifier.mjs — Analyze work descriptions and return model + effort + mode config.
4
+ *
5
+ * Uses model-registry capabilities to make informed routing decisions:
6
+ * - Which model (per provider) handles this task best
7
+ * - What effort/reasoning level to use
8
+ * - Whether to enable extended thinking, fast mode, extended context, web search
9
+ * - How to dispatch (Claude Agent vs Codex exec)
10
+ *
11
+ * Exports: classifyTask, selectModelEffort, INTENTS
12
+ * CLI: node hooks/task-classifier.mjs "description" [--files a,b] [--budget-pressure 0.8]
13
+ */
14
+
15
+ import { classifyRisk, extractPaths } from './risk-classifier.mjs';
16
+ import {
17
+ MODEL_CAPABILITIES, getCapabilities, getDispatchConfig,
18
+ recommendEffort, shouldUseExtendedContext, shouldUseFastMode,
19
+ getBestModelFor,
20
+ } from './model-registry.mjs';
21
+
22
+ // ─── Intent definitions ───────────────────────────────────────────────────────
23
+
24
+ const INTENTS = {
25
+ search: /\b(grep|find|locate|where is|where are|list|explore|read|look up|look for|check|what is|show me|display)\b/i,
26
+ explain: /\b(explain|walk me through|what does|how does|describe|summarize|understand|clarify)\b/i,
27
+ compare: /\b(compare|contrast|difference|versus|vs\.?|trade.?off|which is better|pros and cons|benchmark|performance)\b/i,
28
+ document: /\b(document|docs?|readme|jsdoc|typedoc|api docs|write docs|add docs|update docs)\b/i,
29
+ format: /\b(format|lint|prettier|style|indent|whitespace|typo|typos|comment[s]?|reformat)\b/i,
30
+ planning: /\b(plan|roadmap|strategy|prioritize|break down|decompose|prioritise)\b/i,
31
+ architecture: /\b(design|architect|architecture|propose|how should we|system design|system architecture)\b/i,
32
+ security: /\b(auth|credential|secret|token|password|encrypt|permission[s]?|vulnerability|vulnerabilities|CVE|oauth|jwt|api.?key)\b/i,
33
+ review: /\b(review|audit|check for issues|evaluate|assess|inspect code|code review)\b/i,
34
+ debug: /\b(debug|investigate|why (is|does|isn't|doesn't)|trace|diagnose|figure out|broken|not working|failing|regression)\b/i,
35
+ test: /\b(test[s]?|spec[s]?|add test|fix test|test coverage|unit test|e2e|integration test|jest|vitest|mocha)\b/i,
36
+ refactor: /\b(refactor|restructure|reorganize|reorganise|extract|split|consolidate|clean up|cleanup|dedupe|dedup)\b/i,
37
+ edit: /\b(fix|add|update|modify|change|rename|move|replace|write|implement|create|remove|delete|insert)\b/i,
38
+ };
39
+
40
+ const INTENT_PRIORITY = [
41
+ 'security', 'architecture', 'planning', 'compare', 'review',
42
+ 'debug', 'refactor', 'test', 'explain', 'document', 'format', 'search', 'edit',
43
+ ];
44
+
45
+ // ─── Risk keyword detection (description-level) ──────────────────────────────
46
+
47
+ const RISK_KEYWORDS = [
48
+ { level: 'critical', regex: /\b(auth|secret|credential|token|password|encrypt|certificate|oauth|jwt|api.?key|vulnerability|CVE)\b/i },
49
+ { level: 'high', regex: /\b(billing|payment|migration|deploy|ci.?cd|security|permission|policy|schema|openapi|swagger|production|prod)\b/i },
50
+ { level: 'medium', regex: /\b(test|spec|config|shared|util|lib|integration|public.?api)\b/i },
51
+ { level: 'low', regex: /\b(readme|docs?|comment|format|lint|changelog|typo|whitespace)\b/i },
52
+ ];
53
+
54
+ const LEVEL_ORDER = { critical: 3, high: 2, medium: 1, low: 0 };
55
+
56
+ function detectKeywordRisk(description) {
57
+ for (const { level, regex } of RISK_KEYWORDS) {
58
+ if (regex.test(description)) return level;
59
+ }
60
+ return 'low';
61
+ }
62
+
63
+ function higherRisk(a, b) {
64
+ return LEVEL_ORDER[a] >= LEVEL_ORDER[b] ? a : b;
65
+ }
66
+
67
+ // ─── classifyTask ─────────────────────────────────────────────────────────────
68
+
69
+ function classifyTask(description, options = {}) {
70
+ const { files = [], priorFailures = 0 } = options;
71
+
72
+ // 1. Intent detection
73
+ let intent = 'edit';
74
+ for (const key of INTENT_PRIORITY) {
75
+ if (INTENTS[key].test(description)) {
76
+ intent = key;
77
+ break;
78
+ }
79
+ }
80
+
81
+ // 2. Risk detection
82
+ const allPaths = [...files, ...extractPaths(description)];
83
+ const pathRisk = allPaths.length > 0 ? classifyRisk(allPaths).level : 'low';
84
+ const keywordRisk = detectKeywordRisk(description);
85
+ const risk = higherRisk(pathRisk, keywordRisk);
86
+
87
+ // 3. File count
88
+ const fileCount = files.length;
89
+
90
+ // 4. Complexity detection
91
+ let complexity;
92
+ const isAmbiguous = description.length > 120 || /\b(and also|as well as|plus|additionally|also)\b/i.test(description);
93
+
94
+ if (priorFailures >= 2 || intent === 'architecture' || risk === 'critical' || fileCount >= 6 || isAmbiguous && risk === 'critical') {
95
+ complexity = 'complex';
96
+ } else if (fileCount >= 3 || intent === 'refactor' || intent === 'debug' || risk === 'high' || isAmbiguous) {
97
+ complexity = 'moderate';
98
+ } else if (fileCount <= 2 && (risk === 'low' || risk === 'medium')) {
99
+ if (intent === 'format' || fileCount <= 1 && risk === 'low') {
100
+ complexity = 'trivial';
101
+ } else {
102
+ complexity = 'simple';
103
+ }
104
+ } else {
105
+ complexity = 'moderate';
106
+ }
107
+
108
+ // 5. Effort selection
109
+ const baseEffort = { trivial: 'low', simple: 'medium', moderate: 'high', complex: 'high' }[complexity];
110
+ const effortOrder = ['low', 'medium', 'high', 'xhigh'];
111
+
112
+ function bumpEffort(e, n = 1) {
113
+ return effortOrder[Math.min(effortOrder.indexOf(e) + n, effortOrder.length - 1)];
114
+ }
115
+
116
+ let effort = baseEffort;
117
+
118
+ if (risk === 'critical' && LEVEL_ORDER[effort] < LEVEL_ORDER['high']) effort = 'high';
119
+
120
+ if (priorFailures >= 2) {
121
+ effort = 'xhigh';
122
+ } else if (priorFailures === 1) {
123
+ effort = bumpEffort(effort, 1);
124
+ }
125
+
126
+ if (intent === 'format' || intent === 'search') {
127
+ if (LEVEL_ORDER[effort] > LEVEL_ORDER['medium']) effort = 'medium';
128
+ }
129
+ if ((intent === 'architecture' || intent === 'security') && LEVEL_ORDER[effort] < LEVEL_ORDER['high']) {
130
+ effort = 'high';
131
+ }
132
+
133
+ // 6. Reason
134
+ const reasons = [];
135
+ if (fileCount > 0) reasons.push(`${fileCount} file(s)`);
136
+ if (risk !== 'low') reasons.push(`${risk} risk`);
137
+ if (priorFailures > 0) reasons.push(`${priorFailures} prior failure(s)`);
138
+ reasons.push(`intent=${intent}, complexity=${complexity}`);
139
+ const reason = reasons.join('; ');
140
+
141
+ return { intent, risk, complexity, fileCount, effort, reason };
142
+ }
143
+
144
+ // ─── selectModelEffort ────────────────────────────────────────────────────────
145
+
146
+ function selectModelEffort(taskProfile, options = {}) {
147
+ const { budgetPressure = 0, userBudgetTier = '$100', isIterating = false, estimatedTokens = 0 } = options;
148
+ const { intent, risk, effort, complexity } = taskProfile;
149
+
150
+ // ── Intent classification for routing ──
151
+ const thinkIntents = ['architecture', 'security', 'review', 'planning', 'compare'];
152
+ const searchIntents = ['search', 'format', 'explain'];
153
+ const lightIntents = ['document', 'explain', 'format', 'search'];
154
+
155
+ const needsOpus = thinkIntents.includes(intent)
156
+ || risk === 'critical'
157
+ || effort === 'xhigh';
158
+
159
+ const needsHaiku = searchIntents.includes(intent) && effort === 'low';
160
+
161
+ let claudeModel = needsOpus ? 'opus' : needsHaiku ? 'haiku' : 'sonnet';
162
+
163
+ // ── Claude effort (from registry, null-safe for haiku) ──
164
+ const caps = getCapabilities(claudeModel);
165
+ let claudeEffort = caps?.reasoning?.effortLevels
166
+ ? (recommendEffort(claudeModel, complexity, risk) || effort)
167
+ : null;
168
+
169
+ // ── Claude modes ──
170
+ const claudeModes = {
171
+ extendedThinking: caps?.reasoning?.extendedThinking
172
+ && (complexity === 'moderate' || complexity === 'complex')
173
+ && !lightIntents.includes(intent),
174
+ fastMode: shouldUseFastMode(claudeModel, isIterating),
175
+ extendedContext: shouldUseExtendedContext(claudeModel, estimatedTokens),
176
+ ultrathink: claudeModel === 'opus'
177
+ && (risk === 'critical' || (complexity === 'complex' && thinkIntents.includes(intent))),
178
+ };
179
+
180
+ // ── OpenAI model selection (all models reachable) ──
181
+ let openaiModel;
182
+ if (needsOpus) {
183
+ openaiModel = 'gpt-5.5';
184
+ } else if (searchIntents.includes(intent) && effort === 'low') {
185
+ openaiModel = 'gpt-4.1-mini';
186
+ } else if (['edit', 'test', 'document'].includes(intent) && ['simple', 'trivial'].includes(complexity)) {
187
+ openaiModel = 'gpt-4.1';
188
+ } else if (intent === 'explain' && complexity !== 'trivial') {
189
+ openaiModel = 'gpt-5.2';
190
+ } else if (['edit', 'document'].includes(intent) && complexity === 'moderate') {
191
+ openaiModel = 'gpt-5.3-codex';
192
+ } else if (intent === 'test' && complexity === 'moderate') {
193
+ openaiModel = 'gpt-5.4-mini';
194
+ } else if (['refactor', 'debug'].includes(intent)) {
195
+ openaiModel = complexity === 'complex' ? 'gpt-5.4' : 'gpt-5.3-codex';
196
+ } else {
197
+ openaiModel = 'gpt-5.4';
198
+ }
199
+
200
+ // ── OpenAI effort (from registry) ──
201
+ let openaiEffort = recommendEffort(openaiModel, complexity, risk) || effort;
202
+
203
+ // ── OpenAI modes ──
204
+ const openaiCaps = getCapabilities(openaiModel);
205
+ const openaiModes = {
206
+ webSearch: openaiCaps?.modes?.webSearch ?? false,
207
+ sandbox: openaiCaps?.modes?.sandbox?.[
208
+ thinkIntents.includes(intent) ? 'think' : searchIntents.includes(intent) ? 'search' : 'execute'
209
+ ] ?? 'danger-full-access',
210
+ };
211
+
212
+ // ── Outcome learning override ──
213
+ // If we have enough empirical data, let it influence model selection
214
+ const empiricalClaude = getBestModelFor(intent, 'claude', { minSamples: 5 });
215
+ if (empiricalClaude && empiricalClaude.successRate !== null && empiricalClaude.successRate > 0.8) {
216
+ const caps = getCapabilities(empiricalClaude.model);
217
+ if (caps && !caps.avoidFor?.includes(intent)) {
218
+ claudeModel = empiricalClaude.model;
219
+ }
220
+ }
221
+
222
+ const empiricalOpenai = getBestModelFor(intent, 'openai', { minSamples: 5 });
223
+ if (empiricalOpenai && empiricalOpenai.successRate !== null && empiricalOpenai.successRate > 0.8) {
224
+ const caps = getCapabilities(empiricalOpenai.model);
225
+ if (caps && !caps.avoidFor?.includes(intent)) {
226
+ openaiModel = empiricalOpenai.model;
227
+ }
228
+ }
229
+
230
+ // ── Budget pressure adjustments ──
231
+ const reasons = [];
232
+ const isHighStakes = risk === 'critical' || risk === 'high';
233
+ const openaiModelRank = [
234
+ 'gpt-4.1-mini', 'gpt-4.1', 'gpt-5.2', 'gpt-5.4-mini',
235
+ 'gpt-5.3-codex', 'gpt-5.3-codex-spark', 'gpt-5.4', 'gpt-5.5',
236
+ ];
237
+
238
+ if (budgetPressure > 0.9 && !isHighStakes) {
239
+ claudeModel = claudeModel === 'opus' ? 'sonnet' : 'haiku';
240
+ const oaiIdx = openaiModelRank.indexOf(openaiModel);
241
+ openaiModel = openaiModelRank[Math.max(0, oaiIdx - 2)] || 'gpt-4.1-mini';
242
+ claudeModes.fastMode = false;
243
+ claudeModes.extendedContext = false;
244
+ claudeModes.extendedThinking = false;
245
+ reasons.push('near limit, aggressive downgrade for non-critical task');
246
+ } else if (budgetPressure > 0.7 && !isHighStakes) {
247
+ claudeModel = claudeModel === 'opus' ? 'sonnet' : claudeModel === 'sonnet' ? 'haiku' : 'haiku';
248
+ const oaiIdx = openaiModelRank.indexOf(openaiModel);
249
+ openaiModel = openaiModelRank[Math.max(0, oaiIdx - 1)] || 'gpt-4.1-mini';
250
+ claudeModes.fastMode = false;
251
+ reasons.push('downgraded due to budget pressure');
252
+ }
253
+
254
+ // Recalculate efforts after potential model change
255
+ const newCaps = getCapabilities(claudeModel);
256
+ claudeEffort = newCaps?.reasoning?.effortLevels
257
+ ? (recommendEffort(claudeModel, complexity, risk) || effort)
258
+ : null;
259
+ openaiEffort = recommendEffort(openaiModel, complexity, risk) || effort;
260
+
261
+ // ── Preferred provider (think→claude, isolated execute→openai) ──
262
+ const preferred = thinkIntents.includes(intent) ? 'claude' : 'openai';
263
+
264
+ // ── Dual-brain recommendation ──
265
+ const dualBrain = risk === 'critical'
266
+ || (thinkIntents.includes(intent) && (complexity === 'complex' || complexity === 'moderate'))
267
+ || intent === 'security'
268
+ || (intent === 'review' && risk !== 'low')
269
+ || (intent === 'refactor' && risk === 'critical');
270
+
271
+ if (reasons.length === 0) {
272
+ reasons.push(`${claudeModel}/${openaiModel} matched to ${intent} @ ${complexity} complexity`);
273
+ }
274
+ if (empiricalClaude?.successRate !== null) reasons.push(`claude empirical: ${empiricalClaude.model} ${Math.round(empiricalClaude.successRate * 100)}%`);
275
+ if (empiricalOpenai?.successRate !== null) reasons.push(`openai empirical: ${empiricalOpenai.model} ${Math.round(empiricalOpenai.successRate * 100)}%`);
276
+
277
+ return {
278
+ claude: {
279
+ model: claudeModel,
280
+ effort: claudeEffort,
281
+ modes: claudeModes,
282
+ dispatch: getDispatchConfig(claudeModel),
283
+ },
284
+ openai: {
285
+ model: openaiModel,
286
+ effort: openaiEffort,
287
+ modes: openaiModes,
288
+ dispatch: getDispatchConfig(openaiModel),
289
+ },
290
+ preferred,
291
+ dualBrain,
292
+ reason: reasons.join('; '),
293
+ };
294
+ }
295
+
296
+ // ─── CLI ──────────────────────────────────────────────────────────────────────
297
+
298
+ if (process.argv[1] && new URL(import.meta.url).pathname === process.argv[1]) {
299
+ const args = process.argv.slice(2);
300
+ const description = args.find(a => !a.startsWith('--')) || '';
301
+ const filesArg = args.find(a => a.startsWith('--files=')) || args[args.indexOf('--files') + 1];
302
+ const budgetArg = args.find(a => a.startsWith('--budget-pressure=')) || args[args.indexOf('--budget-pressure') + 1];
303
+ const failuresArg = args.find(a => a.startsWith('--failures=')) || args[args.indexOf('--failures') + 1];
304
+
305
+ const files = (filesArg && !filesArg.startsWith('--'))
306
+ ? filesArg.replace(/^--files=/, '').split(',').map(f => f.trim())
307
+ : [];
308
+
309
+ const budgetPressure = budgetArg
310
+ ? parseFloat(budgetArg.replace(/^--budget-pressure=/, ''))
311
+ : 0;
312
+
313
+ const priorFailures = failuresArg
314
+ ? parseInt(failuresArg.replace(/^--failures=/, ''), 10)
315
+ : 0;
316
+
317
+ if (!description) {
318
+ console.error('Usage: node hooks/task-classifier.mjs "task description" [--files a,b] [--budget-pressure 0.8] [--failures 1]');
319
+ process.exit(1);
320
+ }
321
+
322
+ const profile = classifyTask(description, { files, priorFailures });
323
+ const selection = selectModelEffort(profile, { budgetPressure });
324
+
325
+ console.log(JSON.stringify({ profile, selection }, null, 2));
326
+ }
327
+
328
+ export { classifyTask, selectModelEffort, INTENTS };