opencode-model-router 1.1.4 → 1.1.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +20 -6
- package/package.json +1 -1
- package/tiers.json +58 -3
package/README.md
CHANGED
|
@@ -23,8 +23,8 @@ A keyword routing guide (`@fast→search/grep/read`, `@medium→impl/refactor/te
|
|
|
23
23
|
**Skip delegation overhead for trivial work.**
|
|
24
24
|
Single grep? One file read? The orchestrator executes directly — zero delegation cost, zero latency.
|
|
25
25
|
|
|
26
|
-
**Three routing modes for different budgets.**
|
|
27
|
-
`/budget normal` (balanced), `/budget budget` (aggressive savings, defaults everything to @fast), `/budget quality` (liberal use of stronger models). Mode persists across restarts.
|
|
26
|
+
**Four routing modes for different budgets.**
|
|
27
|
+
`/budget normal` (balanced), `/budget budget` (aggressive savings, defaults everything to @fast), `/budget quality` (liberal use of stronger models), `/budget deep` (heavy-first for long architecture/debug runs). Mode persists across restarts.
|
|
28
28
|
|
|
29
29
|
**Cost ratios in the prompt.**
|
|
30
30
|
Every tier carries its `costRatio` (fast=1x, medium=5x, heavy=20x) injected into the system prompt. The orchestrator sees the price before deciding. It picks the cheapest tier that can reliably handle the task.
|
|
@@ -278,6 +278,7 @@ Switch with `/budget <mode>`. Mode is persisted across restarts.
|
|
|
278
278
|
| `normal` | @medium | Balanced — routes by task complexity |
|
|
279
279
|
| `budget` | @fast | Aggressive savings — defaults cheap, escalates only when necessary |
|
|
280
280
|
| `quality` | @medium | Quality-first — liberal use of @medium/@heavy |
|
|
281
|
+
| `deep` | @heavy | Deep-analysis mode — heavy-first for architecture/debug/security with longer heavy runs |
|
|
281
282
|
|
|
282
283
|
```json
|
|
283
284
|
{
|
|
@@ -286,15 +287,28 @@ Switch with `/budget <mode>`. Mode is persisted across restarts.
|
|
|
286
287
|
"defaultTier": "fast",
|
|
287
288
|
"description": "Aggressive cost savings",
|
|
288
289
|
"overrideRules": [
|
|
289
|
-
"
|
|
290
|
-
"
|
|
291
|
-
"
|
|
290
|
+
"default→@fast unless edits/complex-reasoning needed",
|
|
291
|
+
"@medium ONLY: multi-file-edit/refactor/test-suite/build-fix",
|
|
292
|
+
"@heavy ONLY: user-requested OR ≥2 @medium failures"
|
|
293
|
+
]
|
|
294
|
+
},
|
|
295
|
+
"deep": {
|
|
296
|
+
"defaultTier": "heavy",
|
|
297
|
+
"description": "Deep analysis mode — prioritizes thorough architecture/debug work with long heavy runs",
|
|
298
|
+
"overrideRules": [
|
|
299
|
+
"default→@medium for implementation and multi-file changes",
|
|
300
|
+
"@heavy for architecture/debug/security/tradeoff-analysis by default",
|
|
301
|
+
"allow long heavy runs before fallback; avoid premature downshift",
|
|
302
|
+
"trivial(grep/read/glob)→direct,no-delegate",
|
|
303
|
+
"if task is composite: explore@fast then execute@heavy"
|
|
292
304
|
]
|
|
293
305
|
}
|
|
294
306
|
}
|
|
295
307
|
}
|
|
296
308
|
```
|
|
297
309
|
|
|
310
|
+
**Heavy tool-call budget:** `@heavy.steps=120` by default across presets (raised from 60) to reduce premature cutoffs on long architecture/debug tasks.
|
|
311
|
+
|
|
298
312
|
### Task taxonomy (`taskPatterns`)
|
|
299
313
|
|
|
300
314
|
Keyword routing guide injected into the system prompt. Customize to match your workflow:
|
|
@@ -381,7 +395,7 @@ Defines provider fallback order when a delegated task fails:
|
|
|
381
395
|
| `/preset` | List available presets |
|
|
382
396
|
| `/preset <name>` | Switch preset (e.g., `/preset openai`) |
|
|
383
397
|
| `/budget` | Show available modes and which is active |
|
|
384
|
-
| `/budget <mode>` | Switch routing mode (`normal`, `budget`, `quality`) |
|
|
398
|
+
| `/budget <mode>` | Switch routing mode (`normal`, `budget`, `quality`, `deep`) |
|
|
385
399
|
| `/annotate-plan [path]` | Annotate a plan file with `[tier:X]` tags for each step |
|
|
386
400
|
|
|
387
401
|
## Plan annotation
|
package/package.json
CHANGED
package/tiers.json
CHANGED
|
@@ -36,7 +36,7 @@
|
|
|
36
36
|
"variant": "max",
|
|
37
37
|
"costRatio": 20,
|
|
38
38
|
"description": "Opus 4.6 max for architecture, complex debugging, and security",
|
|
39
|
-
"steps": 60,
|
|
39
|
+
"steps": 120,
|
|
40
40
|
"prompt": "You are a senior architecture consultant. Analyze deeply, consider tradeoffs, and provide thorough reasoning. Be exhaustive in your analysis.",
|
|
41
41
|
"whenToUse": [
|
|
42
42
|
"Architecture decisions",
|
|
@@ -77,7 +77,7 @@
|
|
|
77
77
|
"variant": "xhigh",
|
|
78
78
|
"costRatio": 20,
|
|
79
79
|
"description": "GPT-5.3 Codex xhigh for architecture and complex tasks",
|
|
80
|
-
"steps": 60,
|
|
80
|
+
"steps": 120,
|
|
81
81
|
"prompt": "You are a senior architecture consultant. Analyze deeply, consider tradeoffs, and provide thorough reasoning.",
|
|
82
82
|
"whenToUse": [
|
|
83
83
|
"Architecture decisions",
|
|
@@ -120,7 +120,7 @@
|
|
|
120
120
|
"variant": "thinking",
|
|
121
121
|
"costRatio": 20,
|
|
122
122
|
"description": "Claude Opus 4.6 via GitHub Copilot for architecture, complex debugging, and security",
|
|
123
|
-
"steps": 60,
|
|
123
|
+
"steps": 120,
|
|
124
124
|
"prompt": "You are a senior architecture consultant. Analyze deeply, consider tradeoffs, and provide thorough reasoning. Be exhaustive in your analysis.",
|
|
125
125
|
"whenToUse": [
|
|
126
126
|
"Architecture decisions",
|
|
@@ -162,7 +162,51 @@
|
|
|
162
162
|
"model": "google/gemini-3-pro-preview",
|
|
163
163
|
"costRatio": 20,
|
|
164
164
|
"description": "Gemini 3 Pro Preview for architecture, complex debugging, and security",
|
|
165
|
+
"steps": 120,
|
|
166
|
+
"prompt": "You are a senior architecture consultant. Analyze deeply, consider tradeoffs, and provide thorough reasoning. Be exhaustive in your analysis.",
|
|
167
|
+
"whenToUse": [
|
|
168
|
+
"Architecture decisions",
|
|
169
|
+
"Complex debugging (after 2+ failures)",
|
|
170
|
+
"Security review",
|
|
171
|
+
"Performance optimization"
|
|
172
|
+
]
|
|
173
|
+
}
|
|
174
|
+
},
|
|
175
|
+
"hybrid": {
|
|
176
|
+
"fast": {
|
|
177
|
+
"model": "openai/gpt-5.3-codex-spark",
|
|
178
|
+
"costRatio": 1,
|
|
179
|
+
"description": "GPT-5.3 Codex Spark for exploration, search, and simple reads",
|
|
165
180
|
"steps": 30,
|
|
181
|
+
"prompt": "You are a fast exploration agent. Focus on speed and efficiency. Read files, search code, and return findings concisely. Do NOT make edits unless explicitly asked.",
|
|
182
|
+
"whenToUse": [
|
|
183
|
+
"Codebase exploration and search",
|
|
184
|
+
"Simple file reads and listing",
|
|
185
|
+
"Grep/glob operations",
|
|
186
|
+
"Quick lookups and research"
|
|
187
|
+
]
|
|
188
|
+
},
|
|
189
|
+
"medium": {
|
|
190
|
+
"model": "anthropic/claude-sonnet-4-6",
|
|
191
|
+
"variant": "max",
|
|
192
|
+
"costRatio": 5,
|
|
193
|
+
"description": "Claude Sonnet 4.6 max for implementation, refactoring, and tests",
|
|
194
|
+
"steps": 50,
|
|
195
|
+
"prompt": "You are an implementation agent. Write clean, production-quality code matching existing project patterns. Run linters/tests after changes when possible.",
|
|
196
|
+
"whenToUse": [
|
|
197
|
+
"Feature implementation",
|
|
198
|
+
"Refactoring",
|
|
199
|
+
"Writing tests",
|
|
200
|
+
"Code review",
|
|
201
|
+
"Bug fixes"
|
|
202
|
+
]
|
|
203
|
+
},
|
|
204
|
+
"heavy": {
|
|
205
|
+
"model": "anthropic/claude-opus-4-6",
|
|
206
|
+
"variant": "max",
|
|
207
|
+
"costRatio": 20,
|
|
208
|
+
"description": "Claude Opus 4.6 max for architecture, complex debugging, and security",
|
|
209
|
+
"steps": 120,
|
|
166
210
|
"prompt": "You are a senior architecture consultant. Analyze deeply, consider tradeoffs, and provide thorough reasoning. Be exhaustive in your analysis.",
|
|
167
211
|
"whenToUse": [
|
|
168
212
|
"Architecture decisions",
|
|
@@ -235,6 +279,17 @@
|
|
|
235
279
|
"@fast ONLY: trivial single-tool ops (1 grep/1 read)",
|
|
236
280
|
"prefer thoroughness over speed"
|
|
237
281
|
]
|
|
282
|
+
},
|
|
283
|
+
"deep": {
|
|
284
|
+
"defaultTier": "heavy",
|
|
285
|
+
"description": "Deep analysis mode — prioritizes thorough architecture/debug work with long heavy runs",
|
|
286
|
+
"overrideRules": [
|
|
287
|
+
"default→@medium for implementation and multi-file changes",
|
|
288
|
+
"@heavy for architecture/debug/security/tradeoff-analysis by default",
|
|
289
|
+
"allow long heavy runs before fallback; avoid premature downshift",
|
|
290
|
+
"trivial(grep/read/glob)→direct,no-delegate",
|
|
291
|
+
"if task is composite: explore@fast then execute@heavy"
|
|
292
|
+
]
|
|
238
293
|
}
|
|
239
294
|
},
|
|
240
295
|
"fallback": {
|