roadmodel 0.2.4__tar.gz → 0.2.6__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {roadmodel-0.2.4 → roadmodel-0.2.6}/PKG-INFO +1 -1
- {roadmodel-0.2.4 → roadmodel-0.2.6}/docs/catalog.json +219 -20
- {roadmodel-0.2.4 → roadmodel-0.2.6}/docs/model-selector.txt +178 -35
- {roadmodel-0.2.4/roadmodel/data → roadmodel-0.2.6/docs}/model-tier-cost-scale.md +34 -19
- {roadmodel-0.2.4 → roadmodel-0.2.6}/pyproject.toml +1 -1
- {roadmodel-0.2.4 → roadmodel-0.2.6}/roadmodel/data/catalog.json +219 -20
- {roadmodel-0.2.4 → roadmodel-0.2.6}/roadmodel/data/model-selector.txt +178 -35
- {roadmodel-0.2.4/docs → roadmodel-0.2.6/roadmodel/data}/model-tier-cost-scale.md +34 -19
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/__init__.py +1 -1
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/cli.py +34 -1
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/providers/google.py +8 -1
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/recommend.py +73 -11
- {roadmodel-0.2.4 → roadmodel-0.2.6}/.gitignore +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/LICENSE +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/NOTICE +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/README.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/docs/templates/phase-roadmap-template.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/docs/user-context.example.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/hatch_build.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/infra/README.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/infra/supabase/README.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/roadmodel/data/phase-roadmap-template.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/roadmodel/data/user-context.example.md +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/__main__.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/config.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/cost.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/errors.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/mcp_server.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/providers/__init__.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/providers/anthropic.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/providers/openai.py +0 -0
- {roadmodel-0.2.4 → roadmodel-0.2.6}/src/roadmodel/user_context.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: roadmodel
|
|
3
|
-
Version: 0.2.
|
|
3
|
+
Version: 0.2.6
|
|
4
4
|
Summary: BYO-key CLI that recommends the right AI model, platform, and settings for a prompt.
|
|
5
5
|
Project-URL: Homepage, https://roadmodel.ai
|
|
6
6
|
Project-URL: Repository, https://github.com/nathanramoscfa/roadmodel
|
|
@@ -1,9 +1,9 @@
|
|
|
1
1
|
{
|
|
2
2
|
"schema_version": "2",
|
|
3
|
-
"generated_at_utc": "2026-
|
|
3
|
+
"generated_at_utc": "2026-06-13T03:26:33Z",
|
|
4
4
|
"source_doc_sha256": {
|
|
5
|
-
"model-selector.txt": "
|
|
6
|
-
"model-tier-cost-scale.md": "
|
|
5
|
+
"model-selector.txt": "3678876fce07458df5b821be0cee45475797adab6c243150ac5630bf7169b23a",
|
|
6
|
+
"model-tier-cost-scale.md": "7e874453400fa3a6d5d9122f762abe654f9a9f565a307d9391143585b2eba451"
|
|
7
7
|
},
|
|
8
8
|
"models": [
|
|
9
9
|
{
|
|
@@ -23,10 +23,52 @@
|
|
|
23
23
|
"speed": "S"
|
|
24
24
|
},
|
|
25
25
|
"jurisdiction": "us",
|
|
26
|
-
"headline_benchmarks": "AA Intelligence Index 37.1; Output Speed
|
|
26
|
+
"headline_benchmarks": "AA Intelligence Index 37.1; Output Speed 143.0 tokens/s; AA-Omniscience -4.2; latency leader among Claude family",
|
|
27
27
|
"pricing_notes": "Hidden by default; Bedrock/Vertex: regional endpoints +10% surcharge; Cache: writes 1.25x, reads 0.1x",
|
|
28
28
|
"best_for": "Speed-optimized lowest-cost Claude model, ideal for simple completions, high-volume repetitive tasks, and latency-sensitive workflows where a lightweight capable response matters more than deep reasoning"
|
|
29
29
|
},
|
|
30
|
+
{
|
|
31
|
+
"id": "claude-fable-5",
|
|
32
|
+
"name": "Fable 5",
|
|
33
|
+
"input_price_per_1m": 10.0,
|
|
34
|
+
"output_price_per_1m": 50.0,
|
|
35
|
+
"cache_read_per_1m": null,
|
|
36
|
+
"tier_cost": "very-high",
|
|
37
|
+
"tiers": {
|
|
38
|
+
"coding": "S",
|
|
39
|
+
"planning": "S",
|
|
40
|
+
"agentic": "S",
|
|
41
|
+
"multimodal": "S",
|
|
42
|
+
"long-context": "S",
|
|
43
|
+
"knowledge": "S",
|
|
44
|
+
"speed": "D"
|
|
45
|
+
},
|
|
46
|
+
"jurisdiction": "us",
|
|
47
|
+
"headline_benchmarks": "AA Intelligence Index 64.9 (#1); HLE 53.3% (#1); Terminal-Bench Hard 62.9 (#1)",
|
|
48
|
+
"pricing_notes": "Requires data retention approval for Enterprise customers, Teams and individual customers with Privacy Mode enabled; Anthropic stores agent input and output data for harm-prevention processes; this data is not used to train or improve Anthropic models or products; Requests that trip a security guardrail are automatically routed to Claude Opus; About 2x the cost of Claude Opus 4.8; Requires Max Mode on request-based plans",
|
|
49
|
+
"best_for": "Anthropic's new top-of-line Fable family flagship (no predecessor) \u2014 S-tier across coding, planning, agentic, multimodal, long-context, and knowledge, leading HLE (53.3%) and Terminal-Bench Hard (62.9) with state-of-the-art vision and a 1M default context; about 2x the cost of Opus 4.8 and latency-slow (output ~64 tokens/s), so reserve for the hardest reasoning, agentic, and vision work where maximum capability outweighs cost and speed; security-guardrail trips auto-route to Opus. Tier profile sourced from the catalog cron's 2026-06-11 dry-run reconciliation against the live benchmark sources (\u03c4\u00b2-bench retail not yet published for this model), pending editorial confirmation in the next refresh."
|
|
50
|
+
},
|
|
51
|
+
{
|
|
52
|
+
"id": "codestral",
|
|
53
|
+
"name": "Codestral",
|
|
54
|
+
"input_price_per_1m": 0.3,
|
|
55
|
+
"output_price_per_1m": 0.9,
|
|
56
|
+
"cache_read_per_1m": null,
|
|
57
|
+
"tier_cost": "low",
|
|
58
|
+
"tiers": {
|
|
59
|
+
"coding": "B",
|
|
60
|
+
"planning": "C",
|
|
61
|
+
"agentic": "C",
|
|
62
|
+
"multimodal": "D",
|
|
63
|
+
"long-context": "B",
|
|
64
|
+
"knowledge": "C",
|
|
65
|
+
"speed": "A"
|
|
66
|
+
},
|
|
67
|
+
"jurisdiction": "eu",
|
|
68
|
+
"headline_benchmarks": "Mistral's code-specialist model; fast low-latency completion / fill-in-the-middle across many languages with a large code context window; specific public benchmark numbers pending",
|
|
69
|
+
"pricing_notes": "Provider-direct Mistral API per-token pricing (not via the Cursor pool); eu-jurisdiction; prices manually maintained (Mistral publishes no machine-readable price source)",
|
|
70
|
+
"best_for": "Mistral's dedicated code model \u2014 fast, cheap ($0.90/M output) code completion and fill-in-the-middle under the EU jurisdiction, for autocomplete-style / high-throughput coding loops where an EU operator and low latency matter more than top-tier agentic reasoning. Reached via the `mistral-api` method (provider-direct per-token) with a mistral-api-key; prefer mistral-medium-3.5 for reasoning-heavy coding, codestral for fast bounded completions."
|
|
71
|
+
},
|
|
30
72
|
{
|
|
31
73
|
"id": "composer-2",
|
|
32
74
|
"name": "Composer 2 (Fast)",
|
|
@@ -69,6 +111,48 @@
|
|
|
69
111
|
"pricing_notes": "-",
|
|
70
112
|
"best_for": "Composer 2's successor at the same output price \u2014 Cursor's purpose-built multi-file agentic editor with frontier-level coding quality and speed-optimized inference; prefer over Composer 2 when both are available since 2.5 supersedes 2 within the same series per the equal-output-price replacement rule (Composer 2 is now Hidden by default on Cursor's pricing page)"
|
|
71
113
|
},
|
|
114
|
+
{
|
|
115
|
+
"id": "deepseek-v4-flash",
|
|
116
|
+
"name": "DeepSeek-V4-Flash",
|
|
117
|
+
"input_price_per_1m": 0.14,
|
|
118
|
+
"output_price_per_1m": 0.28,
|
|
119
|
+
"cache_read_per_1m": null,
|
|
120
|
+
"tier_cost": "low",
|
|
121
|
+
"tiers": {
|
|
122
|
+
"coding": "A",
|
|
123
|
+
"planning": "B",
|
|
124
|
+
"agentic": "B",
|
|
125
|
+
"multimodal": "D",
|
|
126
|
+
"long-context": "B",
|
|
127
|
+
"knowledge": "B",
|
|
128
|
+
"speed": "A"
|
|
129
|
+
},
|
|
130
|
+
"jurisdiction": "cn",
|
|
131
|
+
"headline_benchmarks": "AA Intelligence Index 47 (reasoning, max effort) \u2014 independently measured by Artificial Analysis; SWE-bench Verified 79.0% (DeepSeek-reported); 1M-token context; text-only (no image input); ~90 tokens/s",
|
|
132
|
+
"pricing_notes": "Provider-direct DeepSeek API per-token pricing (not via the Cursor pool); cache-hit input $0.0028/M",
|
|
133
|
+
"best_for": "DeepSeek's V4-Flash \u2014 the fast (~90 tokens/s), cheapest DeepSeek variant ($0.28/M output) with a 1M-token context window, for high-throughput / latency-sensitive text and code work under the cn jurisdiction with a deepseek-api-key. Mid-pack general intelligence (Artificial Analysis Intelligence Index 47) paired with a strong, DeepSeek-reported coding result (SWE-bench Verified 79.0%) \u2014 rated coding-A on that basis with the rest of its profile B-tier; text-only (no multimodal). Reached via the `deepseek-api` method (provider-direct per-token). Pick V4-Pro over V4-Flash when reasoning depth or the strongest coding matters; pick V4-Flash when speed and the lowest cost dominate."
|
|
134
|
+
},
|
|
135
|
+
{
|
|
136
|
+
"id": "deepseek-v4-pro",
|
|
137
|
+
"name": "DeepSeek-V4-Pro",
|
|
138
|
+
"input_price_per_1m": 0.435,
|
|
139
|
+
"output_price_per_1m": 0.87,
|
|
140
|
+
"cache_read_per_1m": null,
|
|
141
|
+
"tier_cost": "low",
|
|
142
|
+
"tiers": {
|
|
143
|
+
"coding": "A",
|
|
144
|
+
"planning": "A",
|
|
145
|
+
"agentic": "A",
|
|
146
|
+
"multimodal": "D",
|
|
147
|
+
"long-context": "A",
|
|
148
|
+
"knowledge": "A",
|
|
149
|
+
"speed": "C"
|
|
150
|
+
},
|
|
151
|
+
"jurisdiction": "cn",
|
|
152
|
+
"headline_benchmarks": "AA Intelligence Index 52 (reasoning, max effort) \u2014 independently measured by Artificial Analysis; SWE-bench Verified 80.6%, LiveCodeBench 93.5, Terminal-Bench 2.0 67.9, Codeforces CodeElo 3206, Putnam-2025 120/120 (DeepSeek-reported); 1M-token context; text-only (no image input); ~46 tokens/s (notably slow)",
|
|
153
|
+
"pricing_notes": "Provider-direct DeepSeek API per-token pricing (not via the Cursor pool); cache-hit input $0.003625/M",
|
|
154
|
+
"best_for": "DeepSeek's V4-Pro flagship \u2014 a very low-cost ($0.87/M output), cn-jurisdiction reasoning model with a 1M-token context window and thinking mode on by default. Strong general intelligence (Artificial Analysis Intelligence Index 52, just below Grok 4.3) and a frontier-approaching coding profile (SWE-bench Verified 80.6%, LiveCodeBench 93.5, Codeforces CodeElo 3206) \u2014 these coding numbers are DeepSeek-reported, so it is rated coding-A rather than S pending an independent SWE-bench leaderboard entry. Text-only (no multimodal) and notably slow (~46 tokens/s), so not for latency-sensitive or image work. Reached via the `deepseek-api` method (provider-direct per-token, not the Cursor pool) when the cn jurisdiction is acceptable and a deepseek-api-key is configured \u2014 the cheapest A-tier coding / reasoning option in the catalog."
|
|
155
|
+
},
|
|
72
156
|
{
|
|
73
157
|
"id": "gemini-2.5-flash",
|
|
74
158
|
"name": "Gemini 2.5 Flash",
|
|
@@ -149,7 +233,7 @@
|
|
|
149
233
|
"speed": "B"
|
|
150
234
|
},
|
|
151
235
|
"jurisdiction": "us",
|
|
152
|
-
"headline_benchmarks": "AA Intelligence Index 57.2 (#3); AA-Omniscience 32.9 (#1); HLE 44.7% (#1); LMArena Text Elo 1482.
|
|
236
|
+
"headline_benchmarks": "AA Intelligence Index 57.2 (#3); AA-Omniscience 32.9 (#1); HLE 44.7% (#1); LMArena Text Elo 1482.0 (#4); 1M-token context",
|
|
153
237
|
"pricing_notes": "-",
|
|
154
238
|
"best_for": "True native multimodal understanding (text, image, video, audio, and code in a single pass), 1M-token context optimized for heterogeneous inputs, strong agentic multi-step tool use, and synthesizing insights across large mixed-media datasets or sprawling document corpora \u2014 the obvious choice whenever multimodal or long-context is the primary category"
|
|
155
239
|
},
|
|
@@ -170,7 +254,7 @@
|
|
|
170
254
|
"speed": "S"
|
|
171
255
|
},
|
|
172
256
|
"jurisdiction": "us",
|
|
173
|
-
"headline_benchmarks": "AA Intelligence Index 55.3 (high reasoning); \u03c4\u00b2-bench retail pass_1 45.6 (Gemini 3.5 Flash); Output Speed
|
|
257
|
+
"headline_benchmarks": "AA Intelligence Index 55.3 (high reasoning); \u03c4\u00b2-bench retail pass_1 45.6 (Gemini 3.5 Flash); Output Speed 203.7 tokens/s",
|
|
174
258
|
"pricing_notes": "-",
|
|
175
259
|
"best_for": "Auto-added cheap-tier Google model; pending editorial best-for refinement."
|
|
176
260
|
},
|
|
@@ -296,7 +380,7 @@
|
|
|
296
380
|
"speed": "B"
|
|
297
381
|
},
|
|
298
382
|
"jurisdiction": "us",
|
|
299
|
-
"headline_benchmarks": "AA Intelligence Index 56.8 (#4); LMArena Text Elo
|
|
383
|
+
"headline_benchmarks": "AA Intelligence Index 56.8 (#4); LMArena Text Elo 1452.5 (#23); GPT-5.4 (xhigh) Output Speed 86.1 tokens/s; lowest factual error rate among GPT models",
|
|
300
384
|
"pricing_notes": "Hidden by default; Requires Max Mode on request-based plans; Agentic and reasoning capabilities; 90% discount on cached input tokens; Fast mode is 15% faster with 2x pricing; Long context (Max Mode) supports up to 1M tokens with 2x input pricing",
|
|
301
385
|
"best_for": "Broadest professional domain expertise (outperforms human specialists in 83% of occupations), native computer-use capability surpassing human baselines, lowest factual error rate among GPT models, and cross-domain knowledge work requiring deep real-world accuracy and grounding"
|
|
302
386
|
},
|
|
@@ -317,7 +401,7 @@
|
|
|
317
401
|
"speed": "A"
|
|
318
402
|
},
|
|
319
403
|
"jurisdiction": "us",
|
|
320
|
-
"headline_benchmarks": "AA Intelligence Index 48.9 (xhigh); Output Speed
|
|
404
|
+
"headline_benchmarks": "AA Intelligence Index 48.9 (xhigh); Output Speed 180.8 tokens/s; HLE 26.6% (GPT-5.4-mini xhigh)",
|
|
321
405
|
"pricing_notes": "Hidden by default; Smaller, faster variant of GPT-5.4; 90% discount on cached input tokens",
|
|
322
406
|
"best_for": "Lightweight GPT-5.4 variant balancing quality and cost, well-suited for straightforward coding, short-form generation, and high-throughput workloads needing solid GPT reasoning at a fraction of the flagship price"
|
|
323
407
|
},
|
|
@@ -359,7 +443,7 @@
|
|
|
359
443
|
"speed": "D"
|
|
360
444
|
},
|
|
361
445
|
"jurisdiction": "us",
|
|
362
|
-
"headline_benchmarks": "AA Intelligence Index 60.2 (#1); LMArena Text Elo
|
|
446
|
+
"headline_benchmarks": "AA Intelligence Index 60.2 (#1); LMArena Text Elo 1462.3 (#16); HLE 44.3%; AA-Omniscience 20.1 (#3)",
|
|
363
447
|
"pricing_notes": "Requires Max Mode on request-based plans; Agentic and reasoning capabilities; More token-efficient than GPT-5.4 on comparable tasks; Improved persistence on long-running tasks; Fast mode is available at higher rates; Long context (Max Mode) supports up to 1M tokens with 2x input pricing",
|
|
364
448
|
"best_for": "OpenAI's most capable frontier model and highest-cost GPT offering, best suited for the most demanding reasoning, long-horizon planning, and tasks where maximum intelligence is required regardless of cost \u2014 strongest single model for hard coding, agentic execution, and reasoning, but verify factual claims due to elevated hallucination"
|
|
365
449
|
},
|
|
@@ -381,7 +465,7 @@
|
|
|
381
465
|
},
|
|
382
466
|
"jurisdiction": "us",
|
|
383
467
|
"headline_benchmarks": "AA Intelligence Index 53.2 (#7); AA-Omniscience 18.3 (#4); HLE 35.0%; LMArena Search Elo 1189.2",
|
|
384
|
-
"pricing_notes": "Requires Max Mode on request-based plans",
|
|
468
|
+
"pricing_notes": "Hidden by default; Requires Max Mode on request-based plans",
|
|
385
469
|
"best_for": "Latest Grok release with built-in multi-agent self-verification, configurable reasoning depth, and signature 2M-token context with hallucination-resistant grounding \u2014 leads the low tier on agentic execution and long-context, ideal when massive context, factual accuracy, and aggressive cost efficiency must coexist"
|
|
386
470
|
},
|
|
387
471
|
{
|
|
@@ -405,6 +489,69 @@
|
|
|
405
489
|
"pricing_notes": "Hidden by default",
|
|
406
490
|
"best_for": "Moonshot's affordable mid-volume model \u2014 a non-Google / non-OpenAI / non-Anthropic option at low-tier pricing for cost-conscious code and text generation when provider diversity is desired (vendor-risk hedging, regional preferences); routed via Cursor's pool only \u2014 no direct Moonshot access method is currently enumerated in the access-methods block"
|
|
407
491
|
},
|
|
492
|
+
{
|
|
493
|
+
"id": "mistral-large-3",
|
|
494
|
+
"name": "Mistral Large 3",
|
|
495
|
+
"input_price_per_1m": 0.5,
|
|
496
|
+
"output_price_per_1m": 1.5,
|
|
497
|
+
"cache_read_per_1m": null,
|
|
498
|
+
"tier_cost": "low",
|
|
499
|
+
"tiers": {
|
|
500
|
+
"coding": "C",
|
|
501
|
+
"planning": "C",
|
|
502
|
+
"agentic": "C",
|
|
503
|
+
"multimodal": "D",
|
|
504
|
+
"long-context": "C",
|
|
505
|
+
"knowledge": "C",
|
|
506
|
+
"speed": "B"
|
|
507
|
+
},
|
|
508
|
+
"jurisdiction": "eu",
|
|
509
|
+
"headline_benchmarks": "AA Intelligence Index 23 (independently measured by Artificial Analysis); open-weight Mixture-of-Experts (self-hostable); text-only",
|
|
510
|
+
"pricing_notes": "Provider-direct Mistral API per-token pricing (not via the Cursor pool); eu-jurisdiction; prices manually maintained (Mistral publishes no machine-readable price source)",
|
|
511
|
+
"best_for": "Mistral's open-weight Large 3 (MoE) \u2014 an EU-jurisdiction, self-hostable option at very low cost ($1.50/M output) for data-sovereignty workloads or teams that want to run the weights themselves. Artificial Analysis Intelligence Index 23 sits below the frontier and even below Mistral's own Medium 3.5 (Mistral repositioned Large as an open community model) \u2014 pick it for the open-weights / EU-operator profile, not raw capability. Reached via the `mistral-api` method (provider-direct per-token) or self-hosting."
|
|
512
|
+
},
|
|
513
|
+
{
|
|
514
|
+
"id": "mistral-medium-3.5",
|
|
515
|
+
"name": "Mistral Medium 3.5",
|
|
516
|
+
"input_price_per_1m": 1.5,
|
|
517
|
+
"output_price_per_1m": 7.5,
|
|
518
|
+
"cache_read_per_1m": null,
|
|
519
|
+
"tier_cost": "low",
|
|
520
|
+
"tiers": {
|
|
521
|
+
"coding": "B",
|
|
522
|
+
"planning": "B",
|
|
523
|
+
"agentic": "C",
|
|
524
|
+
"multimodal": "B",
|
|
525
|
+
"long-context": "B",
|
|
526
|
+
"knowledge": "B",
|
|
527
|
+
"speed": "B"
|
|
528
|
+
},
|
|
529
|
+
"jurisdiction": "eu",
|
|
530
|
+
"headline_benchmarks": "AA Intelligence Index 39 (independently measured by Artificial Analysis); unified chat / reasoning / code model with an adjustable reasoning dial (reasoning_effort); multimodal (text + image input)",
|
|
531
|
+
"pricing_notes": "Provider-direct Mistral API per-token pricing (not via the Cursor pool); eu-jurisdiction; prices manually maintained (Mistral publishes no machine-readable price source)",
|
|
532
|
+
"best_for": "Mistral's flagship unified model \u2014 the EU-jurisdiction choice for data-sovereignty / EU-regulatory workloads at low cost ($7.50/M output), with adjustable reasoning and multimodal (vision) input. Artificial Analysis Intelligence Index 39 places it mid-pack (below the US/cn frontier such as Gemini 3.1 Pro or DeepSeek V4-Pro) \u2014 pick it when the operator's EU jurisdiction is the deciding constraint, not when raw capability is. Reached via the `mistral-api` method (provider-direct per-token) with a mistral-api-key."
|
|
533
|
+
},
|
|
534
|
+
{
|
|
535
|
+
"id": "mistral-small-4",
|
|
536
|
+
"name": "Mistral Small 4",
|
|
537
|
+
"input_price_per_1m": 0.1,
|
|
538
|
+
"output_price_per_1m": 0.3,
|
|
539
|
+
"cache_read_per_1m": null,
|
|
540
|
+
"tier_cost": "low",
|
|
541
|
+
"tiers": {
|
|
542
|
+
"coding": "C",
|
|
543
|
+
"planning": "C",
|
|
544
|
+
"agentic": "C",
|
|
545
|
+
"multimodal": "B",
|
|
546
|
+
"long-context": "C",
|
|
547
|
+
"knowledge": "C",
|
|
548
|
+
"speed": "A"
|
|
549
|
+
},
|
|
550
|
+
"jurisdiction": "eu",
|
|
551
|
+
"headline_benchmarks": "AA Intelligence Index 28 (independently measured by Artificial Analysis); compact Mixture-of-Experts unifying the former Small / Magistral / Pixtral / Devstral lines; adjustable reasoning_effort; multimodal (text + image)",
|
|
552
|
+
"pricing_notes": "Provider-direct Mistral API per-token pricing (not via the Cursor pool); eu-jurisdiction; prices manually maintained (Mistral publishes no machine-readable price source)",
|
|
553
|
+
"best_for": "Mistral's cheapest fast model ($0.30/M output) \u2014 a small EU-jurisdiction MoE with multimodal input and an optional reasoning dial, for high-throughput / latency-sensitive text and light multimodal work where the EU operator matters and a mistral-api-key is configured. Artificial Analysis Intelligence Index 28 is low, so it is a cost / sovereignty pick rather than a capability pick. Reached via the `mistral-api` method (provider-direct per-token)."
|
|
554
|
+
},
|
|
408
555
|
{
|
|
409
556
|
"id": "opus-4.7",
|
|
410
557
|
"name": "Opus 4.7",
|
|
@@ -422,7 +569,7 @@
|
|
|
422
569
|
"speed": "D"
|
|
423
570
|
},
|
|
424
571
|
"jurisdiction": "us",
|
|
425
|
-
"headline_benchmarks": "AA Intelligence Index 57.3 (#2); LMArena Text #
|
|
572
|
+
"headline_benchmarks": "AA Intelligence Index 57.3 (#2); LMArena Text #6 (Elo 1480.4); LMArena WebDev #2 (Elo 1556.5); AA-Omniscience 26.2 (#2)",
|
|
426
573
|
"pricing_notes": "Hidden by default; Requires Max Mode on request-based plans; Up to 1M tokens in Max Mode at the same per-token rates (no long-context surcharge)",
|
|
427
574
|
"best_for": "Deepest abstract and scientific reasoning, highest coherence on long unsupervised multi-step agent chains, best long-context recall at 1M tokens, 128K output ceiling for large single-shot deliverables, and novel problem-solving where high ambiguity demands creative judgment over pattern-matching"
|
|
428
575
|
},
|
|
@@ -436,14 +583,14 @@
|
|
|
436
583
|
"tiers": {
|
|
437
584
|
"coding": "S",
|
|
438
585
|
"planning": "S",
|
|
439
|
-
"agentic": "
|
|
586
|
+
"agentic": "S",
|
|
440
587
|
"multimodal": "A",
|
|
441
588
|
"long-context": "S",
|
|
442
589
|
"knowledge": "S",
|
|
443
590
|
"speed": "D"
|
|
444
591
|
},
|
|
445
592
|
"jurisdiction": "us",
|
|
446
|
-
"headline_benchmarks": "
|
|
593
|
+
"headline_benchmarks": "AA Intelligence Index 61.4 (#1); HLE 45.7%; Terminal-Bench Hard 58.3 (top-tier); \u03c4\u00b2-bench retail pass_1 94.4%",
|
|
447
594
|
"pricing_notes": "Requires Max Mode on request-based plans; Fast mode (`claude-opus-4-8-fast`) requires Max Mode; Fast mode is 3x lower per-token pricing than Opus 4.7 fast mode; Up to 1M tokens in Max Mode at the same per-token rates (no long-context surcharge)",
|
|
448
595
|
"best_for": "Anthropic's Opus 4.7 successor at the same very-high tier pricing \u2014 placeholder tier ratings inherited from opus-4.7 pending benchmark coverage; the 3x cheaper fast-mode per-token rate (vs opus-4.7 fast mode) is the headline cost-structure change to surface in the next editorial pass"
|
|
449
596
|
},
|
|
@@ -464,7 +611,7 @@
|
|
|
464
611
|
"speed": "B"
|
|
465
612
|
},
|
|
466
613
|
"jurisdiction": "us",
|
|
467
|
-
"headline_benchmarks": "AA Intelligence Index 51.7; LMArena WebDev Elo 1522.
|
|
614
|
+
"headline_benchmarks": "AA Intelligence Index 51.7; LMArena WebDev Elo 1522.2 (#10); AA-Omniscience 12.4; top-ranked tool-calling on Anthropic lineage",
|
|
468
615
|
"pricing_notes": "Requires Max Mode on request-based plans; Up to 1M tokens in Max Mode at the same per-token rates (no long-context surcharge)",
|
|
469
616
|
"best_for": "Top-ranked tool-calling and agentic execution globally, near-Opus coding quality at 2-3x the speed, strong mathematical reasoning (89% MATH), and complex but well-structured tasks needing reliable high-throughput multi-step implementation"
|
|
470
617
|
}
|
|
@@ -479,6 +626,7 @@
|
|
|
479
626
|
"requires": "anthropic-api-key",
|
|
480
627
|
"supports_models": [
|
|
481
628
|
"claude-4.5-haiku",
|
|
629
|
+
"claude-fable-5",
|
|
482
630
|
"opus-4.7",
|
|
483
631
|
"opus-4.8",
|
|
484
632
|
"sonnet-4.6"
|
|
@@ -514,13 +662,14 @@
|
|
|
514
662
|
"requires": "claude-max-subscription OR anthropic-api-key",
|
|
515
663
|
"supports_models": [
|
|
516
664
|
"claude-4.5-haiku",
|
|
665
|
+
"claude-fable-5",
|
|
517
666
|
"opus-4.7",
|
|
518
667
|
"opus-4.8",
|
|
519
668
|
"sonnet-4.6"
|
|
520
669
|
],
|
|
521
670
|
"exposes_max_mode": "no",
|
|
522
671
|
"exposes_thinking": "yes",
|
|
523
|
-
"best_for": "Default for Claude coding or terminal tasks when a claude.ai Max subscription is active \u2014 $0 marginal cost until the Max budget is exhausted, full tool-use surface, runs as a CLI and as an IDE extension inside Cursor. Heavy Opus usage that would cost over $1,000/mo on per-token API is fully covered by a $100/mo Max plan."
|
|
672
|
+
"best_for": "Default for Claude coding or terminal tasks when a claude.ai Max subscription is active \u2014 $0 marginal cost until the Max budget is exhausted, full tool-use surface, runs as a CLI and as an IDE extension inside Cursor. Heavy Opus usage that would cost over $1,000/mo on per-token API is fully covered by a $100/mo Max plan. Exposes the full `/effort` dial (low/medium/high/xhigh/max \u2014 Opus 4.6 and Sonnet 4.6 top out at max with no xhigh step; Opus 4.7, Opus 4.8, and Fable 5 expose the full range) plus Ultracode (session-wide xhigh + Dynamic Workflows) and the per-turn `ultrathink` keyword."
|
|
524
673
|
},
|
|
525
674
|
{
|
|
526
675
|
"id": "claude-web",
|
|
@@ -569,6 +718,7 @@
|
|
|
569
718
|
"requires": "cursor-pro-or-ultra-subscription",
|
|
570
719
|
"supports_models": [
|
|
571
720
|
"claude-4.5-haiku",
|
|
721
|
+
"claude-fable-5",
|
|
572
722
|
"composer-2",
|
|
573
723
|
"composer-2.5",
|
|
574
724
|
"gemini-2.5-flash",
|
|
@@ -595,6 +745,21 @@
|
|
|
595
745
|
"exposes_thinking": "no",
|
|
596
746
|
"best_for": "Cursor IDE \u2014 single Platform covering both UI modes (Composer for multi-file autonomous editing; Chat for interactive model-picker). The operator picks the mode at task time based on the chosen Model: composer-2 / composer-2.5 imply Composer mode; frontier models (opus-4.7, gpt-5.5, sonnet-4.6, etc.) imply Chat mode. Cursor's own Auto and Premium routing modes are deliberately NOT enumerated as roadmodel-recommendable models because their routing is opaque (see `jurisdiction-context` for the rationale) \u2014 operators who want routing behavior pick a specific fixed model and let Cursor's pool handle the call. All routes through the $0-marginal Cursor pool. Defer to claude-code when the chosen model is Claude and claude.ai Max is active (Max budget is cheaper marginal cost than burning Cursor pool tokens on Claude calls that have a dedicated Anthropic subscription path)."
|
|
597
747
|
},
|
|
748
|
+
{
|
|
749
|
+
"id": "deepseek-api",
|
|
750
|
+
"name": "DeepSeek API",
|
|
751
|
+
"provider": "deepseek",
|
|
752
|
+
"provider_jurisdiction": "cn",
|
|
753
|
+
"billing": "per-token",
|
|
754
|
+
"requires": "deepseek-api-key",
|
|
755
|
+
"supports_models": [
|
|
756
|
+
"deepseek-v4-flash",
|
|
757
|
+
"deepseek-v4-pro"
|
|
758
|
+
],
|
|
759
|
+
"exposes_max_mode": "no",
|
|
760
|
+
"exposes_thinking": "yes",
|
|
761
|
+
"best_for": "Direct DeepSeek API access (provider-direct per-token; OpenAI-format at api.deepseek.com and Anthropic-format at api.deepseek.com/anthropic) for the deepseek-v4 models \u2014 cost-conscious coding / reasoning / long-context (1M) work when the cn jurisdiction is acceptable and a deepseek-api-key is configured. Exposes the full thinking dial (toggle + reasoning_effort `high`/`max`). Not routed via the Cursor pool. cn-jurisdiction: excluded by the default allowed-jurisdictions list unless the user opts into cn."
|
|
762
|
+
},
|
|
598
763
|
{
|
|
599
764
|
"id": "gemini-app",
|
|
600
765
|
"name": "Gemini (web / app)",
|
|
@@ -606,7 +771,8 @@
|
|
|
606
771
|
"gemini-2.5-flash",
|
|
607
772
|
"gemini-3-flash",
|
|
608
773
|
"gemini-3-pro",
|
|
609
|
-
"gemini-3.1-pro"
|
|
774
|
+
"gemini-3.1-pro",
|
|
775
|
+
"gemini-3.5-flash"
|
|
610
776
|
],
|
|
611
777
|
"exposes_max_mode": "no",
|
|
612
778
|
"exposes_thinking": "yes",
|
|
@@ -623,7 +789,8 @@
|
|
|
623
789
|
"gemini-2.5-flash",
|
|
624
790
|
"gemini-3-flash",
|
|
625
791
|
"gemini-3-pro",
|
|
626
|
-
"gemini-3.1-pro"
|
|
792
|
+
"gemini-3.1-pro",
|
|
793
|
+
"gemini-3.5-flash"
|
|
627
794
|
],
|
|
628
795
|
"exposes_max_mode": "no",
|
|
629
796
|
"exposes_thinking": "yes",
|
|
@@ -640,12 +807,30 @@
|
|
|
640
807
|
"gemini-2.5-flash",
|
|
641
808
|
"gemini-3-flash",
|
|
642
809
|
"gemini-3-pro",
|
|
643
|
-
"gemini-3.1-pro"
|
|
810
|
+
"gemini-3.1-pro",
|
|
811
|
+
"gemini-3.5-flash"
|
|
644
812
|
],
|
|
645
813
|
"exposes_max_mode": "no",
|
|
646
814
|
"exposes_thinking": "yes",
|
|
647
815
|
"best_for": "Programmatic / scripted Gemini use with a Google API key. Pay-per-token at Google's published rates. Powers the roadmodel SaaS free-tier surfaces (/recommend on Gemini 2.5 Flash; /roadmap on Gemini 2.5 Flash with 3.1 Pro escalation)."
|
|
648
816
|
},
|
|
817
|
+
{
|
|
818
|
+
"id": "mistral-api",
|
|
819
|
+
"name": "Mistral API",
|
|
820
|
+
"provider": "mistral",
|
|
821
|
+
"provider_jurisdiction": "eu",
|
|
822
|
+
"billing": "per-token",
|
|
823
|
+
"requires": "mistral-api-key",
|
|
824
|
+
"supports_models": [
|
|
825
|
+
"codestral",
|
|
826
|
+
"mistral-large-3",
|
|
827
|
+
"mistral-medium-3.5",
|
|
828
|
+
"mistral-small-4"
|
|
829
|
+
],
|
|
830
|
+
"exposes_max_mode": "no",
|
|
831
|
+
"exposes_thinking": "yes",
|
|
832
|
+
"best_for": "Direct Mistral API access (provider-direct per-token; La Plateforme at api.mistral.ai) for the Mistral models \u2014 the EU-jurisdiction option for data-sovereignty / EU-regulatory workloads at low cost. Exposes a reasoning dial on the unified models (Mistral Small 4 / Medium 3.5) via the `reasoning_effort` parameter. Not routed via the Cursor pool. eu-jurisdiction is in the default allowed-jurisdictions list, so Mistral surfaces for any user with a mistral-api-key configured (no jurisdiction opt-in required, unlike cn providers)."
|
|
833
|
+
},
|
|
649
834
|
{
|
|
650
835
|
"id": "openai-api",
|
|
651
836
|
"name": "OpenAI API",
|
|
@@ -697,6 +882,7 @@
|
|
|
697
882
|
"provider": "Anthropic",
|
|
698
883
|
"tier": "Claude Pro",
|
|
699
884
|
"monthly_usd": 20.0,
|
|
885
|
+
"annual_usd": 200.0,
|
|
700
886
|
"surface_funded": [
|
|
701
887
|
"claude-code",
|
|
702
888
|
"claude-web"
|
|
@@ -707,6 +893,7 @@
|
|
|
707
893
|
"provider": "Anthropic",
|
|
708
894
|
"tier": "claude.ai Max ($100)",
|
|
709
895
|
"monthly_usd": 100.0,
|
|
896
|
+
"annual_usd": null,
|
|
710
897
|
"surface_funded": [
|
|
711
898
|
"claude-code",
|
|
712
899
|
"claude-web"
|
|
@@ -717,6 +904,7 @@
|
|
|
717
904
|
"provider": "Anthropic",
|
|
718
905
|
"tier": "claude.ai Max ($200)",
|
|
719
906
|
"monthly_usd": 200.0,
|
|
907
|
+
"annual_usd": null,
|
|
720
908
|
"surface_funded": [
|
|
721
909
|
"claude-code",
|
|
722
910
|
"claude-web"
|
|
@@ -727,6 +915,7 @@
|
|
|
727
915
|
"provider": "Cursor",
|
|
728
916
|
"tier": "Cursor Pro",
|
|
729
917
|
"monthly_usd": 20.0,
|
|
918
|
+
"annual_usd": 192.0,
|
|
730
919
|
"surface_funded": [
|
|
731
920
|
"cursor"
|
|
732
921
|
],
|
|
@@ -736,6 +925,7 @@
|
|
|
736
925
|
"provider": "Cursor",
|
|
737
926
|
"tier": "Cursor Pro+",
|
|
738
927
|
"monthly_usd": 60.0,
|
|
928
|
+
"annual_usd": null,
|
|
739
929
|
"surface_funded": [
|
|
740
930
|
"cursor"
|
|
741
931
|
],
|
|
@@ -745,6 +935,7 @@
|
|
|
745
935
|
"provider": "Cursor",
|
|
746
936
|
"tier": "Cursor Ultra",
|
|
747
937
|
"monthly_usd": 200.0,
|
|
938
|
+
"annual_usd": null,
|
|
748
939
|
"surface_funded": [
|
|
749
940
|
"cursor"
|
|
750
941
|
],
|
|
@@ -753,17 +944,19 @@
|
|
|
753
944
|
{
|
|
754
945
|
"provider": "Google",
|
|
755
946
|
"tier": "Google AI Plus",
|
|
756
|
-
"monthly_usd":
|
|
947
|
+
"monthly_usd": 4.99,
|
|
948
|
+
"annual_usd": null,
|
|
757
949
|
"surface_funded": [
|
|
758
950
|
"gemini-app",
|
|
759
951
|
"gemini-cli"
|
|
760
952
|
],
|
|
761
|
-
"notes": "Entry-paid Google AI tier with 2x higher usage limits than Free in the Gemini app, access to
|
|
953
|
+
"notes": "Entry-paid Google AI tier with 2x higher usage limits than Free in the Gemini app, access to Gemini 3.1 Pro / Nano Banana Pro / Daily Brief / Gemini Omni video generation, 200 Google Flow Credits, and 400 GB of cloud storage (price cut from $7.99 to $4.99 on 2026-06-08; storage doubled from 200 GB to 400 GB)."
|
|
762
954
|
},
|
|
763
955
|
{
|
|
764
956
|
"provider": "Google",
|
|
765
957
|
"tier": "Google AI Pro",
|
|
766
958
|
"monthly_usd": 20.0,
|
|
959
|
+
"annual_usd": 199.99,
|
|
767
960
|
"surface_funded": [
|
|
768
961
|
"gemini-app",
|
|
769
962
|
"gemini-cli"
|
|
@@ -774,6 +967,7 @@
|
|
|
774
967
|
"provider": "Google",
|
|
775
968
|
"tier": "Google AI Ultra ($100)",
|
|
776
969
|
"monthly_usd": 100.0,
|
|
970
|
+
"annual_usd": null,
|
|
777
971
|
"surface_funded": [
|
|
778
972
|
"gemini-app",
|
|
779
973
|
"gemini-cli"
|
|
@@ -784,6 +978,7 @@
|
|
|
784
978
|
"provider": "Google",
|
|
785
979
|
"tier": "Google AI Ultra ($200)",
|
|
786
980
|
"monthly_usd": 200.0,
|
|
981
|
+
"annual_usd": null,
|
|
787
982
|
"surface_funded": [
|
|
788
983
|
"gemini-app",
|
|
789
984
|
"gemini-cli"
|
|
@@ -794,6 +989,7 @@
|
|
|
794
989
|
"provider": "OpenAI",
|
|
795
990
|
"tier": "ChatGPT Go",
|
|
796
991
|
"monthly_usd": 8.0,
|
|
992
|
+
"annual_usd": null,
|
|
797
993
|
"surface_funded": [
|
|
798
994
|
"chatgpt-app",
|
|
799
995
|
"codex-cli"
|
|
@@ -804,6 +1000,7 @@
|
|
|
804
1000
|
"provider": "OpenAI",
|
|
805
1001
|
"tier": "ChatGPT Plus",
|
|
806
1002
|
"monthly_usd": 20.0,
|
|
1003
|
+
"annual_usd": null,
|
|
807
1004
|
"surface_funded": [
|
|
808
1005
|
"chatgpt-app",
|
|
809
1006
|
"codex-cli"
|
|
@@ -814,6 +1011,7 @@
|
|
|
814
1011
|
"provider": "OpenAI",
|
|
815
1012
|
"tier": "ChatGPT Pro ($100)",
|
|
816
1013
|
"monthly_usd": 100.0,
|
|
1014
|
+
"annual_usd": null,
|
|
817
1015
|
"surface_funded": [
|
|
818
1016
|
"chatgpt-app",
|
|
819
1017
|
"codex-cli"
|
|
@@ -824,6 +1022,7 @@
|
|
|
824
1022
|
"provider": "OpenAI",
|
|
825
1023
|
"tier": "ChatGPT Pro ($200)",
|
|
826
1024
|
"monthly_usd": 200.0,
|
|
1025
|
+
"annual_usd": null,
|
|
827
1026
|
"surface_funded": [
|
|
828
1027
|
"chatgpt-app",
|
|
829
1028
|
"codex-cli"
|