skyloom 1.14.8 → 1.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (156) hide show
  1. package/.github/workflows/ci.yml +2 -2
  2. package/.github/workflows/publish.yml +51 -4
  3. package/CONVERSION_PLAN.md +191 -191
  4. package/config/default.yaml +46 -43
  5. package/config/models.yaml +928 -155
  6. package/config/providers.yaml +109 -6
  7. package/dist/agents/snow.d.ts +2 -0
  8. package/dist/agents/snow.d.ts.map +1 -1
  9. package/dist/agents/snow.js +36 -5
  10. package/dist/agents/snow.js.map +1 -1
  11. package/dist/cli/loom_chat.d.ts.map +1 -1
  12. package/dist/cli/loom_chat.js +207 -1
  13. package/dist/cli/loom_chat.js.map +1 -1
  14. package/dist/cli/main.js +190 -40
  15. package/dist/cli/main.js.map +1 -1
  16. package/dist/cli/tui.d.ts.map +1 -1
  17. package/dist/cli/tui.js +6 -31
  18. package/dist/cli/tui.js.map +1 -1
  19. package/dist/core/agent.d.ts +6 -4
  20. package/dist/core/agent.d.ts.map +1 -1
  21. package/dist/core/agent.js +61 -20
  22. package/dist/core/agent.js.map +1 -1
  23. package/dist/core/catalog.d.ts.map +1 -1
  24. package/dist/core/catalog.js +30 -9
  25. package/dist/core/catalog.js.map +1 -1
  26. package/dist/core/commands.d.ts +110 -0
  27. package/dist/core/commands.d.ts.map +1 -0
  28. package/dist/core/commands.js +633 -0
  29. package/dist/core/commands.js.map +1 -0
  30. package/dist/core/concurrency.d.ts +38 -0
  31. package/dist/core/concurrency.d.ts.map +1 -0
  32. package/dist/core/concurrency.js +65 -0
  33. package/dist/core/concurrency.js.map +1 -0
  34. package/dist/core/factory.js +16 -16
  35. package/dist/core/file_checkpoint.d.ts +9 -0
  36. package/dist/core/file_checkpoint.d.ts.map +1 -1
  37. package/dist/core/file_checkpoint.js +33 -1
  38. package/dist/core/file_checkpoint.js.map +1 -1
  39. package/dist/core/llm.d.ts.map +1 -1
  40. package/dist/core/llm.js +66 -13
  41. package/dist/core/llm.js.map +1 -1
  42. package/dist/core/memory.js +51 -51
  43. package/dist/core/schemas.d.ts +16 -0
  44. package/dist/core/schemas.d.ts.map +1 -1
  45. package/dist/core/schemas.js +32 -0
  46. package/dist/core/schemas.js.map +1 -1
  47. package/dist/core/security.d.ts.map +1 -1
  48. package/dist/core/security.js +27 -0
  49. package/dist/core/security.js.map +1 -1
  50. package/dist/core/skymd.js +14 -14
  51. package/dist/core/trace.d.ts +105 -0
  52. package/dist/core/trace.d.ts.map +1 -0
  53. package/dist/core/trace.js +213 -0
  54. package/dist/core/trace.js.map +1 -0
  55. package/dist/tools/builtin.d.ts +2 -6
  56. package/dist/tools/builtin.d.ts.map +1 -1
  57. package/dist/tools/builtin.js +18 -111
  58. package/dist/tools/builtin.js.map +1 -1
  59. package/dist/tools/extra.d.ts +13 -0
  60. package/dist/tools/extra.d.ts.map +1 -0
  61. package/dist/tools/extra.js +827 -0
  62. package/dist/tools/extra.js.map +1 -0
  63. package/dist/tools/guards.d.ts +12 -0
  64. package/dist/tools/guards.d.ts.map +1 -0
  65. package/dist/tools/guards.js +143 -0
  66. package/dist/tools/guards.js.map +1 -0
  67. package/dist/tools/model_tool.d.ts.map +1 -1
  68. package/dist/tools/model_tool.js +24 -4
  69. package/dist/tools/model_tool.js.map +1 -1
  70. package/dist/web/markdown.d.ts +32 -0
  71. package/dist/web/markdown.d.ts.map +1 -0
  72. package/dist/web/markdown.js +202 -0
  73. package/dist/web/markdown.js.map +1 -0
  74. package/dist/web/server.d.ts +4 -0
  75. package/dist/web/server.d.ts.map +1 -1
  76. package/dist/web/server.js +14 -582
  77. package/dist/web/server.js.map +1 -1
  78. package/dist/web/ui.d.ts +31 -0
  79. package/dist/web/ui.d.ts.map +1 -0
  80. package/dist/web/ui.js +1009 -0
  81. package/dist/web/ui.js.map +1 -0
  82. package/docs/AESTHETIC_DESIGN.md +152 -152
  83. package/docs/OPTIMIZATION_PLAN.md +178 -178
  84. package/package.json +1 -1
  85. package/src/agents/snow.ts +38 -5
  86. package/src/cli/commands_md.ts +112 -112
  87. package/src/cli/input_macros.ts +83 -83
  88. package/src/cli/loom.ts +1041 -1041
  89. package/src/cli/loom_chat.ts +772 -603
  90. package/src/cli/main.ts +853 -723
  91. package/src/cli/tui.ts +264 -289
  92. package/src/core/agent/guard.ts +133 -133
  93. package/src/core/agent/task.ts +100 -100
  94. package/src/core/agent.ts +1630 -1590
  95. package/src/core/agent_helpers.ts +500 -500
  96. package/src/core/bus.ts +221 -221
  97. package/src/core/cache.ts +153 -153
  98. package/src/core/catalog.ts +199 -178
  99. package/src/core/circuit_breaker.ts +119 -119
  100. package/src/core/commands.ts +704 -0
  101. package/src/core/concurrency.ts +73 -0
  102. package/src/core/config.ts +365 -365
  103. package/src/core/constants.ts +95 -95
  104. package/src/core/factory.ts +656 -656
  105. package/src/core/file_checkpoint.ts +163 -136
  106. package/src/core/hooks.ts +126 -126
  107. package/src/core/llm.ts +972 -915
  108. package/src/core/logger.ts +143 -143
  109. package/src/core/mcp.ts +1001 -1001
  110. package/src/core/memory.ts +1201 -1201
  111. package/src/core/middleware.ts +350 -350
  112. package/src/core/model_config.ts +159 -159
  113. package/src/core/pipelines.ts +424 -424
  114. package/src/core/schemas.ts +319 -282
  115. package/src/core/security.ts +27 -0
  116. package/src/core/semantic.ts +211 -211
  117. package/src/core/skill.ts +384 -384
  118. package/src/core/skymd.ts +143 -143
  119. package/src/core/theme.ts +65 -65
  120. package/src/core/tool.ts +457 -457
  121. package/src/core/trace.ts +236 -0
  122. package/src/core/verify.ts +71 -71
  123. package/src/plugins/loader.ts +91 -91
  124. package/src/skills/loader.ts +75 -75
  125. package/src/tools/builtin.ts +571 -642
  126. package/src/tools/computer.ts +279 -279
  127. package/src/tools/extra.ts +662 -0
  128. package/src/tools/guards.ts +82 -0
  129. package/src/tools/model_tool.ts +93 -74
  130. package/src/tools/todo.ts +76 -76
  131. package/src/web/markdown.ts +193 -0
  132. package/src/web/server.ts +117 -693
  133. package/src/web/ui.ts +949 -0
  134. package/tests/agent.test.ts +211 -159
  135. package/tests/agent_helpers.test.ts +48 -48
  136. package/tests/catalog.test.ts +86 -86
  137. package/tests/checkpoint_commands.test.ts +124 -124
  138. package/tests/claude_compat.test.ts +110 -110
  139. package/tests/commands.test.ts +103 -0
  140. package/tests/concurrency.test.ts +102 -0
  141. package/tests/config.test.ts +41 -41
  142. package/tests/extra_tools.test.ts +212 -0
  143. package/tests/fence_plugin.test.ts +52 -52
  144. package/tests/guard.test.ts +75 -75
  145. package/tests/loom.test.ts +337 -337
  146. package/tests/memory.test.ts +170 -170
  147. package/tests/model_config.test.ts +109 -109
  148. package/tests/skymd.test.ts +146 -146
  149. package/tests/ssrf.test.ts +38 -38
  150. package/tests/structured_retry.test.ts +87 -0
  151. package/tests/task.test.ts +60 -60
  152. package/tests/todo_toolstats.test.ts +94 -94
  153. package/tests/trace.test.ts +128 -0
  154. package/tests/tui.test.ts +67 -67
  155. package/tests/web.test.ts +169 -0
  156. package/tsconfig.json +38 -38
@@ -1,155 +1,928 @@
1
- # Model Catalog — latest models per provider
2
- # Every model listed here is directly callable via the LLM client.
3
-
4
- openai:
5
- - name: gpt-4.1
6
- context: 1048576
7
- cost_in: 2.00
8
- cost_out: 8.00
9
- desc: "旗舰,百万token上下文"
10
- - name: gpt-4.1-mini
11
- context: 1048576
12
- cost_in: 0.40
13
- cost_out: 1.60
14
- desc: "轻量,同款长上下文"
15
- - name: gpt-4o
16
- context: 131072
17
- cost_in: 2.50
18
- cost_out: 10.00
19
- desc: "多模态全能"
20
- - name: gpt-4o-mini
21
- context: 131072
22
- cost_in: 0.15
23
- cost_out: 0.60
24
- desc: "小模型高性价比"
25
- - name: o4-mini
26
- context: 204800
27
- cost_in: 1.10
28
- cost_out: 4.40
29
- desc: "推理模型轻量版"
30
-
31
- anthropic:
32
- - name: claude-sonnet-4-6
33
- context: 204800
34
- cost_in: 3.00
35
- cost_out: 15.00
36
- desc: "编程+推理首选"
37
- - name: claude-opus-4-7
38
- context: 204800
39
- cost_in: 5.00
40
- cost_out: 25.00
41
- desc: "最强旗舰"
42
- - name: claude-haiku-4-5
43
- context: 204800
44
- cost_in: 0.80
45
- cost_out: 4.00
46
- desc: "速度最快"
47
-
48
- deepseek:
49
- - name: deepseek-chat
50
- context: 131072
51
- cost_in: 0.27
52
- cost_out: 1.10
53
- desc: "通用对话"
54
- - name: deepseek-reasoner
55
- context: 65536
56
- cost_in: 0.55
57
- cost_out: 2.19
58
- desc: "深度推理 (alias → v4-flash)"
59
- - name: deepseek-v4-flash
60
- context: 131072
61
- cost_in: 0.14
62
- cost_out: 0.28
63
- desc: "极速低成本 (deepseek-chat 实际后端)"
64
- - name: deepseek-v4-pro
65
- context: 131072
66
- cost_in: 1.74
67
- cost_out: 3.48
68
- desc: "旗舰版"
69
-
70
- google:
71
- - name: gemini-2.5-pro
72
- context: 1048576
73
- cost_in: 1.25
74
- cost_out: 10.00
75
- desc: "旗舰推理"
76
- - name: gemini-2.5-flash
77
- context: 1048576
78
- cost_in: 0.30
79
- cost_out: 2.50
80
- desc: "快速长上下文"
81
-
82
- groq:
83
- - name: llama-4-scout
84
- context: 131072
85
- cost_in: 0
86
- cost_out: 0
87
- desc: "Meta最新,免费额度"
88
- - name: llama-3.3-70b
89
- context: 131072
90
- cost_in: 0
91
- cost_out: 0
92
- desc: "Llama旗舰"
93
- - name: mixtral-8x7b
94
- context: 32768
95
- cost_in: 0
96
- cost_out: 0
97
- desc: "MoE混合专家"
98
-
99
- mistral:
100
- - name: mistral-large
101
- context: 131072
102
- cost_in: 2.00
103
- cost_out: 6.00
104
- desc: "旗舰通用"
105
- - name: mistral-small
106
- context: 32768
107
- cost_in: 0.20
108
- cost_out: 0.60
109
- desc: "轻量高效"
110
-
111
- openrouter:
112
- - name: openai/gpt-4.1
113
- context: 1048576
114
- cost_in: 2.00
115
- cost_out: 8.00
116
- desc: "通过OpenRouter"
117
- - name: anthropic/claude-sonnet-4-6
118
- context: 204800
119
- cost_in: 3.00
120
- cost_out: 15.00
121
- desc: "通过OpenRouter"
122
- - name: google/gemini-2.5-flash
123
- context: 1048576
124
- cost_in: 0.30
125
- cost_out: 2.50
126
- desc: "通过OpenRouter"
127
- - name: meta-llama/llama-4-maverick
128
- context: 131072
129
- cost_in: 0.20
130
- cost_out: 0.60
131
- desc: "Meta旗舰"
132
-
133
- xai:
134
- - name: grok-4
135
- context: 131072
136
- cost_in: 3.00
137
- cost_out: 15.00
138
- desc: "Grok最新"
139
-
140
- ollama:
141
- - name: llama3
142
- context: 8192
143
- cost_in: 0
144
- cost_out: 0
145
- desc: "本地部署"
146
- - name: qwen2.5
147
- context: 32768
148
- cost_in: 0
149
- cost_out: 0
150
- desc: "通义千问"
151
- - name: deepseek-r1
152
- context: 32768
153
- cost_in: 0
154
- cost_out: 0
155
- desc: "本地推理"
1
+ # Model Catalog — comprehensive multi-provider model directory
2
+ # Every model listed here is directly callable via the LLM client.
3
+ # Costs are in USD per 1M tokens; context windows are measured in tokens.
4
+
5
+ # ═══════════════════════════════════════════
6
+ # OpenAI
7
+ # ═══════════════════════════════════════════
8
+ openai:
9
+ - name: gpt-4.1
10
+ context: 1048576
11
+ cost_in: 2.00
12
+ cost_out: 8.00
13
+ desc: "旗舰,百万token上下文"
14
+ - name: gpt-4.1-mini
15
+ context: 1048576
16
+ cost_in: 0.40
17
+ cost_out: 1.60
18
+ desc: "轻量,同款长上下文"
19
+ - name: gpt-4.1-nano
20
+ context: 1048576
21
+ cost_in: 0.10
22
+ cost_out: 0.40
23
+ desc: "超轻量,极致性价比"
24
+ - name: gpt-4o
25
+ context: 131072
26
+ cost_in: 2.50
27
+ cost_out: 10.00
28
+ desc: "多模态全能"
29
+ - name: gpt-4o-mini
30
+ context: 131072
31
+ cost_in: 0.15
32
+ cost_out: 0.60
33
+ desc: "小模型高性价比"
34
+ - name: o3
35
+ context: 204800
36
+ cost_in: 2.00
37
+ cost_out: 8.00
38
+ desc: "最新推理模型"
39
+ - name: o3-mini
40
+ context: 204800
41
+ cost_in: 1.10
42
+ cost_out: 4.40
43
+ desc: "推理模型轻量版"
44
+ - name: o4-mini
45
+ context: 204800
46
+ cost_in: 1.10
47
+ cost_out: 4.40
48
+ desc: "推理模型轻量版"
49
+ - name: o1
50
+ context: 204800
51
+ cost_in: 15.00
52
+ cost_out: 60.00
53
+ desc: "深度推理旗舰"
54
+ - name: o1-mini
55
+ context: 131072
56
+ cost_in: 3.00
57
+ cost_out: 12.00
58
+ desc: "推理模型轻量版"
59
+ - name: o1-pro
60
+ context: 204800
61
+ cost_in: 150.00
62
+ cost_out: 600.00
63
+ desc: "推理模型专业版(极贵)"
64
+ - name: gpt-4.5-preview
65
+ context: 131072
66
+ cost_in: 75.00
67
+ cost_out: 150.00
68
+ desc: "GPT-4.5预览版"
69
+
70
+ # ═══════════════════════════════════════════
71
+ # Anthropic
72
+ # ═══════════════════════════════════════════
73
+ anthropic:
74
+ - name: claude-sonnet-4-6
75
+ context: 204800
76
+ cost_in: 3.00
77
+ cost_out: 15.00
78
+ desc: "编程+推理首选"
79
+ - name: claude-opus-4-7
80
+ context: 204800
81
+ cost_in: 5.00
82
+ cost_out: 25.00
83
+ desc: "最强旗舰"
84
+ - name: claude-haiku-4-5
85
+ context: 204800
86
+ cost_in: 0.80
87
+ cost_out: 4.00
88
+ desc: "速度最快"
89
+ - name: claude-3-7-sonnet
90
+ context: 204800
91
+ cost_in: 3.00
92
+ cost_out: 15.00
93
+ desc: "Claude 3.7 Sonnet"
94
+ - name: claude-3-5-sonnet
95
+ context: 204800
96
+ cost_in: 3.00
97
+ cost_out: 15.00
98
+ desc: "Claude 3.5 Sonnet"
99
+ - name: claude-3-5-haiku
100
+ context: 204800
101
+ cost_in: 0.80
102
+ cost_out: 4.00
103
+ desc: "Claude 3.5 Haiku"
104
+ - name: claude-3-opus
105
+ context: 204800
106
+ cost_in: 15.00
107
+ cost_out: 75.00
108
+ desc: "Claude 3 Opus"
109
+
110
+ # ═══════════════════════════════════════════
111
+ # Google
112
+ # ═══════════════════════════════════════════
113
+ google:
114
+ - name: gemini-2.5-pro
115
+ context: 1048576
116
+ cost_in: 1.25
117
+ cost_out: 10.00
118
+ desc: "旗舰推理"
119
+ - name: gemini-2.5-flash
120
+ context: 1048576
121
+ cost_in: 0.30
122
+ cost_out: 2.50
123
+ desc: "快速长上下文"
124
+ - name: gemini-2.0-flash
125
+ context: 1048576
126
+ cost_in: 0.10
127
+ cost_out: 0.40
128
+ desc: "快速低成本"
129
+ - name: gemini-2.0-flash-lite
130
+ context: 1048576
131
+ cost_in: 0.075
132
+ cost_out: 0.30
133
+ desc: "超轻量快速"
134
+ - name: gemini-1.5-pro
135
+ context: 2097152
136
+ cost_in: 1.25
137
+ cost_out: 5.00
138
+ desc: "百万上下文"
139
+ - name: gemini-1.5-flash
140
+ context: 1048576
141
+ cost_in: 0.075
142
+ cost_out: 0.30
143
+ desc: "快速低成本"
144
+
145
+ # ═══════════════════════════════════════════
146
+ # DeepSeek
147
+ # ═══════════════════════════════════════════
148
+ deepseek:
149
+ - name: deepseek-chat
150
+ context: 131072
151
+ cost_in: 0.27
152
+ cost_out: 1.10
153
+ desc: "通用对话"
154
+ - name: deepseek-reasoner
155
+ context: 65536
156
+ cost_in: 0.55
157
+ cost_out: 2.19
158
+ desc: "深度推理 (alias → v4-flash)"
159
+ - name: deepseek-v4-flash
160
+ context: 131072
161
+ cost_in: 0.14
162
+ cost_out: 0.28
163
+ desc: "极速低成本 (deepseek-chat 实际后端)"
164
+ - name: deepseek-v4-pro
165
+ context: 131072
166
+ cost_in: 1.74
167
+ cost_out: 3.48
168
+ desc: "旗舰版"
169
+ - name: deepseek-r1
170
+ context: 131072
171
+ cost_in: 0.55
172
+ cost_out: 2.19
173
+ desc: "推理模型"
174
+
175
+ # ═══════════════════════════════════════════
176
+ # xAI (Grok)
177
+ # ═══════════════════════════════════════════
178
+ xai:
179
+ - name: grok-4
180
+ context: 131072
181
+ cost_in: 3.00
182
+ cost_out: 15.00
183
+ desc: "Grok最新旗舰"
184
+ - name: grok-3
185
+ context: 131072
186
+ cost_in: 3.00
187
+ cost_out: 15.00
188
+ desc: "Grok 3"
189
+ - name: grok-3-mini
190
+ context: 131072
191
+ cost_in: 0.30
192
+ cost_out: 0.50
193
+ desc: "Grok 3 Mini"
194
+ - name: grok-2
195
+ context: 131072
196
+ cost_in: 2.00
197
+ cost_out: 10.00
198
+ desc: "Grok 2"
199
+
200
+ # ═══════════════════════════════════════════
201
+ # Mistral
202
+ # ═══════════════════════════════════════════
203
+ mistral:
204
+ - name: mistral-large
205
+ context: 131072
206
+ cost_in: 2.00
207
+ cost_out: 6.00
208
+ desc: "旗舰通用"
209
+ - name: mistral-small
210
+ context: 32768
211
+ cost_in: 0.20
212
+ cost_out: 0.60
213
+ desc: "轻量高效"
214
+ - name: codestral
215
+ context: 32768
216
+ cost_in: 0.30
217
+ cost_out: 0.90
218
+ desc: "代码专用"
219
+ - name: pixtral-large
220
+ context: 131072
221
+ cost_in: 2.00
222
+ cost_out: 6.00
223
+ desc: "多模态旗舰"
224
+ - name: pixtral
225
+ context: 131072
226
+ cost_in: 0.15
227
+ cost_out: 0.45
228
+ desc: "多模态轻量"
229
+ - name: ministral-8b
230
+ context: 131072
231
+ cost_in: 0.10
232
+ cost_out: 0.10
233
+ desc: "8B小模型"
234
+ - name: ministral-3b
235
+ context: 131072
236
+ cost_in: 0.04
237
+ cost_out: 0.04
238
+ desc: "3B超轻量"
239
+
240
+ # ═══════════════════════════════════════════
241
+ # Groq (极速推理)
242
+ # ═══════════════════════════════════════════
243
+ groq:
244
+ - name: llama-4-scout
245
+ context: 131072
246
+ cost_in: 0
247
+ cost_out: 0
248
+ desc: "Meta最新,免费额度"
249
+ - name: llama-3.3-70b
250
+ context: 131072
251
+ cost_in: 0
252
+ cost_out: 0
253
+ desc: "Llama旗舰"
254
+ - name: mixtral-8x7b
255
+ context: 32768
256
+ cost_in: 0
257
+ cost_out: 0
258
+ desc: "MoE混合专家"
259
+ - name: gemma2-9b-it
260
+ context: 8192
261
+ cost_in: 0
262
+ cost_out: 0
263
+ desc: "Google Gemma 9B"
264
+ - name: llama-3.1-8b-instant
265
+ context: 131072
266
+ cost_in: 0
267
+ cost_out: 0
268
+ desc: "Llama 3.1 8B 极速"
269
+
270
+ # ═══════════════════════════════════════════
271
+ # Cohere
272
+ # ═══════════════════════════════════════════
273
+ cohere:
274
+ - name: command-r-plus
275
+ context: 131072
276
+ cost_in: 2.50
277
+ cost_out: 10.00
278
+ desc: "旗舰RAG优化"
279
+ - name: command-r
280
+ context: 131072
281
+ cost_in: 0.50
282
+ cost_out: 1.50
283
+ desc: "RAG优化"
284
+ - name: command-light
285
+ context: 4096
286
+ cost_in: 0.30
287
+ cost_out: 0.60
288
+ desc: "轻量快速"
289
+ - name: command
290
+ context: 4096
291
+ cost_in: 1.00
292
+ cost_out: 2.00
293
+ desc: "通用对话"
294
+
295
+ # ═══════════════════════════════════════════
296
+ # Perplexity (搜索增强)
297
+ # ═══════════════════════════════════════════
298
+ perplexity:
299
+ - name: sonar-pro
300
+ context: 204800
301
+ cost_in: 3.00
302
+ cost_out: 15.00
303
+ desc: "搜索增强旗舰"
304
+ - name: sonar
305
+ context: 131072
306
+ cost_in: 1.00
307
+ cost_out: 1.00
308
+ desc: "搜索增强标准"
309
+ - name: sonar-reasoning
310
+ context: 131072
311
+ cost_in: 5.00
312
+ cost_out: 5.00
313
+ desc: "搜索+推理"
314
+ - name: sonar-reasoning-pro
315
+ context: 131072
316
+ cost_in: 2.00
317
+ cost_out: 8.00
318
+ desc: "搜索+推理专业版"
319
+
320
+ # ═══════════════════════════════════════════
321
+ # Fireworks AI
322
+ # ═══════════════════════════════════════════
323
+ fireworks:
324
+ - name: accounts/fireworks/models/llama-v3p1-405b-instruct
325
+ context: 131072
326
+ cost_in: 3.00
327
+ cost_out: 3.00
328
+ desc: "Llama 3.1 405B"
329
+ - name: accounts/fireworks/models/llama-v3p1-70b-instruct
330
+ context: 131072
331
+ cost_in: 0.90
332
+ cost_out: 0.90
333
+ desc: "Llama 3.1 70B"
334
+ - name: accounts/fireworks/models/mixtral-8x22b-instruct
335
+ context: 65536
336
+ cost_in: 1.20
337
+ cost_out: 1.20
338
+ desc: "Mixtral 8x22B"
339
+ - name: accounts/fireworks/models/qwen2p5-72b-instruct
340
+ context: 32768
341
+ cost_in: 0.90
342
+ cost_out: 0.90
343
+ desc: "Qwen 2.5 72B"
344
+
345
+ # ═══════════════════════════════════════════
346
+ # Together AI
347
+ # ═══════════════════════════════════════════
348
+ together:
349
+ - name: meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo
350
+ context: 32768
351
+ cost_in: 3.50
352
+ cost_out: 3.50
353
+ desc: "Llama 3.1 405B Turbo"
354
+ - name: meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo
355
+ context: 32768
356
+ cost_in: 0.88
357
+ cost_out: 0.88
358
+ desc: "Llama 3.1 70B Turbo"
359
+ - name: meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo
360
+ context: 32768
361
+ cost_in: 0.18
362
+ cost_out: 0.18
363
+ desc: "Llama 3.1 8B Turbo"
364
+ - name: Qwen/Qwen2.5-72B-Instruct-Turbo
365
+ context: 32768
366
+ cost_in: 1.20
367
+ cost_out: 1.20
368
+ desc: "Qwen 2.5 72B Turbo"
369
+ - name: deepseek-ai/DeepSeek-V3
370
+ context: 32768
371
+ cost_in: 1.25
372
+ cost_out: 1.25
373
+ desc: "DeepSeek V3"
374
+ - name: deepseek-ai/DeepSeek-R1
375
+ context: 32768
376
+ cost_in: 7.00
377
+ cost_out: 7.00
378
+ desc: "DeepSeek R1"
379
+
380
+ # ═══════════════════════════════════════════
381
+ # OpenRouter (多模型聚合)
382
+ # ═══════════════════════════════════════════
383
+ openrouter:
384
+ - name: openai/gpt-4.1
385
+ context: 1048576
386
+ cost_in: 2.00
387
+ cost_out: 8.00
388
+ desc: "通过OpenRouter"
389
+ - name: openai/gpt-4o
390
+ context: 131072
391
+ cost_in: 2.50
392
+ cost_out: 10.00
393
+ desc: "通过OpenRouter"
394
+ - name: openai/gpt-4o-mini
395
+ context: 131072
396
+ cost_in: 0.15
397
+ cost_out: 0.60
398
+ desc: "通过OpenRouter"
399
+ - name: anthropic/claude-sonnet-4-6
400
+ context: 204800
401
+ cost_in: 3.00
402
+ cost_out: 15.00
403
+ desc: "通过OpenRouter"
404
+ - name: anthropic/claude-opus-4-7
405
+ context: 204800
406
+ cost_in: 5.00
407
+ cost_out: 25.00
408
+ desc: "通过OpenRouter"
409
+ - name: google/gemini-2.5-pro
410
+ context: 1048576
411
+ cost_in: 1.25
412
+ cost_out: 10.00
413
+ desc: "通过OpenRouter"
414
+ - name: google/gemini-2.5-flash
415
+ context: 1048576
416
+ cost_in: 0.30
417
+ cost_out: 2.50
418
+ desc: "通过OpenRouter"
419
+ - name: meta-llama/llama-4-maverick
420
+ context: 131072
421
+ cost_in: 0.20
422
+ cost_out: 0.60
423
+ desc: "Meta旗舰"
424
+ - name: meta-llama/llama-3.1-405b-instruct
425
+ context: 32768
426
+ cost_in: 2.50
427
+ cost_out: 2.50
428
+ desc: "Llama 3.1 405B"
429
+ - name: deepseek/deepseek-chat
430
+ context: 131072
431
+ cost_in: 0.27
432
+ cost_out: 1.10
433
+ desc: "通过OpenRouter"
434
+ - name: deepseek/deepseek-r1
435
+ context: 131072
436
+ cost_in: 0.55
437
+ cost_out: 2.19
438
+ desc: "通过OpenRouter"
439
+ - name: x-ai/grok-4
440
+ context: 131072
441
+ cost_in: 3.00
442
+ cost_out: 15.00
443
+ desc: "通过OpenRouter"
444
+ - name: mistralai/mistral-large
445
+ context: 131072
446
+ cost_in: 2.00
447
+ cost_out: 6.00
448
+ desc: "通过OpenRouter"
449
+
450
+ # ═══════════════════════════════════════════
451
+ # 通义千问 / Qwen (阿里云)
452
+ # ═══════════════════════════════════════════
453
+ qwen:
454
+ - name: qwen-max
455
+ context: 32768
456
+ cost_in: 2.80
457
+ cost_out: 8.40
458
+ desc: "通义千问旗舰"
459
+ - name: qwen-plus
460
+ context: 131072
461
+ cost_in: 0.56
462
+ cost_out: 1.68
463
+ desc: "通义千问增强版"
464
+ - name: qwen-turbo
465
+ context: 131072
466
+ cost_in: 0.084
467
+ cost_out: 0.252
468
+ desc: "通义千问快速版"
469
+ - name: qwen-long
470
+ context: 1000000
471
+ cost_in: 0.07
472
+ cost_out: 0.28
473
+ desc: "百万上下文"
474
+ - name: qwen-vl-max
475
+ context: 32768
476
+ cost_in: 2.80
477
+ cost_out: 8.40
478
+ desc: "视觉理解旗舰"
479
+ - name: qwen-vl-plus
480
+ context: 32768
481
+ cost_in: 0.56
482
+ cost_out: 1.68
483
+ desc: "视觉理解增强"
484
+ - name: qwen-coder-plus
485
+ context: 131072
486
+ cost_in: 0.56
487
+ cost_out: 1.68
488
+ desc: "代码专用增强"
489
+ - name: qwen-coder-turbo
490
+ context: 131072
491
+ cost_in: 0.084
492
+ cost_out: 0.252
493
+ desc: "代码专用快速"
494
+ - name: qwq-plus
495
+ context: 131072
496
+ cost_in: 0.56
497
+ cost_out: 1.68
498
+ desc: "推理增强版"
499
+
500
+ # ═══════════════════════════════════════════
501
+ # 智谱 AI / GLM
502
+ # ═══════════════════════════════════════════
503
+ zhipu:
504
+ - name: glm-4-plus
505
+ context: 131072
506
+ cost_in: 7.00
507
+ cost_out: 7.00
508
+ desc: "智谱旗舰"
509
+ - name: glm-4
510
+ context: 131072
511
+ cost_in: 14.00
512
+ cost_out: 14.00
513
+ desc: "智谱标准版"
514
+ - name: glm-4-flash
515
+ context: 131072
516
+ cost_in: 0
517
+ cost_out: 0
518
+ desc: "智谱免费版"
519
+ - name: glm-4-air
520
+ context: 131072
521
+ cost_in: 1.40
522
+ cost_out: 1.40
523
+ desc: "智谱Air版"
524
+ - name: glm-4-airx
525
+ context: 131072
526
+ cost_in: 14.00
527
+ cost_out: 14.00
528
+ desc: "智谱AirX版"
529
+ - name: glm-4-long
530
+ context: 1000000
531
+ cost_in: 1.40
532
+ cost_out: 1.40
533
+ desc: "智谱长上下文"
534
+ - name: glm-4-flashx
535
+ context: 131072
536
+ cost_in: 0
537
+ cost_out: 0
538
+ desc: "智谱FlashX免费"
539
+ - name: glm-4v-plus
540
+ context: 8192
541
+ cost_in: 14.00
542
+ cost_out: 14.00
543
+ desc: "智谱视觉旗舰"
544
+ - name: glm-4v-flash
545
+ context: 8192
546
+ cost_in: 0
547
+ cost_out: 0
548
+ desc: "智谱视觉免费"
549
+ - name: glm-z1-air
550
+ context: 131072
551
+ cost_in: 1.40
552
+ cost_out: 1.40
553
+ desc: "智谱推理Air"
554
+ - name: glm-z1-flash
555
+ context: 131072
556
+ cost_in: 0
557
+ cost_out: 0
558
+ desc: "智谱推理免费"
559
+
560
+ # ═══════════════════════════════════════════
561
+ # 零一万物 / 01.AI (Yi)
562
+ # ═══════════════════════════════════════════
563
+ lingyiwanwu:
564
+ - name: yi-large
565
+ context: 32768
566
+ cost_in: 2.80
567
+ cost_out: 2.80
568
+ desc: "零一万物旗舰"
569
+ - name: yi-large-turbo
570
+ context: 16384
571
+ cost_in: 1.68
572
+ cost_out: 1.68
573
+ desc: "零一万物快速"
574
+ - name: yi-large-rag
575
+ context: 16384
576
+ cost_in: 3.50
577
+ cost_out: 3.50
578
+ desc: "零一万物RAG"
579
+ - name: yi-medium
580
+ context: 16384
581
+ cost_in: 0.35
582
+ cost_out: 0.35
583
+ desc: "零一万物中等"
584
+ - name: yi-spark
585
+ context: 16384
586
+ cost_in: 0.14
587
+ cost_out: 0.14
588
+ desc: "零一万物轻量"
589
+ - name: yi-vision
590
+ context: 16384
591
+ cost_in: 0.84
592
+ cost_out: 0.84
593
+ desc: "零一万物视觉"
594
+
595
+ # ═══════════════════════════════════════════
596
+ # MiniMax
597
+ # ═══════════════════════════════════════════
598
+ minimax:
599
+ - name: MiniMax-Text-01
600
+ context: 1000000
601
+ cost_in: 0.14
602
+ cost_out: 1.12
603
+ desc: "MiniMax旗舰,百万上下文"
604
+ - name: abab6.5s-chat
605
+ context: 245760
606
+ cost_in: 0.14
607
+ cost_out: 0.14
608
+ desc: "MiniMax 6.5s"
609
+ - name: abab5.5s-chat
610
+ context: 8192
611
+ cost_in: 0.21
612
+ cost_out: 0.21
613
+ desc: "MiniMax 5.5s"
614
+
615
+ # ═══════════════════════════════════════════
616
+ # 月之暗面 / Moonshot
617
+ # ═══════════════════════════════════════════
618
+ moonshot:
619
+ - name: moonshot-v1-128k
620
+ context: 131072
621
+ cost_in: 8.40
622
+ cost_out: 8.40
623
+ desc: "Moonshot 128K"
624
+ - name: moonshot-v1-32k
625
+ context: 32768
626
+ cost_in: 3.36
627
+ cost_out: 3.36
628
+ desc: "Moonshot 32K"
629
+ - name: moonshot-v1-8k
630
+ context: 8192
631
+ cost_in: 1.68
632
+ cost_out: 1.68
633
+ desc: "Moonshot 8K"
634
+ - name: kimi-latest
635
+ context: 131072
636
+ cost_in: 1.68
637
+ cost_out: 1.68
638
+ desc: "Kimi最新模型"
639
+
640
+ # ═══════════════════════════════════════════
641
+ # 百度 / 文心一言
642
+ # ═══════════════════════════════════════════
643
+ baidu:
644
+ - name: ernie-4.0-8k
645
+ context: 8192
646
+ cost_in: 4.20
647
+ cost_out: 12.60
648
+ desc: "文心4.0旗舰"
649
+ - name: ernie-3.5-8k
650
+ context: 8192
651
+ cost_in: 1.68
652
+ cost_out: 1.68
653
+ desc: "文心3.5标准"
654
+ - name: ernie-speed-8k
655
+ context: 8192
656
+ cost_in: 0
657
+ cost_out: 0
658
+ desc: "文心Speed免费"
659
+ - name: ernie-lite-8k
660
+ context: 8192
661
+ cost_in: 0
662
+ cost_out: 0
663
+ desc: "文心Lite免费"
664
+ - name: ernie-tiny-8k
665
+ context: 8192
666
+ cost_in: 0
667
+ cost_out: 0
668
+ desc: "文心Tiny免费"
669
+ - name: ernie-4.0-turbo-8k
670
+ context: 8192
671
+ cost_in: 4.20
672
+ cost_out: 12.60
673
+ desc: "文心4.0 Turbo"
674
+ - name: ernie-4.0-turbo-128k
675
+ context: 131072
676
+ cost_in: 4.20
677
+ cost_out: 12.60
678
+ desc: "文心4.0 Turbo 128K"
679
+
680
+ # ═══════════════════════════════════════════
681
+ # 百川智能 / Baichuan
682
+ # ═══════════════════════════════════════════
683
+ baichuan:
684
+ - name: baichuan4
685
+ context: 32768
686
+ cost_in: 14.00
687
+ cost_out: 14.00
688
+ desc: "百川4旗舰"
689
+ - name: baichuan3-turbo
690
+ context: 32768
691
+ cost_in: 0.98
692
+ cost_out: 0.98
693
+ desc: "百川3 Turbo"
694
+ - name: baichuan2-turbo
695
+ context: 32768
696
+ cost_in: 0.56
697
+ cost_out: 0.56
698
+ desc: "百川2 Turbo"
699
+
700
+ # ═══════════════════════════════════════════
701
+ # 阶跃星辰 / StepFun
702
+ # ═══════════════════════════════════════════
703
+ stepfun:
704
+ - name: step-2-16k
705
+ context: 16384
706
+ cost_in: 1.40
707
+ cost_out: 1.40
708
+ desc: "阶跃2代 16K"
709
+ - name: step-1-128k
710
+ context: 131072
711
+ cost_in: 2.80
712
+ cost_out: 2.80
713
+ desc: "阶跃1代 128K"
714
+ - name: step-1-32k
715
+ context: 32768
716
+ cost_in: 0.70
717
+ cost_out: 0.70
718
+ desc: "阶跃1代 32K"
719
+ - name: step-1-flash
720
+ context: 8192
721
+ cost_in: 0.14
722
+ cost_out: 0.14
723
+ desc: "阶跃1代 Flash"
724
+ - name: step-1v-8k
725
+ context: 8192
726
+ cost_in: 0.70
727
+ cost_out: 0.70
728
+ desc: "阶跃视觉 8K"
729
+
730
+ # ═══════════════════════════════════════════
731
+ # Reka
732
+ # ═══════════════════════════════════════════
733
+ reka:
734
+ - name: reka-core
735
+ context: 131072
736
+ cost_in: 3.00
737
+ cost_out: 15.00
738
+ desc: "Reka旗舰多模态"
739
+ - name: reka-flash
740
+ context: 131072
741
+ cost_in: 0.80
742
+ cost_out: 2.00
743
+ desc: "Reka快速多模态"
744
+ - name: reka-edge
745
+ context: 131072
746
+ cost_in: 0.40
747
+ cost_out: 1.00
748
+ desc: "Reka轻量多模态"
749
+
750
+ # ═══════════════════════════════════════════
751
+ # Nvidia (NIM)
752
+ # ═══════════════════════════════════════════
753
+ nvidia:
754
+ - name: nemotron-4-340b-instruct
755
+ context: 4096
756
+ cost_in: 0
757
+ cost_out: 0
758
+ desc: "Nvidia Nemotron 340B 免费"
759
+ - name: meta/llama-3.1-405b-instruct
760
+ context: 131072
761
+ cost_in: 0
762
+ cost_out: 0
763
+ desc: "Llama 3.1 405B 免费"
764
+ - name: meta/llama-3.1-70b-instruct
765
+ context: 131072
766
+ cost_in: 0
767
+ cost_out: 0
768
+ desc: "Llama 3.1 70B 免费"
769
+ - name: meta/llama-3.1-8b-instruct
770
+ context: 131072
771
+ cost_in: 0
772
+ cost_out: 0
773
+ desc: "Llama 3.1 8B 免费"
774
+ - name: qwen/qwen2.5-72b-instruct
775
+ context: 32768
776
+ cost_in: 0
777
+ cost_out: 0
778
+ desc: "Qwen 2.5 72B 免费"
779
+ - name: google/gemma-2-9b-it
780
+ context: 8192
781
+ cost_in: 0
782
+ cost_out: 0
783
+ desc: "Gemma 2 9B 免费"
784
+ - name: mistralai/mixtral-8x22b-instruct-v0.1
785
+ context: 65536
786
+ cost_in: 0
787
+ cost_out: 0
788
+ desc: "Mixtral 8x22B 免费"
789
+ - name: mistralai/mistral-large-2
790
+ context: 131072
791
+ cost_in: 0
792
+ cost_out: 0
793
+ desc: "Mistral Large 2 免费"
794
+
795
+ # ═══════════════════════════════════════════
796
+ # SambaNova
797
+ # ═══════════════════════════════════════════
798
+ sambanova:
799
+ - name: Meta-Llama-3.1-405B-Instruct
800
+ context: 8192
801
+ cost_in: 0
802
+ cost_out: 0
803
+ desc: "Llama 3.1 405B 免费"
804
+ - name: Meta-Llama-3.1-70B-Instruct
805
+ context: 131072
806
+ cost_in: 0
807
+ cost_out: 0
808
+ desc: "Llama 3.1 70B 免费"
809
+ - name: Meta-Llama-3.1-8B-Instruct
810
+ context: 131072
811
+ cost_in: 0
812
+ cost_out: 0
813
+ desc: "Llama 3.1 8B 免费"
814
+ - name: Qwen2.5-72B-Instruct
815
+ context: 8192
816
+ cost_in: 0
817
+ cost_out: 0
818
+ desc: "Qwen 2.5 72B 免费"
819
+
820
+ # ═══════════════════════════════════════════
821
+ # Ollama (本地部署)
822
+ # ═══════════════════════════════════════════
823
+ ollama:
824
+ - name: llama3.3
825
+ context: 131072
826
+ cost_in: 0
827
+ cost_out: 0
828
+ desc: "Llama 3.3 70B"
829
+ - name: llama3.2
830
+ context: 131072
831
+ cost_in: 0
832
+ cost_out: 0
833
+ desc: "Llama 3.2"
834
+ - name: llama3.1
835
+ context: 131072
836
+ cost_in: 0
837
+ cost_out: 0
838
+ desc: "Llama 3.1"
839
+ - name: llama3
840
+ context: 8192
841
+ cost_in: 0
842
+ cost_out: 0
843
+ desc: "Llama 3"
844
+ - name: qwen2.5
845
+ context: 32768
846
+ cost_in: 0
847
+ cost_out: 0
848
+ desc: "通义千问 2.5"
849
+ - name: qwen2.5-coder
850
+ context: 32768
851
+ cost_in: 0
852
+ cost_out: 0
853
+ desc: "通义千问代码版"
854
+ - name: deepseek-r1
855
+ context: 32768
856
+ cost_in: 0
857
+ cost_out: 0
858
+ desc: "DeepSeek R1 本地推理"
859
+ - name: deepseek-v3
860
+ context: 32768
861
+ cost_in: 0
862
+ cost_out: 0
863
+ desc: "DeepSeek V3 本地"
864
+ - name: mistral
865
+ context: 8192
866
+ cost_in: 0
867
+ cost_out: 0
868
+ desc: "Mistral 7B"
869
+ - name: mixtral
870
+ context: 32768
871
+ cost_in: 0
872
+ cost_out: 0
873
+ desc: "Mixtral 8x7B"
874
+ - name: gemma2
875
+ context: 8192
876
+ cost_in: 0
877
+ cost_out: 0
878
+ desc: "Google Gemma 2"
879
+ - name: phi4
880
+ context: 16384
881
+ cost_in: 0
882
+ cost_out: 0
883
+ desc: "Microsoft Phi-4"
884
+ - name: codellama
885
+ context: 16384
886
+ cost_in: 0
887
+ cost_out: 0
888
+ desc: "Code Llama"
889
+ - name: nomic-embed-text
890
+ context: 8192
891
+ cost_in: 0
892
+ cost_out: 0
893
+ desc: "Nomic 嵌入模型"
894
+ - name: mxbai-embed-large
895
+ context: 512
896
+ cost_in: 0
897
+ cost_out: 0
898
+ desc: "MXBAI 嵌入模型"
899
+
900
+ # ═══════════════════════════════════════════
901
+ # LM Studio (本地 OpenAI 兼容)
902
+ # ═══════════════════════════════════════════
903
+ lmstudio:
904
+ - name: local-model
905
+ context: 8192
906
+ cost_in: 0
907
+ cost_out: 0
908
+ desc: "LM Studio 本地模型"
909
+
910
+ # ═══════════════════════════════════════════
911
+ # vLLM (自托管 OpenAI 兼容)
912
+ # ═══════════════════════════════════════════
913
+ vllm:
914
+ - name: local-model
915
+ context: 8192
916
+ cost_in: 0
917
+ cost_out: 0
918
+ desc: "vLLM 自托管模型"
919
+
920
+ # ═══════════════════════════════════════════
921
+ # LiteLLM Proxy (自托管)
922
+ # ═══════════════════════════════════════════
923
+ litellm:
924
+ - name: local-model
925
+ context: 8192
926
+ cost_in: 0
927
+ cost_out: 0
928
+ desc: "LiteLLM 代理模型"