@aliou/pi-synthetic 0.18.3 → 0.19.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@aliou/pi-synthetic",
3
- "version": "0.18.3",
3
+ "version": "0.19.0",
4
4
  "license": "MIT",
5
5
  "type": "module",
6
6
  "private": false,
@@ -33,11 +33,11 @@ export type SyntheticModelEntry =
33
33
  | SyntheticModelAliasConfig;
34
34
 
35
35
  export const SYNTHETIC_MODELS: SyntheticModelEntry[] = [
36
- // API: syn:large:text → alias for hf:zai-org/GLM-5.1
36
+ // API: syn:large:text → alias for hf:zai-org/GLM-5.2
37
37
  {
38
38
  id: "syn:large:text",
39
39
  name: "syn:large:text",
40
- aliasFor: "hf:zai-org/GLM-5.1",
40
+ aliasFor: "hf:zai-org/GLM-5.2",
41
41
  },
42
42
  // API: syn:small:text → alias for hf:zai-org/GLM-4.7-Flash
43
43
  {
@@ -112,6 +112,44 @@ export const SYNTHETIC_MODELS: SyntheticModelEntry[] = [
112
112
  contextWindow: 196608,
113
113
  maxTokens: 65536,
114
114
  },
115
+ // API: hf:zai-org/GLM-5.2 → ctx=524288, out=65536
116
+ // Reasoning: GLM-5.2 has only two effective levels — `max` (default, highest) and `high`
117
+ // (lower). Per the GLM-5.2 chat template: unset -> max; "high" -> high; every other value
118
+ // ("low", "medium", ...) falls through to max. So `max > high`.
119
+ // (https://docs.sglang.io/cookbook/autoregressive/GLM/GLM-5.2#hw=h200&variant=default&quant=fp8&strategy=low-latency&nodes=single)
120
+ //
121
+ // The Synthetic OpenAI shim validates `reasoning_effort` against the OpenAI enum and rejects
122
+ // literal `max` (`xhigh` is rejected as well). To expose both tiers through Pi we map:
123
+ // off -> "none" (disable thinking)
124
+ // high -> "high" (High, lower)
125
+ // xhigh -> "medium" (falls through to Max, highest)
126
+ // minimal/low/medium are hidden (null) so Pi's named levels aren't remapped unexpectedly.
127
+ {
128
+ id: "hf:zai-org/GLM-5.2",
129
+ name: "zai-org/GLM-5.2",
130
+ provider: "synthetic",
131
+ reasoning: true,
132
+ thinkingLevelMap: {
133
+ off: "none",
134
+ minimal: null,
135
+ low: null,
136
+ medium: null,
137
+ high: "high",
138
+ xhigh: "medium",
139
+ },
140
+ compat: {
141
+ supportsReasoningEffort: true,
142
+ },
143
+ input: ["text"],
144
+ cost: {
145
+ input: 1.4,
146
+ output: 4.4,
147
+ cacheRead: 1.4,
148
+ cacheWrite: 0,
149
+ },
150
+ contextWindow: 524288,
151
+ maxTokens: 65536,
152
+ },
115
153
  // API: hf:zai-org/GLM-4.7-Flash → ctx=196608
116
154
  {
117
155
  id: "hf:zai-org/GLM-4.7-Flash",
@@ -236,10 +274,10 @@ export const SYNTHETIC_MODELS: SyntheticModelEntry[] = [
236
274
  contextWindow: 262144,
237
275
  maxTokens: 65536,
238
276
  },
239
- // API: hf:MiniMaxAI/MiniMax-M2.5 → ctx=191488, out=65536
277
+ // API: hf:MiniMaxAI/MiniMax-M3 → ctx=524288, out=65536
240
278
  {
241
- id: "hf:MiniMaxAI/MiniMax-M2.5",
242
- name: "MiniMaxAI/MiniMax-M2.5",
279
+ id: "hf:MiniMaxAI/MiniMax-M3",
280
+ name: "MiniMaxAI/MiniMax-M3",
243
281
  provider: "synthetic",
244
282
  reasoning: true,
245
283
  thinkingLevelMap: {
@@ -250,19 +288,19 @@ export const SYNTHETIC_MODELS: SyntheticModelEntry[] = [
250
288
  high: null,
251
289
  xhigh: null,
252
290
  },
253
- input: ["text"],
254
- cost: {
255
- input: 0.4,
256
- output: 2,
257
- cacheRead: 0.4,
258
- cacheWrite: 0,
259
- },
260
- contextWindow: 191488,
261
- maxTokens: 65536,
262
291
  compat: {
263
292
  supportsReasoningEffort: true,
264
293
  maxTokensField: "max_completion_tokens",
265
294
  },
295
+ input: ["text", "image"],
296
+ cost: {
297
+ input: 0.6,
298
+ output: 1.2,
299
+ cacheRead: 0.6,
300
+ cacheWrite: 0,
301
+ },
302
+ contextWindow: 524288,
303
+ maxTokens: 65536,
266
304
  },
267
305
  // API: hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4 → ctx=262144, out=65536
268
306
  {