@ssweens/pi-vertex 1.1.10 → 1.1.13
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +9 -0
- package/README.md +14 -8
- package/TEST_COVERAGE.md +1 -0
- package/index.ts +2 -1
- package/models/claude.ts +54 -0
- package/models/maas.ts +21 -2
- package/package.json +1 -1
package/CHANGELOG.md
CHANGED
|
@@ -2,6 +2,15 @@
|
|
|
2
2
|
|
|
3
3
|
All notable changes to this project will be documented in this file.
|
|
4
4
|
|
|
5
|
+
## [1.1.13] - 2026-06-09
|
|
6
|
+
### Added
|
|
7
|
+
- **Claude Fable 5** (`claude-fable-5`) — Anthropic's first public Mythos-class model, positioned above Opus 4.8. 1M context, 128K max output, text/image/file input, reasoning (adaptive thinking always on), tools. $10/$50 per 1M tokens (global), $1/1M cache read, 10% regional premium. Available on Vertex AI Model Garden.
|
|
8
|
+
|
|
9
|
+
## [1.1.12] - 2026-06-03
|
|
10
|
+
### Added
|
|
11
|
+
- **Claude Opus 4.8** (`claude-opus-4-8`) — added the new Vertex/Gemini Enterprise Agent Platform Anthropic partner model with 1M context, 128K max output tokens, and the same published global/regional pricing tier used by Opus 4.7.
|
|
12
|
+
- **Grok 4.3** (`grok-4.3`) — added the new Vertex/Gemini Enterprise Agent Platform xAI partner model with 1M context, 32,768 max output tokens (conservative default), and the published Google pricing tier for Grok 4.3.
|
|
13
|
+
|
|
5
14
|
## [1.1.10] - 2026-05-28
|
|
6
15
|
### Fixed
|
|
7
16
|
- Switched `registerProvider("vertex")` `apiKey` from legacy env-var shorthand (`"GOOGLE_CLOUD_PROJECT"`) to explicit env syntax (`"$GOOGLE_CLOUD_PROJECT"`). This removes deprecation warnings and future-proofs provider registration against upcoming removal of implicit env-var detection.
|
package/README.md
CHANGED
|
@@ -15,11 +15,11 @@ Set your GCP project and credentials. Vertex AI models (Gemini, Claude, Llama, D
|
|
|
15
15
|
|
|
16
16
|
## Features
|
|
17
17
|
|
|
18
|
-
- **
|
|
18
|
+
- **46 models** across 4 categories:
|
|
19
19
|
- **Gemini** (9): 3.1 Pro, 3.1 Flash-Lite, 3 Flash, 2.5 Pro, 2.5 Flash, 2.5 Flash-Lite, 2.0 Flash, 2.0 Flash-Lite
|
|
20
|
-
- **Claude** (
|
|
20
|
+
- **Claude** (12): Fable 5, Opus 4.8, Opus 4.7, Opus 4.6, Sonnet 4.6, Opus/Sonnet/Haiku 4.5, Opus 4.1, Opus 4, Sonnet 4, 3.5 Sonnet v2
|
|
21
21
|
- **Llama** (3): 4 Maverick, 4 Scout, 3.3 70B
|
|
22
|
-
- **Other MaaS** (
|
|
22
|
+
- **Other MaaS** (22): Grok 4.3, Grok 4.20, Grok 4.1 Fast, Gemma, Mistral, DeepSeek, Qwen, OpenAI GPT-OSS, Kimi, MiniMax, GLM
|
|
23
23
|
|
|
24
24
|
- **Unified streaming**: Single provider, multiple model families
|
|
25
25
|
- **Full tool calling support**: All models with multi-turn tool use and proper tool result handling
|
|
@@ -86,7 +86,8 @@ pi --provider vertex --model gemini-2.5-pro --version
|
|
|
86
86
|
|
|
87
87
|
```bash
|
|
88
88
|
# Use any supported model
|
|
89
|
-
pi --provider vertex --model claude-opus-4-
|
|
89
|
+
pi --provider vertex --model claude-opus-4-8
|
|
90
|
+
pi --provider vertex --model grok-4.3
|
|
90
91
|
pi --provider vertex --model gemini-2.5-pro
|
|
91
92
|
pi --provider vertex --model llama-4-maverick
|
|
92
93
|
pi --provider vertex --model deepseek-v3.2
|
|
@@ -100,8 +101,11 @@ pi --provider vertex --model claude-sonnet-4-6 --reasoning high
|
|
|
100
101
|
Add to `~/.bashrc` or `~/.zshrc`:
|
|
101
102
|
|
|
102
103
|
```bash
|
|
103
|
-
# Claude 4.
|
|
104
|
-
alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-
|
|
104
|
+
# Claude 4.8 Opus
|
|
105
|
+
alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-8"
|
|
106
|
+
|
|
107
|
+
# Grok 4.3
|
|
108
|
+
alias pig4="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model grok-4.3"
|
|
105
109
|
|
|
106
110
|
# Gemini 2.5 Pro
|
|
107
111
|
alias pig="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model gemini-2.5-pro"
|
|
@@ -132,6 +136,7 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
|
|
|
132
136
|
|
|
133
137
|
| Model | Context | Max Tokens | Input | Reasoning | Price global (in/out) | Price regional (in/out) |
|
|
134
138
|
|-------|---------|------------|-------|-----------|----------------------|------------------------|
|
|
139
|
+
| claude-opus-4-8 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
135
140
|
| claude-opus-4-7 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
136
141
|
| claude-opus-4-6 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
137
142
|
| claude-sonnet-4-6 | 1M | 128,000 | text, image | ✅ | $3.00/$15.00 | $3.30/$16.50 |
|
|
@@ -173,8 +178,9 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
|
|
|
173
178
|
| minimax-m2 | 196K | minimaxai | $0.30/$1.20 | global |
|
|
174
179
|
| glm-5 | 200K | zai-org | $1.00/$3.20 | global |
|
|
175
180
|
| glm-4.7 | 200K | zai-org | $0.60/$2.20 | global |
|
|
176
|
-
| grok-4.
|
|
177
|
-
| grok-4.
|
|
181
|
+
| grok-4.3 | 1M | xai | $1.25/$2.50 | global |
|
|
182
|
+
| grok-4.20-reasoning | 1M | xai | $1.25/$2.50 | global |
|
|
183
|
+
| grok-4.1-fast-reasoning | 2M | xai | $0.20/$0.50 | global |
|
|
178
184
|
| gemma-4-26b-a4b-it | 262K | google | $0.15/$0.60 | global |
|
|
179
185
|
|
|
180
186
|
## Regional Endpoints
|
package/TEST_COVERAGE.md
CHANGED
|
@@ -7,6 +7,7 @@
|
|
|
7
7
|
## Manual Verification
|
|
8
8
|
- Claude 4.6 streaming verified via Anthropic Vertex SDK.
|
|
9
9
|
- Mid-session model switching (tool call replay) verified interactively in pi.
|
|
10
|
+
- Registry sanity checks verified locally for `claude-opus-4-8` and `grok-4.3` after model additions.
|
|
10
11
|
|
|
11
12
|
## Gaps / Next Steps
|
|
12
13
|
- Add automated integration tests for Anthropic Vertex streaming and tool replay.
|
package/index.ts
CHANGED
|
@@ -21,7 +21,8 @@
|
|
|
21
21
|
* GOOGLE_APPLICATION_CREDENTIALS (optional, for service account auth)
|
|
22
22
|
*
|
|
23
23
|
* Usage:
|
|
24
|
-
* pi --provider vertex --model claude-opus-4-
|
|
24
|
+
* pi --provider vertex --model claude-opus-4-8
|
|
25
|
+
* pi --provider vertex --model grok-4.3
|
|
25
26
|
* pi --provider vertex --model gemini-2.5-pro
|
|
26
27
|
* pi --provider vertex --model llama-4-maverick
|
|
27
28
|
*/
|
package/models/claude.ts
CHANGED
|
@@ -11,6 +11,60 @@
|
|
|
11
11
|
import type { VertexModelConfig } from "../types.js";
|
|
12
12
|
|
|
13
13
|
export const CLAUDE_MODELS: VertexModelConfig[] = [
|
|
14
|
+
// Claude Fable 5 (Mythos-class)
|
|
15
|
+
{
|
|
16
|
+
id: "claude-fable-5",
|
|
17
|
+
name: "Claude Fable 5",
|
|
18
|
+
apiId: "claude-fable-5",
|
|
19
|
+
publisher: "anthropic",
|
|
20
|
+
endpointType: "maas",
|
|
21
|
+
contextWindow: 1000000,
|
|
22
|
+
maxTokens: 128000,
|
|
23
|
+
input: ["text", "image", "file"],
|
|
24
|
+
reasoning: true,
|
|
25
|
+
tools: true,
|
|
26
|
+
cost: {
|
|
27
|
+
input: 10.00,
|
|
28
|
+
output: 50.00,
|
|
29
|
+
cacheRead: 1.00,
|
|
30
|
+
cacheWrite: 12.50,
|
|
31
|
+
},
|
|
32
|
+
costRegional: {
|
|
33
|
+
input: 11.00,
|
|
34
|
+
output: 55.00,
|
|
35
|
+
cacheRead: 1.10,
|
|
36
|
+
cacheWrite: 13.75,
|
|
37
|
+
},
|
|
38
|
+
region: "global",
|
|
39
|
+
},
|
|
40
|
+
|
|
41
|
+
// Claude 4.8 series
|
|
42
|
+
{
|
|
43
|
+
id: "claude-opus-4-8",
|
|
44
|
+
name: "Claude Opus 4.8",
|
|
45
|
+
apiId: "claude-opus-4-8",
|
|
46
|
+
publisher: "anthropic",
|
|
47
|
+
endpointType: "maas",
|
|
48
|
+
contextWindow: 1000000,
|
|
49
|
+
maxTokens: 128000,
|
|
50
|
+
input: ["text", "image"],
|
|
51
|
+
reasoning: true,
|
|
52
|
+
tools: true,
|
|
53
|
+
cost: {
|
|
54
|
+
input: 5.00,
|
|
55
|
+
output: 25.00,
|
|
56
|
+
cacheRead: 0.50,
|
|
57
|
+
cacheWrite: 6.25,
|
|
58
|
+
},
|
|
59
|
+
costRegional: {
|
|
60
|
+
input: 5.50,
|
|
61
|
+
output: 27.50,
|
|
62
|
+
cacheRead: 0.55,
|
|
63
|
+
cacheWrite: 6.875,
|
|
64
|
+
},
|
|
65
|
+
region: "global",
|
|
66
|
+
},
|
|
67
|
+
|
|
14
68
|
// Claude 4.7 series
|
|
15
69
|
{
|
|
16
70
|
id: "claude-opus-4-7",
|
package/models/maas.ts
CHANGED
|
@@ -9,13 +9,32 @@ import type { VertexModelConfig } from "../types.js";
|
|
|
9
9
|
|
|
10
10
|
export const MAAS_MODELS: VertexModelConfig[] = [
|
|
11
11
|
// --- xAI Grok ---
|
|
12
|
+
{
|
|
13
|
+
id: "grok-4.3",
|
|
14
|
+
name: "Grok 4.3",
|
|
15
|
+
apiId: "grok-4.3",
|
|
16
|
+
publisher: "xai",
|
|
17
|
+
endpointType: "maas",
|
|
18
|
+
contextWindow: 1000000,
|
|
19
|
+
maxTokens: 32768,
|
|
20
|
+
input: ["text", "image"],
|
|
21
|
+
reasoning: true,
|
|
22
|
+
tools: true,
|
|
23
|
+
cost: {
|
|
24
|
+
input: 1.25,
|
|
25
|
+
output: 2.50,
|
|
26
|
+
cacheRead: 0.20,
|
|
27
|
+
cacheWrite: 0,
|
|
28
|
+
},
|
|
29
|
+
region: "global",
|
|
30
|
+
},
|
|
12
31
|
{
|
|
13
32
|
id: "grok-4.20-reasoning",
|
|
14
33
|
name: "Grok 4.20 Reasoning",
|
|
15
34
|
apiId: "grok-4.20-reasoning",
|
|
16
35
|
publisher: "xai",
|
|
17
36
|
endpointType: "maas",
|
|
18
|
-
contextWindow:
|
|
37
|
+
contextWindow: 1000000,
|
|
19
38
|
maxTokens: 32000,
|
|
20
39
|
input: ["text", "image"],
|
|
21
40
|
reasoning: true,
|
|
@@ -34,7 +53,7 @@ export const MAAS_MODELS: VertexModelConfig[] = [
|
|
|
34
53
|
apiId: "grok-4.1-fast-reasoning",
|
|
35
54
|
publisher: "xai",
|
|
36
55
|
endpointType: "maas",
|
|
37
|
-
contextWindow:
|
|
56
|
+
contextWindow: 2000000,
|
|
38
57
|
maxTokens: 32000,
|
|
39
58
|
input: ["text", "image"],
|
|
40
59
|
reasoning: true,
|