@ssweens/pi-vertex 1.1.9 → 1.1.12
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +9 -0
- package/README.md +14 -8
- package/TEST_COVERAGE.md +1 -0
- package/index.ts +4 -3
- package/models/claude.ts +27 -0
- package/models/maas.ts +21 -2
- package/package.json +1 -1
package/CHANGELOG.md
CHANGED
|
@@ -2,6 +2,15 @@
|
|
|
2
2
|
|
|
3
3
|
All notable changes to this project will be documented in this file.
|
|
4
4
|
|
|
5
|
+
## [1.1.12] - 2026-06-03
|
|
6
|
+
### Added
|
|
7
|
+
- **Claude Opus 4.8** (`claude-opus-4-8`) — added the new Vertex/Gemini Enterprise Agent Platform Anthropic partner model with 1M context, 128K max output tokens, and the same published global/regional pricing tier used by Opus 4.7.
|
|
8
|
+
- **Grok 4.3** (`grok-4.3`) — added the new Vertex/Gemini Enterprise Agent Platform xAI partner model with 1M context, 32,768 max output tokens (conservative default), and the published Google pricing tier for Grok 4.3.
|
|
9
|
+
|
|
10
|
+
## [1.1.10] - 2026-05-28
|
|
11
|
+
### Fixed
|
|
12
|
+
- Switched `registerProvider("vertex")` `apiKey` from legacy env-var shorthand (`"GOOGLE_CLOUD_PROJECT"`) to explicit env syntax (`"$GOOGLE_CLOUD_PROJECT"`). This removes deprecation warnings and future-proofs provider registration against upcoming removal of implicit env-var detection.
|
|
13
|
+
|
|
5
14
|
## [1.1.9] - 2026-05-19
|
|
6
15
|
### Fixed
|
|
7
16
|
- **Gemini 3/3.5 default thinking preserved** — previously, if no reasoning effort level was specified, we silently overrode Gemini 3/3.5 models to use their lowest thinking level (`MINIMAL`). This severely degraded the intelligence of Gemini 3.5 Flash (defaulting it to no real reasoning/thinking) and Gemini 3 Pro/Flash. We now completely omit `thinkingConfig` when `options.reasoning` is undefined, allowing Gemini 3/3.5 models to use their native GA defaults (`MEDIUM` for 3.5 Flash, `HIGH` for others).
|
package/README.md
CHANGED
|
@@ -15,11 +15,11 @@ Set your GCP project and credentials. Vertex AI models (Gemini, Claude, Llama, D
|
|
|
15
15
|
|
|
16
16
|
## Features
|
|
17
17
|
|
|
18
|
-
- **
|
|
18
|
+
- **45 models** across 4 categories:
|
|
19
19
|
- **Gemini** (9): 3.1 Pro, 3.1 Flash-Lite, 3 Flash, 2.5 Pro, 2.5 Flash, 2.5 Flash-Lite, 2.0 Flash, 2.0 Flash-Lite
|
|
20
|
-
- **Claude** (
|
|
20
|
+
- **Claude** (11): Opus 4.8, Opus 4.7, Opus 4.6, Sonnet 4.6, Opus/Sonnet/Haiku 4.5, Opus 4.1, Opus 4, Sonnet 4, 3.5 Sonnet v2
|
|
21
21
|
- **Llama** (3): 4 Maverick, 4 Scout, 3.3 70B
|
|
22
|
-
- **Other MaaS** (
|
|
22
|
+
- **Other MaaS** (22): Grok 4.3, Grok 4.20, Grok 4.1 Fast, Gemma, Mistral, DeepSeek, Qwen, OpenAI GPT-OSS, Kimi, MiniMax, GLM
|
|
23
23
|
|
|
24
24
|
- **Unified streaming**: Single provider, multiple model families
|
|
25
25
|
- **Full tool calling support**: All models with multi-turn tool use and proper tool result handling
|
|
@@ -86,7 +86,8 @@ pi --provider vertex --model gemini-2.5-pro --version
|
|
|
86
86
|
|
|
87
87
|
```bash
|
|
88
88
|
# Use any supported model
|
|
89
|
-
pi --provider vertex --model claude-opus-4-
|
|
89
|
+
pi --provider vertex --model claude-opus-4-8
|
|
90
|
+
pi --provider vertex --model grok-4.3
|
|
90
91
|
pi --provider vertex --model gemini-2.5-pro
|
|
91
92
|
pi --provider vertex --model llama-4-maverick
|
|
92
93
|
pi --provider vertex --model deepseek-v3.2
|
|
@@ -100,8 +101,11 @@ pi --provider vertex --model claude-sonnet-4-6 --reasoning high
|
|
|
100
101
|
Add to `~/.bashrc` or `~/.zshrc`:
|
|
101
102
|
|
|
102
103
|
```bash
|
|
103
|
-
# Claude 4.
|
|
104
|
-
alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-
|
|
104
|
+
# Claude Opus 4.8
|
|
105
|
+
alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-8"
|
|
106
|
+
|
|
107
|
+
# Grok 4.3
|
|
108
|
+
alias pig4="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model grok-4.3"
|
|
105
109
|
|
|
106
110
|
# Gemini 2.5 Pro
|
|
107
111
|
alias pig="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model gemini-2.5-pro"
|
|
@@ -132,6 +136,7 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
|
|
|
132
136
|
|
|
133
137
|
| Model | Context | Max Tokens | Input | Reasoning | Price global (in/out) | Price regional (in/out) |
|
|
134
138
|
|-------|---------|------------|-------|-----------|----------------------|------------------------|
|
|
139
|
+
| claude-opus-4-8 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
135
140
|
| claude-opus-4-7 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
136
141
|
| claude-opus-4-6 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
|
|
137
142
|
| claude-sonnet-4-6 | 1M | 128,000 | text, image | ✅ | $3.00/$15.00 | $3.30/$16.50 |
|
|
@@ -173,8 +178,9 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
|
|
|
173
178
|
| minimax-m2 | 196K | minimaxai | $0.30/$1.20 | global |
|
|
174
179
|
| glm-5 | 200K | zai-org | $1.00/$3.20 | global |
|
|
175
180
|
| glm-4.7 | 200K | zai-org | $0.60/$2.20 | global |
|
|
176
|
-
| grok-4.
|
|
177
|
-
| grok-4.
|
|
181
|
+
| grok-4.3 | 1M | xai | $1.25/$2.50 | global |
|
|
182
|
+
| grok-4.20-reasoning | 1M | xai | $1.25/$2.50 | global |
|
|
183
|
+
| grok-4.1-fast-reasoning | 2M | xai | $0.20/$0.50 | global |
|
|
178
184
|
| gemma-4-26b-a4b-it | 262K | google | $0.15/$0.60 | global |
|
|
179
185
|
|
|
180
186
|
## Regional Endpoints
|
package/TEST_COVERAGE.md
CHANGED
|
@@ -7,6 +7,7 @@
|
|
|
7
7
|
## Manual Verification
|
|
8
8
|
- Claude 4.6 streaming verified via Anthropic Vertex SDK.
|
|
9
9
|
- Mid-session model switching (tool call replay) verified interactively in pi.
|
|
10
|
+
- Registry sanity checks verified locally for `claude-opus-4-8` and `grok-4.3` after model additions.
|
|
10
11
|
|
|
11
12
|
## Gaps / Next Steps
|
|
12
13
|
- Add automated integration tests for Anthropic Vertex streaming and tool replay.
|
package/index.ts
CHANGED
|
@@ -21,7 +21,8 @@
|
|
|
21
21
|
* GOOGLE_APPLICATION_CREDENTIALS (optional, for service account auth)
|
|
22
22
|
*
|
|
23
23
|
* Usage:
|
|
24
|
-
* pi --provider vertex --model claude-opus-4-
|
|
24
|
+
* pi --provider vertex --model claude-opus-4-8
|
|
25
|
+
* pi --provider vertex --model grok-4.3
|
|
25
26
|
* pi --provider vertex --model gemini-2.5-pro
|
|
26
27
|
* pi --provider vertex --model llama-4-maverick
|
|
27
28
|
*/
|
|
@@ -90,8 +91,8 @@ export default function (pi: ExtensionAPI) {
|
|
|
90
91
|
// Use a placeholder baseUrl (actual URLs built per-request based on model region)
|
|
91
92
|
baseUrl: "https://aiplatform.googleapis.com",
|
|
92
93
|
|
|
93
|
-
// Use env var
|
|
94
|
-
apiKey: "GOOGLE_CLOUD_PROJECT",
|
|
94
|
+
// Use explicit env var reference
|
|
95
|
+
apiKey: "$GOOGLE_CLOUD_PROJECT",
|
|
95
96
|
|
|
96
97
|
// API type varies by model
|
|
97
98
|
api: "vertex-unified",
|
package/models/claude.ts
CHANGED
|
@@ -11,6 +11,33 @@
|
|
|
11
11
|
import type { VertexModelConfig } from "../types.js";
|
|
12
12
|
|
|
13
13
|
export const CLAUDE_MODELS: VertexModelConfig[] = [
|
|
14
|
+
// Claude 4.8 series
|
|
15
|
+
{
|
|
16
|
+
id: "claude-opus-4-8",
|
|
17
|
+
name: "Claude Opus 4.8",
|
|
18
|
+
apiId: "claude-opus-4-8",
|
|
19
|
+
publisher: "anthropic",
|
|
20
|
+
endpointType: "maas",
|
|
21
|
+
contextWindow: 1000000,
|
|
22
|
+
maxTokens: 128000,
|
|
23
|
+
input: ["text", "image"],
|
|
24
|
+
reasoning: true,
|
|
25
|
+
tools: true,
|
|
26
|
+
cost: {
|
|
27
|
+
input: 5.00,
|
|
28
|
+
output: 25.00,
|
|
29
|
+
cacheRead: 0.50,
|
|
30
|
+
cacheWrite: 6.25,
|
|
31
|
+
},
|
|
32
|
+
costRegional: {
|
|
33
|
+
input: 5.50,
|
|
34
|
+
output: 27.50,
|
|
35
|
+
cacheRead: 0.55,
|
|
36
|
+
cacheWrite: 6.875,
|
|
37
|
+
},
|
|
38
|
+
region: "global",
|
|
39
|
+
},
|
|
40
|
+
|
|
14
41
|
// Claude 4.7 series
|
|
15
42
|
{
|
|
16
43
|
id: "claude-opus-4-7",
|
package/models/maas.ts
CHANGED
|
@@ -9,13 +9,32 @@ import type { VertexModelConfig } from "../types.js";
|
|
|
9
9
|
|
|
10
10
|
export const MAAS_MODELS: VertexModelConfig[] = [
|
|
11
11
|
// --- xAI Grok ---
|
|
12
|
+
{
|
|
13
|
+
id: "grok-4.3",
|
|
14
|
+
name: "Grok 4.3",
|
|
15
|
+
apiId: "grok-4.3",
|
|
16
|
+
publisher: "xai",
|
|
17
|
+
endpointType: "maas",
|
|
18
|
+
contextWindow: 1000000,
|
|
19
|
+
maxTokens: 32768,
|
|
20
|
+
input: ["text", "image"],
|
|
21
|
+
reasoning: true,
|
|
22
|
+
tools: true,
|
|
23
|
+
cost: {
|
|
24
|
+
input: 1.25,
|
|
25
|
+
output: 2.50,
|
|
26
|
+
cacheRead: 0.20,
|
|
27
|
+
cacheWrite: 0,
|
|
28
|
+
},
|
|
29
|
+
region: "global",
|
|
30
|
+
},
|
|
12
31
|
{
|
|
13
32
|
id: "grok-4.20-reasoning",
|
|
14
33
|
name: "Grok 4.20 Reasoning",
|
|
15
34
|
apiId: "grok-4.20-reasoning",
|
|
16
35
|
publisher: "xai",
|
|
17
36
|
endpointType: "maas",
|
|
18
|
-
contextWindow:
|
|
37
|
+
contextWindow: 1000000,
|
|
19
38
|
maxTokens: 32000,
|
|
20
39
|
input: ["text", "image"],
|
|
21
40
|
reasoning: true,
|
|
@@ -34,7 +53,7 @@ export const MAAS_MODELS: VertexModelConfig[] = [
|
|
|
34
53
|
apiId: "grok-4.1-fast-reasoning",
|
|
35
54
|
publisher: "xai",
|
|
36
55
|
endpointType: "maas",
|
|
37
|
-
contextWindow:
|
|
56
|
+
contextWindow: 2000000,
|
|
38
57
|
maxTokens: 32000,
|
|
39
58
|
input: ["text", "image"],
|
|
40
59
|
reasoning: true,
|