@ssweens/pi-vertex 1.1.9 → 1.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/CHANGELOG.md CHANGED
@@ -2,6 +2,15 @@
2
2
 
3
3
  All notable changes to this project will be documented in this file.
4
4
 
5
+ ## [1.1.12] - 2026-06-03
6
+ ### Added
7
+ - **Claude Opus 4.8** (`claude-opus-4-8`) — added the new Vertex/Gemini Enterprise Agent Platform Anthropic partner model with 1M context, 128K max output tokens, and the same published global/regional pricing tier used by Opus 4.7.
8
+ - **Grok 4.3** (`grok-4.3`) — added the new Vertex/Gemini Enterprise Agent Platform xAI partner model with 1M context, 32,768 max output tokens (conservative default), and the published Google pricing tier for Grok 4.3.
9
+
10
+ ## [1.1.10] - 2026-05-28
11
+ ### Fixed
12
+ - Switched `registerProvider("vertex")` `apiKey` from legacy env-var shorthand (`"GOOGLE_CLOUD_PROJECT"`) to explicit env syntax (`"$GOOGLE_CLOUD_PROJECT"`). This removes deprecation warnings and future-proofs provider registration against upcoming removal of implicit env-var detection.
13
+
5
14
  ## [1.1.9] - 2026-05-19
6
15
  ### Fixed
7
16
  - **Gemini 3/3.5 default thinking preserved** — previously, if no reasoning effort level was specified, we silently overrode Gemini 3/3.5 models to use their lowest thinking level (`MINIMAL`). This severely degraded the intelligence of Gemini 3.5 Flash (defaulting it to no real reasoning/thinking) and Gemini 3 Pro/Flash. We now completely omit `thinkingConfig` when `options.reasoning` is undefined, allowing Gemini 3/3.5 models to use their native GA defaults (`MEDIUM` for 3.5 Flash, `HIGH` for others).
package/README.md CHANGED
@@ -15,11 +15,11 @@ Set your GCP project and credentials. Vertex AI models (Gemini, Claude, Llama, D
15
15
 
16
16
  ## Features
17
17
 
18
- - **48 models** across 4 categories:
18
+ - **45 models** across 4 categories:
19
19
  - **Gemini** (9): 3.1 Pro, 3.1 Flash-Lite, 3 Flash, 2.5 Pro, 2.5 Flash, 2.5 Flash-Lite, 2.0 Flash, 2.0 Flash-Lite
20
- - **Claude** (10): Opus 4.7, Opus 4.6, Sonnet 4.6, Opus/Sonnet/Haiku 4.5, Opus 4.1, Opus 4, Sonnet 4, 3.5 Sonnet v2
20
+ - **Claude** (11): Opus 4.8, Opus 4.7, Opus 4.6, Sonnet 4.6, Opus/Sonnet/Haiku 4.5, Opus 4.1, Opus 4, Sonnet 4, 3.5 Sonnet v2
21
21
  - **Llama** (3): 4 Maverick, 4 Scout, 3.3 70B
22
- - **Other MaaS** (26): Grok, Gemma, Mistral, DeepSeek, Qwen, OpenAI GPT-OSS, Kimi, MiniMax, GLM
22
+ - **Other MaaS** (22): Grok 4.3, Grok 4.20, Grok 4.1 Fast, Gemma, Mistral, DeepSeek, Qwen, OpenAI GPT-OSS, Kimi, MiniMax, GLM
23
23
 
24
24
  - **Unified streaming**: Single provider, multiple model families
25
25
  - **Full tool calling support**: All models with multi-turn tool use and proper tool result handling
@@ -86,7 +86,8 @@ pi --provider vertex --model gemini-2.5-pro --version
86
86
 
87
87
  ```bash
88
88
  # Use any supported model
89
- pi --provider vertex --model claude-opus-4-6
89
+ pi --provider vertex --model claude-opus-4-8
90
+ pi --provider vertex --model grok-4.3
90
91
  pi --provider vertex --model gemini-2.5-pro
91
92
  pi --provider vertex --model llama-4-maverick
92
93
  pi --provider vertex --model deepseek-v3.2
@@ -100,8 +101,11 @@ pi --provider vertex --model claude-sonnet-4-6 --reasoning high
100
101
  Add to `~/.bashrc` or `~/.zshrc`:
101
102
 
102
103
  ```bash
103
- # Claude 4.6 Opus
104
- alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-6"
104
+ # Claude Opus 4.8
105
+ alias pic="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model claude-opus-4-8"
106
+
107
+ # Grok 4.3
108
+ alias pig4="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model grok-4.3"
105
109
 
106
110
  # Gemini 2.5 Pro
107
111
  alias pig="GOOGLE_CLOUD_PROJECT=your-project pi --provider vertex --model gemini-2.5-pro"
@@ -132,6 +136,7 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
132
136
 
133
137
  | Model | Context | Max Tokens | Input | Reasoning | Price global (in/out) | Price regional (in/out) |
134
138
  |-------|---------|------------|-------|-----------|----------------------|------------------------|
139
+ | claude-opus-4-8 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
135
140
  | claude-opus-4-7 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
136
141
  | claude-opus-4-6 | 1M | 128,000 | text, image | ✅ | $5.00/$25.00 | $5.50/$27.50 |
137
142
  | claude-sonnet-4-6 | 1M | 128,000 | text, image | ✅ | $3.00/$15.00 | $3.30/$16.50 |
@@ -173,8 +178,9 @@ Prices shown are for the **global** endpoint. Non-global regions (us-east5, euro
173
178
  | minimax-m2 | 196K | minimaxai | $0.30/$1.20 | global |
174
179
  | glm-5 | 200K | zai-org | $1.00/$3.20 | global |
175
180
  | glm-4.7 | 200K | zai-org | $0.60/$2.20 | global |
176
- | grok-4.20-reasoning | 200K | xai | $1.25/$2.50 | global |
177
- | grok-4.1-fast-reasoning | 128K | xai | $0.20/$0.50 | global |
181
+ | grok-4.3 | 1M | xai | $1.25/$2.50 | global |
182
+ | grok-4.20-reasoning | 1M | xai | $1.25/$2.50 | global |
183
+ | grok-4.1-fast-reasoning | 2M | xai | $0.20/$0.50 | global |
178
184
  | gemma-4-26b-a4b-it | 262K | google | $0.15/$0.60 | global |
179
185
 
180
186
  ## Regional Endpoints
package/TEST_COVERAGE.md CHANGED
@@ -7,6 +7,7 @@
7
7
  ## Manual Verification
8
8
  - Claude 4.6 streaming verified via Anthropic Vertex SDK.
9
9
  - Mid-session model switching (tool call replay) verified interactively in pi.
10
+ - Registry sanity checks verified locally for `claude-opus-4-8` and `grok-4.3` after model additions.
10
11
 
11
12
  ## Gaps / Next Steps
12
13
  - Add automated integration tests for Anthropic Vertex streaming and tool replay.
package/index.ts CHANGED
@@ -21,7 +21,8 @@
21
21
  * GOOGLE_APPLICATION_CREDENTIALS (optional, for service account auth)
22
22
  *
23
23
  * Usage:
24
- * pi --provider vertex --model claude-opus-4-6
24
+ * pi --provider vertex --model claude-opus-4-8
25
+ * pi --provider vertex --model grok-4.3
25
26
  * pi --provider vertex --model gemini-2.5-pro
26
27
  * pi --provider vertex --model llama-4-maverick
27
28
  */
@@ -90,8 +91,8 @@ export default function (pi: ExtensionAPI) {
90
91
  // Use a placeholder baseUrl (actual URLs built per-request based on model region)
91
92
  baseUrl: "https://aiplatform.googleapis.com",
92
93
 
93
- // Use env var name for detection
94
- apiKey: "GOOGLE_CLOUD_PROJECT",
94
+ // Use explicit env var reference
95
+ apiKey: "$GOOGLE_CLOUD_PROJECT",
95
96
 
96
97
  // API type varies by model
97
98
  api: "vertex-unified",
package/models/claude.ts CHANGED
@@ -11,6 +11,33 @@
11
11
  import type { VertexModelConfig } from "../types.js";
12
12
 
13
13
  export const CLAUDE_MODELS: VertexModelConfig[] = [
14
+ // Claude 4.8 series
15
+ {
16
+ id: "claude-opus-4-8",
17
+ name: "Claude Opus 4.8",
18
+ apiId: "claude-opus-4-8",
19
+ publisher: "anthropic",
20
+ endpointType: "maas",
21
+ contextWindow: 1000000,
22
+ maxTokens: 128000,
23
+ input: ["text", "image"],
24
+ reasoning: true,
25
+ tools: true,
26
+ cost: {
27
+ input: 5.00,
28
+ output: 25.00,
29
+ cacheRead: 0.50,
30
+ cacheWrite: 6.25,
31
+ },
32
+ costRegional: {
33
+ input: 5.50,
34
+ output: 27.50,
35
+ cacheRead: 0.55,
36
+ cacheWrite: 6.875,
37
+ },
38
+ region: "global",
39
+ },
40
+
14
41
  // Claude 4.7 series
15
42
  {
16
43
  id: "claude-opus-4-7",
package/models/maas.ts CHANGED
@@ -9,13 +9,32 @@ import type { VertexModelConfig } from "../types.js";
9
9
 
10
10
  export const MAAS_MODELS: VertexModelConfig[] = [
11
11
  // --- xAI Grok ---
12
+ {
13
+ id: "grok-4.3",
14
+ name: "Grok 4.3",
15
+ apiId: "grok-4.3",
16
+ publisher: "xai",
17
+ endpointType: "maas",
18
+ contextWindow: 1000000,
19
+ maxTokens: 32768,
20
+ input: ["text", "image"],
21
+ reasoning: true,
22
+ tools: true,
23
+ cost: {
24
+ input: 1.25,
25
+ output: 2.50,
26
+ cacheRead: 0.20,
27
+ cacheWrite: 0,
28
+ },
29
+ region: "global",
30
+ },
12
31
  {
13
32
  id: "grok-4.20-reasoning",
14
33
  name: "Grok 4.20 Reasoning",
15
34
  apiId: "grok-4.20-reasoning",
16
35
  publisher: "xai",
17
36
  endpointType: "maas",
18
- contextWindow: 200000,
37
+ contextWindow: 1000000,
19
38
  maxTokens: 32000,
20
39
  input: ["text", "image"],
21
40
  reasoning: true,
@@ -34,7 +53,7 @@ export const MAAS_MODELS: VertexModelConfig[] = [
34
53
  apiId: "grok-4.1-fast-reasoning",
35
54
  publisher: "xai",
36
55
  endpointType: "maas",
37
- contextWindow: 128000,
56
+ contextWindow: 2000000,
38
57
  maxTokens: 32000,
39
58
  input: ["text", "image"],
40
59
  reasoning: true,
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@ssweens/pi-vertex",
3
- "version": "1.1.9",
3
+ "version": "1.1.12",
4
4
  "description": "Google Vertex AI provider for Pi coding agent - supports Gemini, Claude, and all MaaS models",
5
5
  "type": "module",
6
6
  "main": "index.ts",