@ai-sdk/google-vertex 4.0.28 → 4.0.29

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/CHANGELOG.md CHANGED
@@ -1,5 +1,14 @@
  # @ai-sdk/google-vertex
 
+ ## 4.0.29
+
+ ### Patch Changes
+
+ - Updated dependencies [462ad00]
+   - @ai-sdk/provider-utils@4.0.10
+   - @ai-sdk/anthropic@3.0.24
+   - @ai-sdk/google@3.0.14
+
  ## 4.0.28
 
  ### Patch Changes
@@ -32,7 +32,7 @@ var import_provider_utils3 = require("@ai-sdk/provider-utils");
  var import_provider_utils = require("@ai-sdk/provider-utils");
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/edge/google-vertex-auth-edge.ts
  var loadCredentials = async () => {
@@ -10,7 +10,7 @@ import {
  } from "@ai-sdk/provider-utils";
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/edge/google-vertex-auth-edge.ts
  var loadCredentials = async () => {
@@ -33,7 +33,7 @@ var import_internal2 = require("@ai-sdk/google/internal");
  var import_provider_utils4 = require("@ai-sdk/provider-utils");
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/google-vertex-embedding-model.ts
  var import_provider = require("@ai-sdk/provider");
@@ -14,7 +14,7 @@ import {
  } from "@ai-sdk/provider-utils";
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/google-vertex-embedding-model.ts
  import {
package/dist/index.js CHANGED
@@ -55,7 +55,7 @@ var import_internal2 = require("@ai-sdk/google/internal");
  var import_provider_utils4 = require("@ai-sdk/provider-utils");
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/google-vertex-embedding-model.ts
  var import_provider = require("@ai-sdk/provider");
package/dist/index.mjs CHANGED
@@ -35,7 +35,7 @@ import {
  } from "@ai-sdk/provider-utils";
 
  // src/version.ts
- var VERSION = true ? "4.0.28" : "0.0.0-test";
+ var VERSION = true ? "4.0.29" : "0.0.0-test";
 
  // src/google-vertex-embedding-model.ts
  import {
package/README.md CHANGED
@@ -287,6 +287,11 @@ await generateText({
 
  The following optional provider options are available for Google Vertex models:
 
+ - **cachedContent** _string_
+
+   Optional. The name of the cached content used as context to serve the prediction.
+   Format: projects/\{project\}/locations/\{location\}/cachedContents/\{cachedContent\}
+
  - **structuredOutputs** _boolean_
 
    Optional. Enable structured output. Default is true.
@@ -546,6 +551,109 @@ const { text } = await generateText({
 
  See [File Parts](/docs/foundations/prompts#file-parts) for details on how to use files in prompts.
 
+ ### Cached Content
+
+ Google Vertex AI supports both explicit and implicit caching to help reduce costs on repetitive content.
+
+ #### Implicit Caching
+
+ ```ts
+ import { vertex } from '@ai-sdk/google-vertex';
+ import { generateText } from 'ai';
+
+ // Structure prompts with consistent content at the beginning
+ const baseContext =
+   'You are a cooking assistant with expertise in Italian cuisine. Here are 1000 lasagna recipes for reference...';
+
+ const { text: veggieLasagna } = await generateText({
+   model: vertex('gemini-2.5-pro'),
+   prompt: `${baseContext}\n\nWrite a vegetarian lasagna recipe for 4 people.`,
+ });
+
+ // Second request with same prefix - eligible for cache hit
+ const { text: meatLasagna, providerMetadata } = await generateText({
+   model: vertex('gemini-2.5-pro'),
+   prompt: `${baseContext}\n\nWrite a meat lasagna recipe for 12 people.`,
+ });
+
+ // Check cached token count in usage metadata
+ console.log('Cached tokens:', providerMetadata.google);
+ // e.g.
+ // {
+ //   groundingMetadata: null,
+ //   safetyRatings: null,
+ //   usageMetadata: {
+ //     cachedContentTokenCount: 2027,
+ //     thoughtsTokenCount: 702,
+ //     promptTokenCount: 2152,
+ //     candidatesTokenCount: 710,
+ //     totalTokenCount: 3564
+ //   }
+ // }
+ ```
+
+ #### Explicit Caching
+
+ You can use explicit caching with Gemini models. See the [Vertex AI context caching documentation](https://cloud.google.com/vertex-ai/generative-ai/docs/context-cache/context-cache-overview) to check if caching is supported for your model.
+
+ First, create a cache using the Google GenAI SDK with Vertex mode enabled:
+
+ ```ts
+ import { GoogleGenAI } from '@google/genai';
+
+ const ai = new GoogleGenAI({
+   vertexai: true,
+   project: process.env.GOOGLE_VERTEX_PROJECT,
+   location: process.env.GOOGLE_VERTEX_LOCATION,
+ });
+
+ const model = 'gemini-2.5-pro';
+
+ // Create a cache with the content you want to reuse
+ const cache = await ai.caches.create({
+   model,
+   config: {
+     contents: [
+       {
+         role: 'user',
+         parts: [{ text: '1000 Lasagna Recipes...' }],
+       },
+     ],
+     ttl: '300s', // Cache expires after 5 minutes
+   },
+ });
+
+ console.log('Cache created:', cache.name);
+ // e.g. projects/my-project/locations/us-central1/cachedContents/abc123
+ ```
+
+ Then use the cache with the AI SDK:
+
+ ```ts
+ import { vertex } from '@ai-sdk/google-vertex';
+ import { generateText } from 'ai';
+
+ const { text: veggieLasagnaRecipe } = await generateText({
+   model: vertex('gemini-2.5-pro'),
+   prompt: 'Write a vegetarian lasagna recipe for 4 people.',
+   providerOptions: {
+     google: {
+       cachedContent: cache.name,
+     },
+   },
+ });
+
+ const { text: meatLasagnaRecipe } = await generateText({
+   model: vertex('gemini-2.5-pro'),
+   prompt: 'Write a meat lasagna recipe for 12 people.',
+   providerOptions: {
+     google: {
+       cachedContent: cache.name,
+     },
+   },
+ });
+ ```
+
  ### Safety Ratings
 
  The safety ratings provide insight into the safety of the model's response.
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
    "name": "@ai-sdk/google-vertex",
-   "version": "4.0.28",
+   "version": "4.0.29",
    "license": "Apache-2.0",
    "sideEffects": false,
    "main": "./dist/index.js",
@@ -48,10 +48,10 @@
    },
    "dependencies": {
      "google-auth-library": "^10.5.0",
-     "@ai-sdk/anthropic": "3.0.23",
-     "@ai-sdk/google": "3.0.13",
+     "@ai-sdk/anthropic": "3.0.24",
      "@ai-sdk/provider": "3.0.5",
-     "@ai-sdk/provider-utils": "4.0.9"
+     "@ai-sdk/provider-utils": "4.0.10",
+     "@ai-sdk/google": "3.0.14"
    },
    "devDependencies": {
      "@types/node": "20.17.24",