npm - @llumiverse/drivers - Versions diffs - 0.20.0 → 0.22.0-dev.1 - Mend

@llumiverse/drivers 0.20.0 → 0.22.0-dev.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (293)

package/lib/cjs/adobe/firefly.js +6 -5
package/lib/cjs/adobe/firefly.js.map +1 -1
package/lib/cjs/azure/azure_foundry.js +388 -0
package/lib/cjs/azure/azure_foundry.js.map +1 -0
package/lib/cjs/bedrock/index.js +62 -39
package/lib/cjs/bedrock/index.js.map +1 -1
package/lib/cjs/groq/index.js +178 -22
package/lib/cjs/groq/index.js.map +1 -1
package/lib/cjs/huggingface_ie.js +5 -4
package/lib/cjs/huggingface_ie.js.map +1 -1
package/lib/cjs/index.js +3 -2
package/lib/cjs/index.js.map +1 -1
package/lib/cjs/mistral/index.js +5 -3
package/lib/cjs/mistral/index.js.map +1 -1
package/lib/cjs/openai/azure_openai.js +72 -0
package/lib/cjs/openai/azure_openai.js.map +1 -0
package/lib/cjs/openai/index.js +13 -16
package/lib/cjs/openai/index.js.map +1 -1
package/lib/cjs/openai/openai.js +2 -2
package/lib/cjs/openai/openai.js.map +1 -1
package/lib/cjs/openai/openai_format.js +138 -0
package/lib/cjs/openai/openai_format.js.map +1 -0
package/lib/cjs/replicate.js +3 -3
package/lib/cjs/replicate.js.map +1 -1
package/lib/cjs/test/utils.js +1 -1
package/lib/cjs/test/utils.js.map +1 -1
package/lib/cjs/test-driver/TestErrorCompletionStream.js +20 -0
package/lib/cjs/test-driver/TestErrorCompletionStream.js.map +1 -0
package/lib/cjs/test-driver/TestValidationErrorCompletionStream.js +24 -0
package/lib/cjs/test-driver/TestValidationErrorCompletionStream.js.map +1 -0
package/lib/cjs/test-driver/index.js +109 -0
package/lib/cjs/test-driver/index.js.map +1 -0
package/lib/cjs/test-driver/utils.js +30 -0
package/lib/cjs/test-driver/utils.js.map +1 -0
package/lib/cjs/togetherai/index.js +2 -2
package/lib/cjs/togetherai/index.js.map +1 -1
package/lib/cjs/vertexai/embeddings/embeddings-text.js +1 -1
package/lib/cjs/vertexai/embeddings/embeddings-text.js.map +1 -1
package/lib/cjs/vertexai/index.js +90 -28
package/lib/cjs/vertexai/index.js.map +1 -1
package/lib/cjs/vertexai/models/claude.js +14 -12
package/lib/cjs/vertexai/models/claude.js.map +1 -1
package/lib/cjs/vertexai/models/gemini.js +158 -52
package/lib/cjs/vertexai/models/gemini.js.map +1 -1
package/lib/cjs/vertexai/models/imagen.js +11 -22
package/lib/cjs/vertexai/models/imagen.js.map +1 -1
package/lib/cjs/vertexai/models/llama.js +4 -3
package/lib/cjs/vertexai/models/llama.js.map +1 -1
package/lib/cjs/watsonx/index.js +3 -3
package/lib/cjs/watsonx/index.js.map +1 -1
package/lib/cjs/xai/index.js +4 -4
package/lib/cjs/xai/index.js.map +1 -1
package/lib/esm/adobe/firefly.js +6 -5
package/lib/esm/adobe/firefly.js.map +1 -1
package/lib/esm/azure/azure_foundry.js +382 -0
package/lib/esm/azure/azure_foundry.js.map +1 -0
package/lib/esm/bedrock/index.js +62 -39
package/lib/esm/bedrock/index.js.map +1 -1
package/lib/esm/groq/index.js +178 -22
package/lib/esm/groq/index.js.map +1 -1
package/lib/esm/huggingface_ie.js +6 -5
package/lib/esm/huggingface_ie.js.map +1 -1
package/lib/esm/index.js +3 -2
package/lib/esm/index.js.map +1 -1
package/lib/esm/mistral/index.js +5 -3
package/lib/esm/mistral/index.js.map +1 -1
package/lib/esm/openai/azure_openai.js +68 -0
package/lib/esm/openai/azure_openai.js.map +1 -0
package/lib/esm/openai/index.js +12 -15
package/lib/esm/openai/index.js.map +1 -1
package/lib/esm/openai/openai.js +2 -2
package/lib/esm/openai/openai.js.map +1 -1
package/lib/esm/openai/openai_format.js +134 -0
package/lib/esm/openai/openai_format.js.map +1 -0
package/lib/esm/replicate.js +3 -3
package/lib/esm/replicate.js.map +1 -1
package/lib/esm/src/adobe/firefly.js +116 -0
package/lib/esm/src/adobe/firefly.js.map +1 -0
package/lib/esm/src/azure/azure_foundry.js +382 -0
package/lib/esm/src/azure/azure_foundry.js.map +1 -0
package/lib/esm/src/bedrock/converse.js +278 -0
package/lib/esm/src/bedrock/converse.js.map +1 -0
package/lib/esm/src/bedrock/index.js +819 -0
package/lib/esm/src/bedrock/index.js.map +1 -0
package/lib/esm/src/bedrock/nova-image-payload.js +203 -0
package/lib/esm/src/bedrock/nova-image-payload.js.map +1 -0
package/lib/esm/src/bedrock/payloads.js +2 -0
package/lib/esm/src/bedrock/payloads.js.map +1 -0
package/lib/esm/src/bedrock/s3.js +99 -0
package/lib/esm/src/bedrock/s3.js.map +1 -0
package/lib/esm/src/groq/index.js +286 -0
package/lib/esm/src/groq/index.js.map +1 -0
package/lib/esm/src/huggingface_ie.js +196 -0
package/lib/esm/src/huggingface_ie.js.map +1 -0
package/lib/esm/src/index.js +14 -0
package/lib/esm/src/index.js.map +1 -0
package/lib/esm/src/mistral/index.js +169 -0
package/lib/esm/src/mistral/index.js.map +1 -0
package/lib/esm/src/mistral/types.js +80 -0
package/lib/esm/src/mistral/types.js.map +1 -0
package/lib/esm/src/openai/azure_openai.js +68 -0
package/lib/esm/src/openai/azure_openai.js.map +1 -0
package/lib/esm/src/openai/index.js +460 -0
package/lib/esm/src/openai/index.js.map +1 -0
package/lib/esm/src/openai/openai.js +14 -0
package/lib/esm/src/openai/openai.js.map +1 -0
package/lib/esm/src/openai/openai_format.js +134 -0
package/lib/esm/src/openai/openai_format.js.map +1 -0
package/lib/esm/src/replicate.js +268 -0
package/lib/esm/src/replicate.js.map +1 -0
package/lib/esm/src/test/TestErrorCompletionStream.js +16 -0
package/lib/esm/src/test/TestErrorCompletionStream.js.map +1 -0
package/lib/esm/src/test/TestValidationErrorCompletionStream.js +20 -0
package/lib/esm/src/test/TestValidationErrorCompletionStream.js.map +1 -0
package/lib/esm/src/test/index.js +91 -0
package/lib/esm/src/test/index.js.map +1 -0
package/lib/esm/src/test/utils.js +25 -0
package/lib/esm/src/test/utils.js.map +1 -0
package/lib/esm/src/togetherai/index.js +122 -0
package/lib/esm/src/togetherai/index.js.map +1 -0
package/lib/esm/src/togetherai/interfaces.js +2 -0
package/lib/esm/src/togetherai/interfaces.js.map +1 -0
package/lib/esm/src/vertexai/debug.js +6 -0
package/lib/esm/src/vertexai/debug.js.map +1 -0
package/lib/esm/src/vertexai/embeddings/embeddings-image.js +24 -0
package/lib/esm/src/vertexai/embeddings/embeddings-image.js.map +1 -0
package/lib/esm/src/vertexai/embeddings/embeddings-text.js +20 -0
package/lib/esm/src/vertexai/embeddings/embeddings-text.js.map +1 -0
package/lib/esm/src/vertexai/index.js +332 -0
package/lib/esm/src/vertexai/index.js.map +1 -0
package/lib/esm/src/vertexai/models/claude.js +372 -0
package/lib/esm/src/vertexai/models/claude.js.map +1 -0
package/lib/esm/src/vertexai/models/gemini.js +806 -0
package/lib/esm/src/vertexai/models/gemini.js.map +1 -0
package/lib/esm/src/vertexai/models/imagen.js +302 -0
package/lib/esm/src/vertexai/models/imagen.js.map +1 -0
package/lib/esm/src/vertexai/models/llama.js +179 -0
package/lib/esm/src/vertexai/models/llama.js.map +1 -0
package/lib/esm/src/vertexai/models.js +21 -0
package/lib/esm/src/vertexai/models.js.map +1 -0
package/lib/esm/src/watsonx/index.js +157 -0
package/lib/esm/src/watsonx/index.js.map +1 -0
package/lib/esm/src/watsonx/interfaces.js +2 -0
package/lib/esm/src/watsonx/interfaces.js.map +1 -0
package/lib/esm/src/xai/index.js +64 -0
package/lib/esm/src/xai/index.js.map +1 -0
package/lib/esm/test/utils.js +1 -1
package/lib/esm/test/utils.js.map +1 -1
package/lib/esm/test-driver/TestErrorCompletionStream.js +16 -0
package/lib/esm/test-driver/TestErrorCompletionStream.js.map +1 -0
package/lib/esm/test-driver/TestValidationErrorCompletionStream.js +20 -0
package/lib/esm/test-driver/TestValidationErrorCompletionStream.js.map +1 -0
package/lib/esm/test-driver/index.js +91 -0
package/lib/esm/test-driver/index.js.map +1 -0
package/lib/esm/test-driver/utils.js +25 -0
package/lib/esm/test-driver/utils.js.map +1 -0
package/lib/esm/togetherai/index.js +2 -2
package/lib/esm/togetherai/index.js.map +1 -1
package/lib/esm/tsconfig.tsbuildinfo +1 -0
package/lib/esm/vertexai/embeddings/embeddings-text.js +1 -1
package/lib/esm/vertexai/embeddings/embeddings-text.js.map +1 -1
package/lib/esm/vertexai/index.js +91 -29
package/lib/esm/vertexai/index.js.map +1 -1
package/lib/esm/vertexai/models/claude.js +14 -12
package/lib/esm/vertexai/models/claude.js.map +1 -1
package/lib/esm/vertexai/models/gemini.js +159 -53
package/lib/esm/vertexai/models/gemini.js.map +1 -1
package/lib/esm/vertexai/models/imagen.js +8 -16
package/lib/esm/vertexai/models/imagen.js.map +1 -1
package/lib/esm/vertexai/models/llama.js +4 -3
package/lib/esm/vertexai/models/llama.js.map +1 -1
package/lib/esm/vertexai/models.js.map +1 -1
package/lib/esm/watsonx/index.js +3 -3
package/lib/esm/watsonx/index.js.map +1 -1
package/lib/esm/xai/index.js +3 -3
package/lib/esm/xai/index.js.map +1 -1
package/lib/types/adobe/firefly.d.ts +3 -3
package/lib/types/adobe/firefly.d.ts.map +1 -1
package/lib/types/azure/azure_foundry.d.ts +50 -0
package/lib/types/azure/azure_foundry.d.ts.map +1 -0
package/lib/types/bedrock/index.d.ts +4 -4
package/lib/types/bedrock/index.d.ts.map +1 -1
package/lib/types/groq/index.d.ts +8 -5
package/lib/types/groq/index.d.ts.map +1 -1
package/lib/types/huggingface_ie.d.ts +8 -5
package/lib/types/huggingface_ie.d.ts.map +1 -1
package/lib/types/index.d.ts +3 -2
package/lib/types/index.d.ts.map +1 -1
package/lib/types/mistral/index.d.ts +4 -4
package/lib/types/mistral/index.d.ts.map +1 -1
package/lib/types/openai/azure_openai.d.ts +25 -0
package/lib/types/openai/azure_openai.d.ts.map +1 -0
package/lib/types/openai/index.d.ts +6 -7
package/lib/types/openai/index.d.ts.map +1 -1
package/lib/types/openai/openai.d.ts +2 -2
package/lib/types/openai/openai.d.ts.map +1 -1
package/lib/types/openai/openai_format.d.ts +19 -0
package/lib/types/openai/openai_format.d.ts.map +1 -0
package/lib/types/replicate.d.ts +6 -3
package/lib/types/replicate.d.ts.map +1 -1
package/lib/types/src/adobe/firefly.d.ts +29 -0
package/lib/types/src/azure/azure_foundry.d.ts +49 -0
package/lib/types/src/bedrock/converse.d.ts +8 -0
package/lib/types/src/bedrock/index.d.ts +57 -0
package/lib/types/src/bedrock/nova-image-payload.d.ts +73 -0
package/lib/types/src/bedrock/payloads.d.ts +11 -0
package/lib/types/src/bedrock/s3.d.ts +22 -0
package/lib/types/src/groq/index.d.ts +26 -0
package/lib/types/src/huggingface_ie.d.ts +34 -0
package/lib/types/src/index.d.ts +13 -0
package/lib/types/src/mistral/index.d.ts +24 -0
package/lib/types/src/mistral/types.d.ts +131 -0
package/lib/types/src/openai/azure_openai.d.ts +24 -0
package/lib/types/src/openai/index.d.ts +24 -0
package/lib/types/src/openai/openai.d.ts +14 -0
package/lib/types/src/openai/openai_format.d.ts +18 -0
package/lib/types/src/replicate.d.ts +47 -0
package/lib/types/src/test/TestErrorCompletionStream.d.ts +8 -0
package/lib/types/src/test/TestValidationErrorCompletionStream.d.ts +8 -0
package/lib/types/src/test/index.d.ts +23 -0
package/lib/types/src/test/utils.d.ts +4 -0
package/lib/types/src/togetherai/index.d.ts +22 -0
package/lib/types/src/togetherai/interfaces.d.ts +95 -0
package/lib/types/src/vertexai/debug.d.ts +1 -0
package/lib/types/src/vertexai/embeddings/embeddings-image.d.ts +10 -0
package/lib/types/src/vertexai/embeddings/embeddings-text.d.ts +9 -0
package/lib/types/src/vertexai/index.d.ts +52 -0
package/lib/types/src/vertexai/models/claude.d.ts +17 -0
package/lib/types/src/vertexai/models/gemini.d.ts +17 -0
package/lib/types/src/vertexai/models/imagen.d.ts +74 -0
package/lib/types/src/vertexai/models/llama.d.ts +19 -0
package/lib/types/src/vertexai/models.d.ts +14 -0
package/lib/types/src/watsonx/index.d.ts +26 -0
package/lib/types/src/watsonx/interfaces.d.ts +64 -0
package/lib/types/src/xai/index.d.ts +18 -0
package/lib/types/test-driver/TestErrorCompletionStream.d.ts +9 -0
package/lib/types/test-driver/TestErrorCompletionStream.d.ts.map +1 -0
package/lib/types/test-driver/TestValidationErrorCompletionStream.d.ts +9 -0
package/lib/types/test-driver/TestValidationErrorCompletionStream.d.ts.map +1 -0
package/lib/types/test-driver/index.d.ts +24 -0
package/lib/types/test-driver/index.d.ts.map +1 -0
package/lib/types/test-driver/utils.d.ts +5 -0
package/lib/types/test-driver/utils.d.ts.map +1 -0
package/lib/types/togetherai/index.d.ts +3 -3
package/lib/types/togetherai/index.d.ts.map +1 -1
package/lib/types/vertexai/index.d.ts +10 -7
package/lib/types/vertexai/index.d.ts.map +1 -1
package/lib/types/vertexai/models/claude.d.ts.map +1 -1
package/lib/types/vertexai/models/gemini.d.ts +3 -2
package/lib/types/vertexai/models/gemini.d.ts.map +1 -1
package/lib/types/vertexai/models/imagen.d.ts +2 -2
package/lib/types/vertexai/models/imagen.d.ts.map +1 -1
package/lib/types/vertexai/models/llama.d.ts +2 -2
package/lib/types/vertexai/models/llama.d.ts.map +1 -1
package/lib/types/vertexai/models.d.ts +2 -2
package/lib/types/vertexai/models.d.ts.map +1 -1
package/lib/types/watsonx/index.d.ts +3 -3
package/lib/types/watsonx/index.d.ts.map +1 -1
package/lib/types/xai/index.d.ts.map +1 -1
package/package.json +29 -25
package/src/adobe/firefly.ts +12 -20
package/src/azure/azure_foundry.ts +458 -0
package/src/bedrock/index.ts +65 -43
package/src/groq/index.ts +219 -32
package/src/huggingface_ie.ts +13 -14
package/src/index.ts +3 -2
package/src/mistral/index.ts +11 -9
package/src/openai/azure_openai.ts +92 -0
package/src/openai/index.ts +27 -28
package/src/openai/openai.ts +2 -5
package/src/openai/openai_format.ts +165 -0
package/src/replicate.ts +12 -12
package/src/{test → test-driver}/utils.ts +1 -1
package/src/togetherai/index.ts +7 -7
package/src/vertexai/embeddings/embeddings-text.ts +2 -2
package/src/vertexai/index.ts +104 -38
package/src/vertexai/models/claude.ts +18 -16
package/src/vertexai/models/gemini.ts +195 -67
package/src/vertexai/models/imagen.ts +15 -26
package/src/vertexai/models/llama.ts +6 -5
package/src/vertexai/models.ts +4 -4
package/src/watsonx/index.ts +10 -10
package/src/xai/index.ts +13 -15
package/lib/cjs/openai/azure.js +0 -31
package/lib/cjs/openai/azure.js.map +0 -1
package/lib/esm/openai/azure.js +0 -27
package/lib/esm/openai/azure.js.map +0 -1
package/lib/types/openai/azure.d.ts +0 -20
package/lib/types/openai/azure.d.ts.map +0 -1
package/src/openai/azure.ts +0 -54
package/src/{test → test-driver}/TestErrorCompletionStream.ts +0 -0
package/src/{test → test-driver}/TestValidationErrorCompletionStream.ts +0 -0
package/src/{test → test-driver}/index.ts +0 -0

package/src/replicate.ts CHANGED Viewed

@@ -2,7 +2,7 @@ import {
     AIModel,
     AbstractDriver,
     Completion,
-    CompletionChunk,
+    CompletionChunkObject,
     DataSource,
     DriverOptions,
     EmbeddingsResult,
@@ -64,12 +64,12 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
         };
     }
-    async requestTextCompletionStream(prompt: string, options: ExecutionOptions): Promise<AsyncIterable<CompletionChunk>> {
+    async requestTextCompletionStream(prompt: string, options: ExecutionOptions): Promise<AsyncIterable<CompletionChunkObject>> {
         if (options.model_options?._option_id !== "text-fallback") {
-            this.logger.warn("Invalid model options", {options: options.model_options });
+            this.logger.warn("Invalid model options", { options: options.model_options });
         }
         options.model_options = options.model_options as TextFallbackOptions;
         const model = ReplicateDriver.parseModelId(options.model);
         const predictionData = {
             input: {
@@ -84,11 +84,11 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
         const prediction =
             await this.service.predictions.create(predictionData);
-        const stream = new EventStream<CompletionChunk>();
+        const stream = new EventStream<CompletionChunkObject>();
         const source = new EventSource(prediction.urls.stream!);
         source.addEventListener("output", (e: any) => {
-            stream.push(e.data);
+            stream.push({result: [{ type: "text", value: e.data }] });
         });
         source.addEventListener("error", (e: any) => {
             let error: any;
@@ -97,7 +97,7 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
             } catch (error) {
                 error = JSON.stringify(e);
             }
-            this.logger?.error("Error in SSE stream", {e, error});
+            this.logger?.error("Error in SSE stream", { e, error });
         });
         source.addEventListener("done", () => {
             try {
@@ -111,7 +111,7 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
     async requestTextCompletion(prompt: string, options: ExecutionOptions) {
         if (options.model_options?._option_id !== "text-fallback") {
-            this.logger.warn("Invalid model options", {options: options.model_options });
+            this.logger.warn("Invalid model options", { options: options.model_options });
         }
         options.model_options = options.model_options as TextFallbackOptions;
         const model = ReplicateDriver.parseModelId(options.model);
@@ -136,9 +136,9 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
         //not streaming, wait for the result
         const res = await this.service.wait(prediction, {});
-        const text = res.output.join("");
+        const text: string = res.output.join("");
         return {
-            result: text,
+            result: [{ type: "text" as const, value: text }],
             original_response: options.include_original_response ? res : undefined,
         };
     }
@@ -236,7 +236,7 @@ export class ReplicateDriver extends AbstractDriver<DriverOptions, string> {
             this.service.models.versions.list(owner, model),
         ]);
-        if (!rModel || !versions || versions.length === 0) {
+        if (!rModel || !versions || (versions as any).results?.length === 0) {
             throw new Error("Model not found or no versions available");
         }
@@ -298,7 +298,7 @@ function jobInfo(job: Prediction, modelName?: string): TrainingJob {
         status = TrainingJobStatus.succeeded;
     } else if (jobStatus === 'failed') {
         status = TrainingJobStatus.failed;
-        const error = job.error as any;
+        const error = job.error as any;
         if (typeof error === 'string') {
             details = error;
         } else {

package/src/{test → test-driver}/utils.ts RENAMED Viewed

@@ -8,7 +8,7 @@ export function throwError(message: string, prompt: PromptSegment[]): never {
 export function createValidationErrorCompletion(segments: PromptSegment[]) {
     return {
-        result: "An invalid result",
+        result: [{ type: "text", value: "An invalid result" }],
         prompt: segments,
         execution_time: 3000,
         error: {

package/src/togetherai/index.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { AIModel, AbstractDriver, Completion, CompletionChunk, DriverOptions, EmbeddingsResult, ExecutionOptions, TextFallbackOptions } from "@llumiverse/core";
+import { AIModel, AbstractDriver, Completion, CompletionChunkObject, DriverOptions, EmbeddingsResult, ExecutionOptions, TextFallbackOptions } from "@llumiverse/core";
 import { transformSSEStream } from "@llumiverse/core/async";
 import { FetchClient } from "@vertesia/api-fetch-client";
 import { TextCompletion, TogetherModelInfo } from "./interfaces.js";
@@ -29,9 +29,9 @@ export class TogetherAIDriver extends AbstractDriver<TogetherAIDriverOptions, st
             } : undefined;
     }
-    async requestTextCompletion(prompt: string, options: ExecutionOptions): Promise<Completion<any>> {
+    async requestTextCompletion(prompt: string, options: ExecutionOptions): Promise<Completion> {
         if (options.model_options?._option_id !== "text-fallback") {
-            this.logger.warn("Invalid model options", {options: options.model_options });
+            this.logger.warn("Invalid model options", { options: options.model_options });
         }
         options.model_options = options.model_options as TextFallbackOptions;
@@ -60,7 +60,7 @@ export class TogetherAIDriver extends AbstractDriver<TogetherAIDriverOptions, st
         const text = choice.text ?? '';
         const usage = res.usage || {};
         return {
-            result: text,
+            result: [{ type: "text", value: text }],
             token_usage: {
                 prompt: usage.prompt_tokens,
                 result: usage.completion_tokens,
@@ -71,9 +71,9 @@ export class TogetherAIDriver extends AbstractDriver<TogetherAIDriverOptions, st
         }
     }
-    async requestTextCompletionStream(prompt: string, options: ExecutionOptions): Promise<AsyncIterable<CompletionChunk>> {
+    async requestTextCompletionStream(prompt: string, options: ExecutionOptions): Promise<AsyncIterable<CompletionChunkObject>> {
         if (options.model_options?._option_id !== "text-fallback") {
-            this.logger.warn("Invalid model options", {options: options.model_options });
+            this.logger.warn("Invalid model options", { options: options.model_options });
         }
         options.model_options = options.model_options as TextFallbackOptions;
@@ -103,7 +103,7 @@ export class TogetherAIDriver extends AbstractDriver<TogetherAIDriverOptions, st
         return transformSSEStream(stream, (data: string) => {
             const json = JSON.parse(data);
             return {
-                result: json.choices[0]?.text ?? '',
+                result: [{ type: "text", value: json.choices[0]?.text ?? '' }],
                 finish_reason: json.choices[0]?.finish_reason,          //Uses expected "stop" , "length" format
                 token_usage: {
                     prompt: json.usage?.prompt_tokens,

package/src/vertexai/embeddings/embeddings-text.ts CHANGED Viewed

@@ -36,9 +36,9 @@ export async function getEmbeddingsForText(driver: VertexAIDriver, options: Text
             title: options.title,
             content: options.content
         }]
-    } as EmbeddingsForTextPrompt;
+    } satisfies EmbeddingsForTextPrompt;
-    const model = options.model || "text-embedding-004";
+    const model = options.model || "gemini-embedding-001";
     const client = driver.getFetchClient();

package/src/vertexai/index.ts CHANGED Viewed

@@ -2,11 +2,10 @@ import {
     AIModel,
     AbstractDriver,
     Completion,
-    CompletionChunk,
+    CompletionChunkObject,
     DriverOptions,
     EmbeddingsResult,
     ExecutionOptions,
-    ImageGeneration,
     Modalities,
     ModelSearchPayload,
     PromptSegment,
@@ -20,10 +19,10 @@ import { TextEmbeddingsOptions, getEmbeddingsForText } from "./embeddings/embedd
 import { getModelDefinition } from "./models.js";
 import { EmbeddingsOptions } from "@llumiverse/core";
 import { getEmbeddingsForImages } from "./embeddings/embeddings-image.js";
-import { v1beta1 } from "@google-cloud/aiplatform";
+import { PredictionServiceClient, v1beta1 } from "@google-cloud/aiplatform";
 import { AnthropicVertex } from "@anthropic-ai/vertex-sdk";
 import { ImagenModelDefinition, ImagenPrompt } from "./models/imagen.js";
-import { GoogleGenAI, Content } from "@google/genai";
+import { GoogleGenAI, Content, Model } from "@google/genai";
 export interface VertexAIDriverOptions extends DriverOptions {
     project: string;
@@ -54,6 +53,7 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
     googleGenAI: GoogleGenAI | undefined;
     llamaClient: FetchClient & { region?: string } | undefined;
     modelGarden: v1beta1.ModelGardenServiceClient | undefined;
+    imagenClient: PredictionServiceClient | undefined;
     authClient: JSONClient | GoogleAuth<JSONClient>;
@@ -66,16 +66,28 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
         this.googleGenAI = undefined;
         this.modelGarden = undefined;
         this.llamaClient = undefined;
+        this.imagenClient = undefined;
         this.authClient = options.googleAuthOptions?.authClient ?? new GoogleAuth(options.googleAuthOptions);
     }
-    public getGoogleGenAIClient(): GoogleGenAI {
-        //Lazy initialisation
+    public getGoogleGenAIClient(region: string = this.options.region): GoogleGenAI {
+        //Lazy initialization
+        if (region !== this.options.region) {
+            //Get one off client for different region
+            return new GoogleGenAI({
+                project: this.options.project,
+                location: region,
+                vertexai: true,
+                googleAuthOptions: {
+                    authClient: this.authClient as JSONClient,
+                }
+            });
+        }
         if (!this.googleGenAI) {
             this.googleGenAI = new GoogleGenAI({
                 project: this.options.project,
-                location: this.options.region,
+                location: region,
                 vertexai: true,
                 googleAuthOptions: {
                     authClient: this.authClient as JSONClient,
@@ -86,7 +98,7 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
     }
     public getFetchClient(): FetchClient {
-        //Lazy initialisation
+        //Lazy initialization
         if (!this.fetchClient) {
             this.fetchClient = createFetchClient({
                 region: this.options.region,
@@ -101,7 +113,7 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
     }
     public getLLamaClient(region: string = "us-central1"): FetchClient {
-        //Lazy initialisation
+        //Lazy initialization
         if (!this.llamaClient || this.llamaClient["region"] !== region) {
             this.llamaClient = createFetchClient({
                 region: region,
@@ -119,19 +131,24 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
     }
     public getAnthropicClient(): AnthropicVertex {
-        //Lazy initialisation
+        //Lazy initialization
         if (!this.anthropicClient) {
             this.anthropicClient = new AnthropicVertex({
                 timeout: 20 * 60 * 10000, // Set to 20 minutes, 10 minute default, setting this disables long request error: https://github.com/anthropics/anthropic-sdk-typescript?#long-requests
                 region: "us-east5",
-                projectId: process.env.GOOGLE_PROJECT_ID,
+                projectId: this.options.project,
+                googleAuth: new GoogleAuth({
+                    scopes: ["https://www.googleapis.com/auth/cloud-platform"],
+                    authClient: this.authClient as JSONClient,
+                    projectId: this.options.project,
+                }),
             });
         }
         return this.anthropicClient;
     }
     public getAIPlatformClient(): v1beta1.ModelServiceClient {
-        //Lazy initialisation
+        //Lazy initialization
         if (!this.aiplatform) {
             this.aiplatform = new v1beta1.ModelServiceClient({
                 projectId: this.options.project,
@@ -143,7 +160,7 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
     }
     public getModelGardenClient(): v1beta1.ModelGardenServiceClient {
-        //Lazy initialisation
+        //Lazy initialization
         if (!this.modelGarden) {
             this.modelGarden = new v1beta1.ModelGardenServiceClient({
                 projectId: this.options.project,
@@ -154,6 +171,19 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
         return this.modelGarden;
     }
+    public getImagenClient(): PredictionServiceClient {
+        //Lazy initialization
+        if (!this.imagenClient) {
+            // TODO: make location configurable, fixed to us-central1 for now
+            this.imagenClient = new PredictionServiceClient({
+                projectId: this.options.project,
+                apiEndpoint: `us-central1-${API_BASE_PATH}`,
+                authClient: this.authClient as JSONClient,
+            });
+        }
+        return this.imagenClient;
+    }
     validateResult(result: Completion, options: ExecutionOptions) {
         // Optionally preprocess the result before validation
         const modelDef = getModelDefinition(options.model);
@@ -180,44 +210,42 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
         return getModelDefinition(options.model).createPrompt(this, segments, options);
     }
-    async requestTextCompletion(prompt: VertexAIPrompt, options: ExecutionOptions): Promise<Completion<any>> {
+    async requestTextCompletion(prompt: VertexAIPrompt, options: ExecutionOptions): Promise<Completion> {
         return getModelDefinition(options.model).requestTextCompletion(this, prompt, options);
     }
     async requestTextCompletionStream(
         prompt: VertexAIPrompt,
         options: ExecutionOptions,
-    ): Promise<AsyncIterable<CompletionChunk>> {
+    ): Promise<AsyncIterable<CompletionChunkObject>> {
         return getModelDefinition(options.model).requestTextCompletionStream(this, prompt, options);
     }
     async requestImageGeneration(
         _prompt: ImagenPrompt,
         _options: ExecutionOptions,
-    ): Promise<Completion<ImageGeneration>> {
+    ): Promise<Completion> {
         const splits = _options.model.split("/");
         const modelName = trimModelName(splits[splits.length - 1]);
         return new ImagenModelDefinition(modelName).requestImageGeneration(this, _prompt, _options);
     }
+    async getGenAIModelsArray(client: GoogleGenAI): Promise<Model[]> {
+        const models: Model[] = [];
+        const pager = await client.models.list();
+        for await (const item of pager) {
+            models.push(item);
+        }
+        return models;
+    }
     async listModels(_params?: ModelSearchPayload): Promise<AIModel<string>[]> {
         // Get clients
         const modelGarden = this.getModelGardenClient();
         const aiplatform = this.getAIPlatformClient();
+        const globalGenAiClient = this.getGoogleGenAIClient("global");
         let models: AIModel<string>[] = [];
-        //Project specific deployed models
-        const [response] = await aiplatform.listModels({
-            parent: `projects/${this.options.project}/locations/${this.options.region}`,
-        });
-        models = models.concat(
-            response.map((model) => ({
-                id: model.name?.split("/").pop() ?? "",
-                name: model.displayName ?? "",
-                provider: "vertexai"
-            })),
-        );
         //Model Garden Publisher models - Pretrained models
         const publishers = ["google", "anthropic", "meta"];
         // Meta "maas" models are LLama Models-As-A-Service. Non-maas models are not pre-deployed.
@@ -225,7 +253,9 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
         // Additional models not in the listings, but we want to include
         // TODO: Remove once the models are available in the listing API, or no longer needed
         const additionalModels = {
-            google: ["imagen-3.0-fast-generate-001"],
+            google: [
+                "imagen-3.0-fast-generate-001",
+            ],
             anthropic: [],
             meta: [
                 "llama-4-maverick-17b-128e-instruct-maas",
@@ -241,25 +271,61 @@ export class VertexAIDriver extends AbstractDriver<VertexAIDriverOptions, Vertex
         //Used to exclude retired models that are still in the listing API but not available for use.
         //Or models we do not support yet
         const unsupportedModelsByPublisher = {
-            google: ["gemini-pro", "gemini-ultra"],
+            google: ["gemini-pro", "gemini-ultra", "imagen-product-recontext-preview", "embedding"],
             anthropic: [],
             meta: [],
         };
-        for (const publisher of publishers) {
-            let [response] = await modelGarden.listPublisherModels({
+        // Start all network requests in parallel
+        const aiplatformPromise = aiplatform.listModels({
+            parent: `projects/${this.options.project}/locations/${this.options.region}`,
+        });
+        const publisherPromises = publishers.map(async (publisher) => {
+            const [response] = await modelGarden.listPublisherModels({
                 parent: `publishers/${publisher}`,
                 orderBy: "name",
                 listAllVersions: true,
             });
+            return { publisher, response };
+        });
-            // Filter out the 100+ long list coming from Google models
-            if (publisher === "google") {
-                response = response.filter((model) => {
-                    return (model.supportedActions?.openGenerationAiStudio || undefined) !== undefined;
-                });
-            }
+        const globalGooglePromise = this.getGenAIModelsArray(globalGenAiClient);
+        // Await all network requests
+        const [aiplatformResult, globalGoogleResult, ...publisherResults] = await Promise.all([
+            aiplatformPromise,
+            globalGooglePromise,
+            ...publisherPromises,
+        ]);
+        // Process aiplatform models, project specific models
+        const [response] = aiplatformResult;
+        models = models.concat(
+            response.map((model) => ({
+                id: model.name?.split("/").pop() ?? "",
+                name: model.displayName ?? "",
+                provider: "vertexai"
+            }))
+        );
+        // Process global google models from GenAI
+        models = models.concat(
+            globalGoogleResult.map((model) => {
+                const modelCapability = getModelCapabilities(model.name ?? '', "vertexai");
+                return {
+                    id: "locations/global/" + model.name,
+                    name: "Global " + model.name?.split('/').pop(),
+                    provider: "vertexai",
+                    owner: "google",
+                    input_modalities: modelModalitiesToArray(modelCapability.input),
+                    output_modalities: modelModalitiesToArray(modelCapability.output),
+                    tool_support: modelCapability.tool_support,
+                };
+            })
+        );
+        // Process publisher models
+        for (const result of publisherResults) {
+            const { publisher, response } = result;
             const modelFamily = supportedModels[publisher as keyof typeof supportedModels];
             const retiredModels = unsupportedModelsByPublisher[publisher as keyof typeof unsupportedModelsByPublisher];

package/src/vertexai/models/claude.ts CHANGED Viewed

@@ -72,11 +72,13 @@ function maxToken(option: StatelessExecutionOptions): number {
     if (modelOptions && typeof modelOptions.max_tokens === "number") {
         return modelOptions.max_tokens;
     } else {
+        const thinking_budget = modelOptions?.thinking_budget_tokens ?? 0;
+        let maxSupportedTokens = getMaxTokensLimitVertexAi(option.model);
         // Fallback to the default max tokens limit for the model
-        if (option.model.includes('claude-3-7-sonnet') && (modelOptions?.thinking_budget_tokens ?? 0) < 64000) {
-            return 64000; // Claude 3.7 can go up to 128k with a beta header, but when no max tokens is specified, we default to 64k.
+        if (option.model.includes('claude-3-7-sonnet') && (modelOptions?.thinking_budget_tokens ?? 0) < 48000) {
+            maxSupportedTokens = 64000; // Claude 3.7 can go up to 128k with a beta header, but when no max tokens is specified, we default to 64k.
         }
-        return getMaxTokensLimitVertexAi(option.model);
+        return Math.min(16000 + thinking_budget, maxSupportedTokens); // Cap to 16k, to avoid taking up too much context window and quota.
     }
 }
@@ -85,7 +87,7 @@ async function collectFileBlocks(segment: PromptSegment, restrictedTypes: true):
 async function collectFileBlocks(segment: PromptSegment, restrictedTypes?: false): Promise<ContentBlockParam[]>;
 async function collectFileBlocks(segment: PromptSegment, restrictedTypes: boolean = false): Promise<ContentBlockParam[]> {
     const contentBlocks: ContentBlockParam[] = [];
     for (const file of segment.files || []) {
         if (file.mime_type?.startsWith("image/")) {
             const allowedTypes = ["image/png", "image/jpeg", "image/gif", "image/webp"];
@@ -126,7 +128,7 @@ async function collectFileBlocks(segment: PromptSegment, restrictedTypes: boolea
             }
         }
     }
     return contentBlocks;
 }
@@ -189,7 +191,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                         text: segment.content
                     } satisfies TextBlockParam);
                 }
                 // Collect file blocks with type safety
                 const fileBlocks = await collectFileBlocks(segment, true);
                 contentBlocks.push(...fileBlocks);
@@ -206,7 +208,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
             } else {
                 // Build content blocks for regular messages (all types allowed)
                 const contentBlocks: ContentBlockParam[] = [];
                 if (segment.content) {
                     contentBlocks.push({
                         type: 'text',
@@ -271,7 +273,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
         conversation = updateConversation(conversation, createPromptFromResponse(result));
         return {
-            result: text ?? '',
+            result: text ? [{ type: "text", value: text }] : [{ type: "text", value: '' }],
             tool_use,
             token_usage: {
                 prompt: result.usage.input_tokens,
@@ -301,7 +303,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
             switch (streamEvent.type) {
                 case "message_start":
                     return {
-                        result: '',
+                        result: [{ type: "text", value: '' }],
                         token_usage: {
                             prompt: streamEvent.message.usage.input_tokens,
                             result: streamEvent.message.usage.output_tokens
@@ -309,7 +311,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                     } satisfies CompletionChunkObject;
                 case "message_delta":
                     return {
-                        result: '',
+                        result: [{ type: "text", value: '' }],
                         token_usage: {
                             result: streamEvent.usage.output_tokens
                         },
@@ -319,7 +321,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                     // Handle redacted thinking blocks
                     if (streamEvent.content_block.type === "redacted_thinking" && model_options?.include_thoughts) {
                         return {
-                            result: `[Redacted thinking: ${streamEvent.content_block.data}]`
+                            result: [{ type: "text", value: `[Redacted thinking: ${streamEvent.content_block.data}]` }]
                         } satisfies CompletionChunkObject;
                     }
                     break;
@@ -328,12 +330,12 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                     switch (streamEvent.delta.type) {
                         case "text_delta":
                             return {
-                                result: streamEvent.delta.text ?? ''
+                                result: streamEvent.delta.text ? [{ type: "text", value: streamEvent.delta.text }] : []
                             } satisfies CompletionChunkObject;
                         case "thinking_delta":
                             if (model_options?.include_thoughts) {
                                 return {
-                                    result: streamEvent.delta.thinking ?? '',
+                                    result: streamEvent.delta.thinking ? [{ type: "text", value: streamEvent.delta.thinking }] : [],
                                 } satisfies CompletionChunkObject;
                             }
                             break;
@@ -341,7 +343,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                             // Signature deltas, signify the end of the thoughts.
                             if (model_options?.include_thoughts) {
                                 return {
-                                    result: '\n\n', // Double newline for more spacing
+                                    result: [{ type: "text", value: '\n\n' }], // Double newline for more spacing
                                 } satisfies CompletionChunkObject;
                             }
                             break;
@@ -351,7 +353,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
                     // Handle the end of content blocks, for redacted thinking blocks
                     if (model_options?.include_thoughts) {
                         return {
-                            result: '\n\n' // Add double newline for spacing
+                            result: [{ type: "text", value: '\n\n' }] // Add double newline for spacing
                         } satisfies CompletionChunkObject;
                     }
                     break;
@@ -359,7 +361,7 @@ export class ClaudeModelDefinition implements ModelDefinition<ClaudePrompt> {
             // Default case for all other event types
             return {
-                result: ''
+                result: []
             } satisfies CompletionChunkObject;
         });