@saltcorn/large-language-model 0.6.5 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3) hide show
  1. package/generate.js +126 -6
  2. package/index.js +194 -4
  3. package/package.json +5 -2
package/generate.js CHANGED
@@ -2,6 +2,13 @@ const fetch = require("node-fetch");
2
2
  const util = require("util");
3
3
  const exec = util.promisify(require("child_process").exec);
4
4
  const db = require("@saltcorn/data/db");
5
+ const { VertexAI } = require("@google-cloud/vertexai");
6
+ const {
7
+ PredictionServiceClient,
8
+ helpers,
9
+ } = require("@google-cloud/aiplatform");
10
+ const { google } = require("googleapis");
11
+ const Plugin = require("@saltcorn/data/models/plugin");
5
12
 
6
13
  const { features, getState } = require("@saltcorn/data/db/state");
7
14
  let ollamaMod;
@@ -57,6 +64,13 @@ const getEmbedding = async (config, opts) => {
57
64
  //console.log("embedding response ", olres);
58
65
  return olres.embedding;
59
66
  }
67
+ case "Google Vertex AI":
68
+ const oauth2Client = await initOAuth2Client(config);
69
+ if (oauth2Client.isTokenExpiring()) {
70
+ const { credentials } = await oauth2Client.refreshAccessToken();
71
+ await updatePluginTokenCfg(credentials);
72
+ }
73
+ return await getEmbeddingGoogleVertex(config, opts, oauth2Client);
60
74
  default:
61
75
  throw new Error("Not implemented for this backend");
62
76
  }
@@ -117,6 +131,13 @@ const getCompletion = async (config, opts) => {
117
131
  { cwd: config.llama_dir }
118
132
  );
119
133
  return stdout;
134
+ case "Google Vertex AI":
135
+ const oauth2Client = await initOAuth2Client(config);
136
+ if (oauth2Client.isTokenExpiring()) {
137
+ const { credentials } = await oauth2Client.refreshAccessToken();
138
+ await updatePluginTokenCfg(credentials);
139
+ }
140
+ return await getCompletionGoogleVertex(config, opts, oauth2Client);
120
141
  default:
121
142
  break;
122
143
  }
@@ -174,12 +195,12 @@ const getCompletionOpenAICompatible = async (
174
195
  console.log("OpenAI response", JSON.stringify(results, null, 2));
175
196
  if (results.error) throw new Error(`OpenAI error: ${results.error.message}`);
176
197
 
177
- return (
178
- results?.choices?.[0]?.message?.content ||
179
- (results?.choices?.[0]?.message?.tool_calls
180
- ? { tool_calls: results?.choices?.[0]?.message?.tool_calls }
181
- : null)
182
- );
198
+ return results?.choices?.[0]?.message?.tool_calls
199
+ ? {
200
+ tool_calls: results?.choices?.[0]?.message?.tool_calls,
201
+ content: results?.choices?.[0]?.message?.content || null,
202
+ }
203
+ : results?.choices?.[0]?.message?.content || null;
183
204
  };
184
205
 
185
206
  const getEmbeddingOpenAICompatible = async (
@@ -211,4 +232,103 @@ const getEmbeddingOpenAICompatible = async (
211
232
  if (Array.isArray(prompt)) return results?.data?.map?.((d) => d?.embedding);
212
233
  return results?.data?.[0]?.embedding;
213
234
  };
235
+
236
+ const updatePluginTokenCfg = async (credentials) => {
237
+ let plugin = await Plugin.findOne({ name: "large-language-model" });
238
+ if (!plugin) {
239
+ plugin = await Plugin.findOne({
240
+ name: "@saltcorn/large-language-model",
241
+ });
242
+ }
243
+ const newConfig = {
244
+ ...(plugin.configuration || {}),
245
+ tokens: credentials,
246
+ };
247
+ plugin.configuration = newConfig;
248
+ await plugin.upsert();
249
+ getState().processSend({
250
+ refresh_plugin_cfg: plugin.name,
251
+ tenant: db.getTenantSchema(),
252
+ });
253
+ };
254
+
255
+ const initOAuth2Client = async (config) => {
256
+ const { client_id, client_secret } = config || {};
257
+ const state = getState();
258
+ const pluginCfg =
259
+ state.plugin_cfgs.large_language_model ||
260
+ state.plugin_cfgs["@saltcorn/large-language-model"];
261
+ const baseUrl = (
262
+ getState().getConfig("base_url") || "http://localhost:3000"
263
+ ).replace(/\/$/, "");
264
+ const redirect_uri = `${baseUrl}/callback`;
265
+
266
+ const oauth2Client = new google.auth.OAuth2(
267
+ client_id,
268
+ client_secret,
269
+ redirect_uri
270
+ );
271
+ oauth2Client.setCredentials(pluginCfg.tokens);
272
+ return oauth2Client;
273
+ };
274
+
275
+ const getCompletionGoogleVertex = async (config, opts, oauth2Client) => {
276
+ const vertexAI = new VertexAI({
277
+ project: config.project_id,
278
+ location: config.region || "us-central1",
279
+ googleAuthOptions: {
280
+ authClient: oauth2Client,
281
+ },
282
+ });
283
+ const generativeModel = vertexAI.getGenerativeModel({
284
+ model: config.model,
285
+ });
286
+ const chat = generativeModel.startChat();
287
+ const result = await chat.sendMessageStream(opts.prompt);
288
+ const chunks = [];
289
+ for await (const item of result.stream) {
290
+ chunks.push(item.candidates[0].content.parts[0].text);
291
+ }
292
+ return chunks.join();
293
+ };
294
+
295
+ const getEmbeddingGoogleVertex = async (config, opts, oauth2Client) => {
296
+ const predClient = new PredictionServiceClient({
297
+ apiEndpoint: "us-central1-aiplatform.googleapis.com",
298
+ authClient: oauth2Client,
299
+ });
300
+ const model = config.embed_model || "text-embedding-005";
301
+ let instances = null;
302
+ if (Array.isArray(opts.prompt)) {
303
+ instances = opts.prompt.map((p) =>
304
+ helpers.toValue({
305
+ content: p,
306
+ task_type: config.task_type || "RETRIEVAL_QUERY",
307
+ })
308
+ );
309
+ } else {
310
+ instances = [
311
+ helpers.toValue({
312
+ content: opts.prompt,
313
+ task_type: config.task_type || "RETRIEVAL_QUERY",
314
+ }),
315
+ ];
316
+ }
317
+ const [response] = await predClient.predict({
318
+ endpoint: `projects/${config.project_id}/locations/${
319
+ config.region || "us-central1"
320
+ }/publishers/google/models/${model}`,
321
+ instances,
322
+ // default outputDimensionality is 768, can be changed with:
323
+ // parameters: helpers.toValue({ outputDimensionality: parseInt(512) }),
324
+ });
325
+ const predictions = response.predictions;
326
+ const embeddings = predictions.map((p) => {
327
+ const embeddingsProto = p.structValue.fields.embeddings;
328
+ const valuesProto = embeddingsProto.structValue.fields.values;
329
+ return valuesProto.listValue.values.map((v) => v.numberValue);
330
+ });
331
+ return embeddings;
332
+ };
333
+
214
334
  module.exports = { getCompletion, getEmbedding };
package/index.js CHANGED
@@ -1,11 +1,15 @@
1
1
  const Workflow = require("@saltcorn/data/models/workflow");
2
2
  const Form = require("@saltcorn/data/models/form");
3
3
  const FieldRepeat = require("@saltcorn/data/models/fieldrepeat");
4
+ const Plugin = require("@saltcorn/data/models/plugin");
5
+ const { domReady } = require("@saltcorn/markup/tags");
4
6
  const db = require("@saltcorn/data/db");
5
7
  const { getCompletion, getEmbedding } = require("./generate");
6
8
  const { OPENAI_MODELS } = require("./constants.js");
7
9
  const { eval_expression } = require("@saltcorn/data/models/expression");
8
10
  const { interpolate } = require("@saltcorn/data/utils");
11
+ const { getState } = require("@saltcorn/data/db/state");
12
+ const { google } = require("googleapis");
9
13
 
10
14
  const configuration_workflow = () =>
11
15
  new Workflow({
@@ -15,6 +19,35 @@ const configuration_workflow = () =>
15
19
  form: async (context) => {
16
20
  const isRoot = db.getTenantSchema() === db.connectObj.default_schema;
17
21
  return new Form({
22
+ additionalHeaders: [
23
+ {
24
+ headerTag: `<script>
25
+ function backendChange(e) {
26
+ const val = e.value;
27
+ const authBtn = document.getElementById('vertex_authorize_btn');
28
+ if (val === 'Google Vertex AI') {
29
+ authBtn.classList.remove('d-none');
30
+ } else {
31
+ authBtn.classList.add('d-none');
32
+ }
33
+ }
34
+ ${domReady(`
35
+ const backend = document.getElementById('inputbackend');
36
+ if (backend) {
37
+ backendChange(backend);
38
+ }`)}
39
+ </script>`,
40
+ },
41
+ ],
42
+ additionalButtons: [
43
+ {
44
+ label: "authorize",
45
+ id: "vertex_authorize_btn",
46
+ onclick:
47
+ "location.href='/large-language-model/vertex/authorize'",
48
+ class: "btn btn-primary d-none",
49
+ },
50
+ ],
18
51
  fields: [
19
52
  {
20
53
  name: "backend",
@@ -27,8 +60,85 @@ const configuration_workflow = () =>
27
60
  "OpenAI-compatible API",
28
61
  "Local Ollama",
29
62
  ...(isRoot ? ["Local llama.cpp"] : []),
63
+ "Google Vertex AI",
64
+ ],
65
+ onChange: "backendChange(this)",
66
+ },
67
+ },
68
+ {
69
+ name: "client_id",
70
+ label: "Client ID",
71
+ sublabel: "OAuth2 client ID from your Google Cloud account",
72
+ type: "String",
73
+ required: true,
74
+ showIf: { backend: "Google Vertex AI" },
75
+ },
76
+ {
77
+ name: "client_secret",
78
+ label: "Client Secret",
79
+ sublabel: "Client secret from your Google Cloud account",
80
+ type: "String",
81
+ required: true,
82
+ showIf: { backend: "Google Vertex AI" },
83
+ },
84
+ {
85
+ name: "project_id",
86
+ label: "Project ID",
87
+ sublabel: "Google Cloud project ID",
88
+ type: "String",
89
+ required: true,
90
+ showIf: { backend: "Google Vertex AI" },
91
+ },
92
+ {
93
+ name: "model",
94
+ label: "Model",
95
+ type: "String",
96
+ showIf: { backend: "Google Vertex AI" },
97
+ attributes: {
98
+ options: ["gemini-1.5-pro", "gemini-1.5-flash"],
99
+ },
100
+ required: true,
101
+ },
102
+ {
103
+ name: "embed_model",
104
+ label: "Embedding model",
105
+ type: "String",
106
+ required: true,
107
+ showIf: { backend: "Google Vertex AI" },
108
+ attributes: {
109
+ options: [
110
+ "text-embedding-005",
111
+ "text-embedding-004",
112
+ "textembedding-gecko@003",
30
113
  ],
31
114
  },
115
+ default: "text-embedding-005",
116
+ },
117
+ {
118
+ name: "embed_task_type",
119
+ label: "Embedding task type",
120
+ type: "String",
121
+ showIf: { backend: "Google Vertex AI" },
122
+ attributes: {
123
+ options: [
124
+ "RETRIEVAL_QUERY",
125
+ "RETRIEVAL_DOCUMENT",
126
+ "SEMANTIC_SIMILARITY",
127
+ "CLASSIFICATION",
128
+ "CLUSTERING",
129
+ "QUESTION_ANSWERING",
130
+ "FACT_VERIFICATION",
131
+ "CODE_RETRIEVAL_QUERY",
132
+ ],
133
+ },
134
+ default: "RETRIEVAL_QUERY",
135
+ },
136
+ {
137
+ name: "region",
138
+ label: "Region",
139
+ sublabel: "Google Cloud region (default: us-central1)",
140
+ type: "String",
141
+ default: "us-central1",
32
142
  },
33
143
  {
34
144
  name: "api_key",
@@ -186,14 +296,90 @@ const functions = (config) => {
186
296
  };
187
297
  };
188
298
 
299
+ const routes = (config) => {
300
+ return [
301
+ {
302
+ url: "/large-language-model/vertex/authorize",
303
+ method: "get",
304
+ callback: async (req, res) => {
305
+ const { client_id, client_secret } = config || {};
306
+ const baseUrl = (
307
+ getState().getConfig("base_url") || "http://localhost:3000"
308
+ ).replace(/\/$/, "");
309
+ const redirect_uri = `${baseUrl}/large-language-model/vertex/callback`;
310
+ const oauth2Client = new google.auth.OAuth2(
311
+ client_id,
312
+ client_secret,
313
+ redirect_uri
314
+ );
315
+ const authUrl = oauth2Client.generateAuthUrl({
316
+ access_type: "offline",
317
+ scope: "https://www.googleapis.com/auth/cloud-platform",
318
+ });
319
+ res.redirect(authUrl);
320
+ },
321
+ },
322
+ {
323
+ url: "/large-language-model/vertex/callback",
324
+ method: "get",
325
+ callback: async (req, res) => {
326
+ const { client_id, client_secret } = config || {};
327
+ const baseUrl = (
328
+ getState().getConfig("base_url") || "http://localhost:3000"
329
+ ).replace(/\/$/, "");
330
+ const redirect_uri = `${baseUrl}/large-language-model/vertex/callback`;
331
+ const oauth2Client = new google.auth.OAuth2(
332
+ client_id,
333
+ client_secret,
334
+ redirect_uri
335
+ );
336
+ let plugin = await Plugin.findOne({ name: "large-language-model" });
337
+ if (!plugin) {
338
+ plugin = await Plugin.findOne({
339
+ name: "@saltcorn/large-language-model",
340
+ });
341
+ }
342
+ try {
343
+ const code = req.query.code;
344
+ if (!code) throw new Error("Missing code in query string.");
345
+ const { tokens } = await oauth2Client.getToken(code);
346
+ if (!tokens.refresh_token) {
347
+ req.flash(
348
+ "warning",
349
+ req.__(
350
+ "No refresh token received. Please revoke the plugin's access and try again."
351
+ )
352
+ );
353
+ } else {
354
+ const newConfig = { ...(plugin.configuration || {}), tokens };
355
+ plugin.configuration = newConfig;
356
+ await plugin.upsert();
357
+ req.flash(
358
+ "success",
359
+ req.__("Authentication successful! You can now use Vertex AI.")
360
+ );
361
+ }
362
+ } catch (error) {
363
+ console.error("Error retrieving access token:", error);
364
+ req.flash("error", req.__("Error retrieving access"));
365
+ } finally {
366
+ res.redirect(`/plugins/configure/${encodeURIComponent(plugin.name)}`);
367
+ }
368
+ },
369
+ },
370
+ ];
371
+ };
372
+
189
373
  module.exports = {
190
374
  sc_plugin_api_version: 1,
191
375
  configuration_workflow,
192
376
  functions,
193
377
  modelpatterns: require("./model.js"),
378
+ routes,
194
379
  actions: (config) => ({
195
380
  llm_function_call: require("./function-insert-action.js")(config),
196
381
  llm_generate: {
382
+ description: "Generate text with AI based on a text prompt",
197
383
  requireRow: true,
198
384
  configFields: ({ table, mode }) => {
199
385
  const override_fields =
@@ -317,7 +503,7 @@ module.exports = {
317
503
  upd[chat_history_field] = [
318
504
  ...history,
319
505
  { role: "user", content: prompt },
320
- { role: "system", content: ans },
506
+ { role: "assistant", content: ans },
321
507
  ];
322
508
  }
323
509
  if (mode === "workflow") return upd;
@@ -325,6 +511,8 @@ module.exports = {
325
511
  },
326
512
  },
327
513
  llm_generate_json: {
514
+ description:
515
+ "Generate JSON with AI based on a text prompt. You must specify the JSON fields in the configuration.",
328
516
  requireRow: true,
329
517
  configFields: ({ table, mode }) => {
330
518
  const override_fields =
@@ -427,7 +615,7 @@ module.exports = {
427
615
  label: "Multiple",
428
616
  type: "Bool",
429
617
  sublabel:
430
- "Select to generate an array of objects. Unselect for a single object",
618
+ "Select (true) to generate an array of objects. Unselect (false) for a single object",
431
619
  },
432
620
  {
433
621
  name: "gen_description",
@@ -506,13 +694,15 @@ module.exports = {
506
694
  ...opts,
507
695
  ...toolargs,
508
696
  });
509
- const ans = JSON.parse(compl.tool_calls[0].function.arguments)[answer_field];
697
+ const ans = JSON.parse(compl.tool_calls[0].function.arguments)[
698
+ answer_field
699
+ ];
510
700
  const upd = { [answer_field]: ans };
511
701
  if (chat_history_field) {
512
702
  upd[chat_history_field] = [
513
703
  ...history,
514
704
  { role: "user", content: prompt },
515
- { role: "system", content: ans },
705
+ { role: "assistant", content: ans },
516
706
  ];
517
707
  }
518
708
  if (mode === "workflow") return upd;
package/package.json CHANGED
@@ -1,13 +1,16 @@
1
1
  {
2
2
  "name": "@saltcorn/large-language-model",
3
- "version": "0.6.5",
3
+ "version": "0.7.0",
4
4
  "description": "Large language models and functionality for Saltcorn",
5
5
  "main": "index.js",
6
6
  "dependencies": {
7
7
  "@saltcorn/data": "^0.9.0",
8
8
  "node-fetch": "2.6.9",
9
9
  "underscore": "1.13.6",
10
- "ollama": "0.5.0"
10
+ "ollama": "0.5.0",
11
+ "@google-cloud/vertexai": "^1.9.3",
12
+ "@google-cloud/aiplatform": "^3.34.0",
13
+ "googleapis": "^144.0.0"
11
14
  },
12
15
  "author": "Tom Nielsen",
13
16
  "license": "MIT",