bedrock-wrapper 1.0.14 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +10 -8
- package/bedrock-models.js +55 -0
- package/bedrock-wrapper.js +3 -1
- package/example.js +3 -3
- package/package.json +2 -2
package/README.md
CHANGED
|
@@ -29,7 +29,7 @@ Bedrock Wrapper is an npm package that simplifies the integration of existing Op
|
|
|
29
29
|
```javascript
|
|
30
30
|
const openaiChatCompletionsCreateObject = {
|
|
31
31
|
"messages": messages,
|
|
32
|
-
"model": "Llama-3-8b",
|
|
32
|
+
"model": "Llama-3-1-8b",
|
|
33
33
|
"max_tokens": LLM_MAX_GEN_TOKENS,
|
|
34
34
|
"stream": true,
|
|
35
35
|
"temperature": LLM_TEMPERATURE,
|
|
@@ -94,13 +94,15 @@ Bedrock Wrapper is an npm package that simplifies the integration of existing Op
|
|
|
94
94
|
|
|
95
95
|
### Supported Models
|
|
96
96
|
|
|
97
|
-
| modelName
|
|
98
|
-
|
|
99
|
-
| Llama-3-8b
|
|
100
|
-
| Llama-3-70b
|
|
101
|
-
|
|
|
102
|
-
|
|
|
103
|
-
| Mistral-
|
|
97
|
+
| modelName | modelId |
|
|
98
|
+
|---------------|------------------------------------|
|
|
99
|
+
| Llama-3-1-8b | meta.llama3-1-8b-instruct-v1:0 |
|
|
100
|
+
| Llama-3-1-70b | meta.llama3-1-70b-instruct-v1:0 |
|
|
101
|
+
| Llama-3-8b | meta.llama3-8b-instruct-v1:0 |
|
|
102
|
+
| Llama-3-70b | meta.llama3-70b-instruct-v1:0 |
|
|
103
|
+
| Mistral-7b | mistral.mistral-7b-instruct-v0:2 |
|
|
104
|
+
| Mixtral-8x7b | mistral.mixtral-8x7b-instruct-v0:1 |
|
|
105
|
+
| Mistral-Large | mistral.mistral-large-2402-v1:0 |
|
|
104
106
|
|
|
105
107
|
To return the list programmatically you can import and call `listBedrockWrapperSupportedModels`:
|
|
106
108
|
```javascript
|
package/bedrock-models.js
CHANGED
|
@@ -1,5 +1,55 @@
|
|
|
1
1
|
// Description: This file contains the model configurations
|
|
2
2
|
export const bedrock_models = [
|
|
3
|
+
{
|
|
4
|
+
// ==================
|
|
5
|
+
// == Llama 3.1 8b ==
|
|
6
|
+
// ==================
|
|
7
|
+
"modelName": "Llama-3-1-8b",
|
|
8
|
+
"modelId": "meta.llama3-1-8b-instruct-v1:0",
|
|
9
|
+
"bos_text": "<|begin_of_text|>",
|
|
10
|
+
"role_system_message_prefix": "",
|
|
11
|
+
"role_system_message_suffix": "",
|
|
12
|
+
"role_system_prefix": "<|start_header_id|>",
|
|
13
|
+
"role_system_suffix": "<|end_header_id|>",
|
|
14
|
+
"role_user_message_prefix": "",
|
|
15
|
+
"role_user_message_suffix": "",
|
|
16
|
+
"role_user_prefix": "<|start_header_id|>",
|
|
17
|
+
"role_user_suffix": "<|end_header_id|>",
|
|
18
|
+
"role_assistant_message_prefix": "",
|
|
19
|
+
"role_assistant_message_suffix": "",
|
|
20
|
+
"role_assistant_prefix": "<|start_header_id|>",
|
|
21
|
+
"role_assistant_suffix": "<|end_header_id|>",
|
|
22
|
+
"eom_text": "<|eot_id|>",
|
|
23
|
+
"display_role_names": true,
|
|
24
|
+
"max_tokens_param_name": "max_gen_len",
|
|
25
|
+
"max_supported_response_tokens": 2048,
|
|
26
|
+
"response_chunk_element": "generation",
|
|
27
|
+
},
|
|
28
|
+
{
|
|
29
|
+
// ===================
|
|
30
|
+
// == Llama 3.1 70b ==
|
|
31
|
+
// ===================
|
|
32
|
+
"modelName": "Llama-3-1-70b",
|
|
33
|
+
"modelId": "meta.llama3-1-70b-instruct-v1:0",
|
|
34
|
+
"bos_text": "<|begin_of_text|>",
|
|
35
|
+
"role_system_message_prefix": "",
|
|
36
|
+
"role_system_message_suffix": "",
|
|
37
|
+
"role_system_prefix": "<|start_header_id|>",
|
|
38
|
+
"role_system_suffix": "<|end_header_id|>",
|
|
39
|
+
"role_user_message_prefix": "",
|
|
40
|
+
"role_user_message_suffix": "",
|
|
41
|
+
"role_user_prefix": "<|start_header_id|>",
|
|
42
|
+
"role_user_suffix": "<|end_header_id|>",
|
|
43
|
+
"role_assistant_message_prefix": "",
|
|
44
|
+
"role_assistant_message_suffix": "",
|
|
45
|
+
"role_assistant_prefix": "<|start_header_id|>",
|
|
46
|
+
"role_assistant_suffix": "<|end_header_id|>",
|
|
47
|
+
"eom_text": "<|eot_id|>",
|
|
48
|
+
"display_role_names": true,
|
|
49
|
+
"max_tokens_param_name": "max_gen_len",
|
|
50
|
+
"max_supported_response_tokens": 2048,
|
|
51
|
+
"response_chunk_element": "generation",
|
|
52
|
+
},
|
|
3
53
|
{
|
|
4
54
|
// ================
|
|
5
55
|
// == Llama 3 8b ==
|
|
@@ -22,6 +72,7 @@ export const bedrock_models = [
|
|
|
22
72
|
"eom_text": "<|eot_id|>",
|
|
23
73
|
"display_role_names": true,
|
|
24
74
|
"max_tokens_param_name": "max_gen_len",
|
|
75
|
+
"max_supported_response_tokens": 2048,
|
|
25
76
|
"response_chunk_element": "generation",
|
|
26
77
|
},
|
|
27
78
|
{
|
|
@@ -46,6 +97,7 @@ export const bedrock_models = [
|
|
|
46
97
|
"eom_text": "<|eot_id|>",
|
|
47
98
|
"display_role_names": true,
|
|
48
99
|
"max_tokens_param_name": "max_gen_len",
|
|
100
|
+
"max_supported_response_tokens": 2048,
|
|
49
101
|
"response_chunk_element": "generation",
|
|
50
102
|
},
|
|
51
103
|
{
|
|
@@ -70,6 +122,7 @@ export const bedrock_models = [
|
|
|
70
122
|
"eom_text": "</s>",
|
|
71
123
|
"display_role_names": false,
|
|
72
124
|
"max_tokens_param_name": "max_tokens",
|
|
125
|
+
"max_supported_response_tokens": 8192,
|
|
73
126
|
"response_chunk_element": "outputs[0].text",
|
|
74
127
|
},
|
|
75
128
|
{
|
|
@@ -94,6 +147,7 @@ export const bedrock_models = [
|
|
|
94
147
|
"eom_text": "</s>",
|
|
95
148
|
"display_role_names": false,
|
|
96
149
|
"max_tokens_param_name": "max_tokens",
|
|
150
|
+
"max_supported_response_tokens": 4096,
|
|
97
151
|
"response_chunk_element": "outputs[0].text",
|
|
98
152
|
},
|
|
99
153
|
{
|
|
@@ -118,6 +172,7 @@ export const bedrock_models = [
|
|
|
118
172
|
"eom_text": "</s>",
|
|
119
173
|
"display_role_names": false,
|
|
120
174
|
"max_tokens_param_name": "max_tokens",
|
|
175
|
+
"max_supported_response_tokens": 8192,
|
|
121
176
|
"response_chunk_element": "outputs[0].text",
|
|
122
177
|
},
|
|
123
178
|
];
|
package/bedrock-wrapper.js
CHANGED
|
@@ -96,11 +96,13 @@ export async function* bedrockWrapper(awsCreds, openaiChatCompletionsCreateObjec
|
|
|
96
96
|
console.log(`\nPrompt: ${prompt}\n`);
|
|
97
97
|
}
|
|
98
98
|
|
|
99
|
+
const max_gen_tokens = max_tokens <= awsModel.max_supported_response_tokens ? max_tokens : awsModel.max_supported_response_tokens;
|
|
100
|
+
|
|
99
101
|
// Format the request payload using the model's native structure.
|
|
100
102
|
const request = {
|
|
101
103
|
prompt,
|
|
102
104
|
// Optional inference parameters:
|
|
103
|
-
[awsModel.max_tokens_param_name]:
|
|
105
|
+
[awsModel.max_tokens_param_name]: max_gen_tokens,
|
|
104
106
|
temperature: temperature,
|
|
105
107
|
top_p: top_p,
|
|
106
108
|
};
|
package/example.js
CHANGED
|
@@ -35,11 +35,11 @@ console.log(`\nsupported models:\n${JSON.stringify(await listBedrockWrapperSuppo
|
|
|
35
35
|
const messages = [
|
|
36
36
|
{
|
|
37
37
|
role: "system",
|
|
38
|
-
content: "You are a helpful AI assistant that follows instructions extremely well. Answer the user questions accurately. Think step by step before answering the question.",
|
|
38
|
+
content: "You are a helpful AI assistant that follows instructions extremely well. Answer the user questions accurately. Think step by step before answering the question.",
|
|
39
39
|
},
|
|
40
40
|
{
|
|
41
41
|
role: "user",
|
|
42
|
-
content: "Describe
|
|
42
|
+
content: "Describe what the openai api standard used by lots of serverless LLM api providers is and why it has been widely adopted.",
|
|
43
43
|
},
|
|
44
44
|
{
|
|
45
45
|
role: "assistant",
|
|
@@ -61,7 +61,7 @@ const awsCreds = {
|
|
|
61
61
|
// ----------------------------------------------------------------------
|
|
62
62
|
const openaiChatCompletionsCreateObject = {
|
|
63
63
|
"messages": messages,
|
|
64
|
-
"model": "Llama-3-8b",
|
|
64
|
+
"model": "Llama-3-1-8b",
|
|
65
65
|
"max_tokens": LLM_MAX_GEN_TOKENS,
|
|
66
66
|
"stream": true,
|
|
67
67
|
"temperature": LLM_TEMPERATURE,
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "bedrock-wrapper",
|
|
3
|
-
"version": "1.0.14",
|
|
3
|
+
"version": "1.1.0",
|
|
4
4
|
"description": "🪨 Bedrock Wrapper is an npm package that simplifies the integration of existing OpenAI-compatible API objects with AWS Bedrock's serverless inference LLMs.",
|
|
5
5
|
"repository": {
|
|
6
6
|
"type": "git",
|
|
@@ -21,7 +21,7 @@
|
|
|
21
21
|
"author": "",
|
|
22
22
|
"license": "ISC",
|
|
23
23
|
"dependencies": {
|
|
24
|
-
"@aws-sdk/client-bedrock-runtime": "^3.
|
|
24
|
+
"@aws-sdk/client-bedrock-runtime": "^3.616.0",
|
|
25
25
|
"dotenv": "^16.4.5"
|
|
26
26
|
}
|
|
27
27
|
}
|