@node-llm/core 1.6.2 → 1.8.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +9 -8
- package/dist/aliases.d.ts +215 -0
- package/dist/aliases.d.ts.map +1 -1
- package/dist/aliases.js +241 -26
- package/dist/chat/Chat.d.ts +12 -3
- package/dist/chat/Chat.d.ts.map +1 -1
- package/dist/chat/Chat.js +35 -5
- package/dist/chat/ChatOptions.d.ts +2 -1
- package/dist/chat/ChatOptions.d.ts.map +1 -1
- package/dist/chat/ChatResponse.d.ts +9 -2
- package/dist/chat/ChatResponse.d.ts.map +1 -1
- package/dist/chat/ChatResponse.js +12 -3
- package/dist/chat/ChatStream.d.ts.map +1 -1
- package/dist/chat/ChatStream.js +15 -1
- package/dist/chat/Content.d.ts +7 -0
- package/dist/chat/Content.d.ts.map +1 -1
- package/dist/config.d.ts +28 -0
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +50 -0
- package/dist/index.d.ts +1 -0
- package/dist/index.d.ts.map +1 -1
- package/dist/llm.d.ts.map +1 -1
- package/dist/llm.js +3 -2
- package/dist/models/models.d.ts +321 -76
- package/dist/models/models.d.ts.map +1 -1
- package/dist/models/models.js +7804 -2885
- package/dist/providers/Provider.d.ts +37 -0
- package/dist/providers/Provider.d.ts.map +1 -1
- package/dist/providers/anthropic/Capabilities.d.ts +1 -0
- package/dist/providers/anthropic/Capabilities.d.ts.map +1 -1
- package/dist/providers/anthropic/Capabilities.js +8 -5
- package/dist/providers/anthropic/Chat.d.ts.map +1 -1
- package/dist/providers/anthropic/Chat.js +23 -1
- package/dist/providers/anthropic/Streaming.d.ts.map +1 -1
- package/dist/providers/anthropic/Streaming.js +15 -0
- package/dist/providers/anthropic/types.d.ts +7 -1
- package/dist/providers/anthropic/types.d.ts.map +1 -1
- package/dist/providers/bedrock/BedrockProvider.d.ts +53 -0
- package/dist/providers/bedrock/BedrockProvider.d.ts.map +1 -0
- package/dist/providers/bedrock/BedrockProvider.js +107 -0
- package/dist/providers/bedrock/Capabilities.d.ts +50 -0
- package/dist/providers/bedrock/Capabilities.d.ts.map +1 -0
- package/dist/providers/bedrock/Capabilities.js +233 -0
- package/dist/providers/bedrock/Chat.d.ts +26 -0
- package/dist/providers/bedrock/Chat.d.ts.map +1 -0
- package/dist/providers/bedrock/Chat.js +170 -0
- package/dist/providers/bedrock/Embeddings.d.ts +22 -0
- package/dist/providers/bedrock/Embeddings.d.ts.map +1 -0
- package/dist/providers/bedrock/Embeddings.js +100 -0
- package/dist/providers/bedrock/Image.d.ts +33 -0
- package/dist/providers/bedrock/Image.d.ts.map +1 -0
- package/dist/providers/bedrock/Image.js +154 -0
- package/dist/providers/bedrock/Models.d.ts +34 -0
- package/dist/providers/bedrock/Models.d.ts.map +1 -0
- package/dist/providers/bedrock/Models.js +131 -0
- package/dist/providers/bedrock/Moderation.d.ts +23 -0
- package/dist/providers/bedrock/Moderation.d.ts.map +1 -0
- package/dist/providers/bedrock/Moderation.js +138 -0
- package/dist/providers/bedrock/Streaming.d.ts +21 -0
- package/dist/providers/bedrock/Streaming.d.ts.map +1 -0
- package/dist/providers/bedrock/Streaming.js +240 -0
- package/dist/providers/bedrock/config.d.ts +57 -0
- package/dist/providers/bedrock/config.d.ts.map +1 -0
- package/dist/providers/bedrock/config.js +33 -0
- package/dist/providers/bedrock/index.d.ts +8 -0
- package/dist/providers/bedrock/index.d.ts.map +1 -0
- package/dist/providers/bedrock/index.js +30 -0
- package/dist/providers/bedrock/mapper.d.ts +37 -0
- package/dist/providers/bedrock/mapper.d.ts.map +1 -0
- package/dist/providers/bedrock/mapper.js +204 -0
- package/dist/providers/bedrock/types.d.ts +179 -0
- package/dist/providers/bedrock/types.d.ts.map +1 -0
- package/dist/providers/bedrock/types.js +7 -0
- package/dist/providers/deepseek/Capabilities.d.ts +3 -2
- package/dist/providers/deepseek/Capabilities.d.ts.map +1 -1
- package/dist/providers/deepseek/Capabilities.js +19 -5
- package/dist/providers/deepseek/Chat.d.ts.map +1 -1
- package/dist/providers/deepseek/Chat.js +9 -2
- package/dist/providers/deepseek/Streaming.d.ts.map +1 -1
- package/dist/providers/deepseek/Streaming.js +3 -2
- package/dist/providers/gemini/Capabilities.d.ts +1 -0
- package/dist/providers/gemini/Capabilities.d.ts.map +1 -1
- package/dist/providers/gemini/Capabilities.js +9 -6
- package/dist/providers/gemini/Chat.d.ts.map +1 -1
- package/dist/providers/gemini/Chat.js +4 -5
- package/dist/providers/gemini/Streaming.d.ts.map +1 -1
- package/dist/providers/gemini/Streaming.js +17 -2
- package/dist/providers/gemini/types.d.ts +4 -0
- package/dist/providers/gemini/types.d.ts.map +1 -1
- package/dist/providers/ollama/Capabilities.d.ts.map +1 -1
- package/dist/providers/ollama/Capabilities.js +4 -1
- package/dist/providers/openai/Capabilities.d.ts +1 -0
- package/dist/providers/openai/Capabilities.d.ts.map +1 -1
- package/dist/providers/openai/Capabilities.js +14 -11
- package/dist/providers/openai/Chat.d.ts.map +1 -1
- package/dist/providers/openai/Chat.js +18 -3
- package/dist/providers/openai/Streaming.d.ts.map +1 -1
- package/dist/providers/openai/Streaming.js +11 -3
- package/dist/providers/registry.d.ts +2 -1
- package/dist/providers/registry.d.ts.map +1 -1
- package/dist/providers/registry.js +2 -1
- package/dist/utils/AwsSigV4.d.ts +51 -0
- package/dist/utils/AwsSigV4.d.ts.map +1 -0
- package/dist/utils/AwsSigV4.js +209 -0
- package/package.json +1 -1
|
@@ -0,0 +1,233 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Maps Bedrock model IDs to their capabilities.
|
|
3
|
+
*/
|
|
4
|
+
import { ModelRegistry } from "../../models/ModelRegistry.js";
|
|
5
|
+
import { PricingRegistry } from "../../models/PricingRegistry.js";
|
|
6
|
+
const MODEL_FAMILIES = [
|
|
7
|
+
[/anthropic\.claude-3-opus/, "claude3_opus"],
|
|
8
|
+
[/anthropic\.claude-3-sonnet/, "claude3_sonnet"],
|
|
9
|
+
[/anthropic\.claude-3-5-sonnet/, "claude3_sonnet"],
|
|
10
|
+
[/anthropic\.claude-3-7-sonnet/, "claude3_sonnet"],
|
|
11
|
+
[/anthropic\.claude-3-haiku/, "claude3_haiku"],
|
|
12
|
+
[/anthropic\.claude-3-5-haiku/, "claude3_5_haiku"],
|
|
13
|
+
[/anthropic\.claude-v2/, "claude2"],
|
|
14
|
+
[/anthropic\.claude-2/, "claude2"],
|
|
15
|
+
[/anthropic\.claude-instant/, "claude_instant"],
|
|
16
|
+
[/anthropic\.claude-(opus|sonnet|haiku)-4/, "claude4"],
|
|
17
|
+
[/amazon\.nova-2/, "nova2"],
|
|
18
|
+
[/amazon\.nova/, "nova"]
|
|
19
|
+
];
|
|
20
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
21
|
+
// Pricing (per million tokens)
|
|
22
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
23
|
+
/**
 * Built-in fallback prices keyed by model family, expressed per million tokens.
 * Every family name produced by MODEL_FAMILIES, plus the "other" catch-all,
 * needs an entry here because callers index this table without a guard.
 */
const PRICES = {
    // Anthropic
    claude3_opus: { input: 15.0, output: 75.0 },
    claude3_sonnet: { input: 3.0, output: 15.0 },
    claude3_haiku: { input: 0.25, output: 1.25 },
    claude3_5_haiku: { input: 0.8, output: 4.0 },
    claude2: { input: 8.0, output: 24.0 },
    claude_instant: { input: 0.8, output: 2.4 },
    // Approximation: the whole Claude 4 family is priced at the Sonnet 4 rate.
    claude4: { input: 3.0, output: 15.0 },

    // Amazon
    nova: { input: 0.06, output: 0.24 },
    // Approximation: Nova 2 is assumed to be cheaper than Nova.
    nova2: { input: 0.03, output: 0.12 },

    // Catch-all for IDs that match no known family
    other: { input: 0.1, output: 0.2 }
};
|
|
35
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
36
|
+
// Capabilities Class
|
|
37
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
38
|
+
export class Capabilities {
|
|
39
|
+
static getModelFamily(modelId) {
|
|
40
|
+
for (const [pattern, family] of MODEL_FAMILIES) {
|
|
41
|
+
if (pattern.test(modelId))
|
|
42
|
+
return family;
|
|
43
|
+
}
|
|
44
|
+
return "other";
|
|
45
|
+
}
|
|
46
|
+
static getContextWindow(modelId) {
|
|
47
|
+
const val = ModelRegistry.getContextWindow(modelId, "bedrock");
|
|
48
|
+
if (val)
|
|
49
|
+
return val;
|
|
50
|
+
// Claude 2 has 100k, others have 200k
|
|
51
|
+
if (/anthropic\.claude-2/.test(modelId))
|
|
52
|
+
return 100_000;
|
|
53
|
+
if (/anthropic\.claude/.test(modelId))
|
|
54
|
+
return 200_000;
|
|
55
|
+
// DeepSeek
|
|
56
|
+
if (/deepseek/.test(modelId))
|
|
57
|
+
return 128_000;
|
|
58
|
+
// Mistral
|
|
59
|
+
if (/mistral-large/.test(modelId))
|
|
60
|
+
return 128_000;
|
|
61
|
+
if (/mistral/.test(modelId))
|
|
62
|
+
return 32_000;
|
|
63
|
+
// Llama
|
|
64
|
+
if (/llama/.test(modelId))
|
|
65
|
+
return 128_000;
|
|
66
|
+
// Titan
|
|
67
|
+
if (/titan/.test(modelId))
|
|
68
|
+
return 32_000;
|
|
69
|
+
// Nova
|
|
70
|
+
if (/nova/.test(modelId))
|
|
71
|
+
return 300_000;
|
|
72
|
+
return null;
|
|
73
|
+
}
|
|
74
|
+
static getMaxOutputTokens(modelId) {
|
|
75
|
+
const val = ModelRegistry.getMaxOutputTokens(modelId, "bedrock");
|
|
76
|
+
if (val)
|
|
77
|
+
return val;
|
|
78
|
+
return 4_096;
|
|
79
|
+
}
|
|
80
|
+
static supportsChat(modelId) {
|
|
81
|
+
const model = this.findModel(modelId);
|
|
82
|
+
if (model?.capabilities?.includes("chat"))
|
|
83
|
+
return true;
|
|
84
|
+
return (/anthropic\.claude/.test(modelId) ||
|
|
85
|
+
/amazon\.nova/.test(modelId) ||
|
|
86
|
+
/mistral\.mistral/.test(modelId) ||
|
|
87
|
+
/meta\.llama/.test(modelId) ||
|
|
88
|
+
/deepseek/.test(modelId));
|
|
89
|
+
}
|
|
90
|
+
static supportsStreaming(modelId) {
|
|
91
|
+
const model = this.findModel(modelId);
|
|
92
|
+
if (model?.capabilities?.includes("streaming"))
|
|
93
|
+
return true;
|
|
94
|
+
return (/anthropic\.claude/.test(modelId) ||
|
|
95
|
+
/amazon\.nova/.test(modelId) ||
|
|
96
|
+
/mistral\.mistral/.test(modelId) ||
|
|
97
|
+
/meta\.llama/.test(modelId) ||
|
|
98
|
+
/deepseek/.test(modelId));
|
|
99
|
+
}
|
|
100
|
+
static supportsVision(modelId) {
|
|
101
|
+
const model = this.findModel(modelId);
|
|
102
|
+
if (model?.modalities?.input?.includes("image"))
|
|
103
|
+
return true;
|
|
104
|
+
if (model?.capabilities?.includes("vision"))
|
|
105
|
+
return true;
|
|
106
|
+
return /anthropic\.claude-3|anthropic\.claude-4|amazon\.nova/.test(modelId);
|
|
107
|
+
}
|
|
108
|
+
static supportsTools(modelId) {
|
|
109
|
+
const model = this.findModel(modelId);
|
|
110
|
+
if (model?.capabilities?.includes("tools") || model?.capabilities?.includes("function_calling"))
|
|
111
|
+
return true;
|
|
112
|
+
return /anthropic\.claude|amazon\.nova|deepseek-chat/.test(modelId);
|
|
113
|
+
}
|
|
114
|
+
static supportsJsonMode(modelId) {
|
|
115
|
+
const model = this.findModel(modelId);
|
|
116
|
+
if (model?.capabilities?.includes("json_mode") ||
|
|
117
|
+
model?.capabilities?.includes("structured_output"))
|
|
118
|
+
return true;
|
|
119
|
+
return /anthropic\.claude|amazon\.nova/.test(modelId);
|
|
120
|
+
}
|
|
121
|
+
static supportsExtendedThinking(modelId) {
|
|
122
|
+
const model = this.findModel(modelId);
|
|
123
|
+
if (model?.capabilities?.includes("reasoning"))
|
|
124
|
+
return true;
|
|
125
|
+
return /claude-3-7|deepseek-reasoner|deepseek\.r1/.test(modelId);
|
|
126
|
+
}
|
|
127
|
+
static supportsEmbeddings(modelId) {
|
|
128
|
+
const model = this.findModel(modelId);
|
|
129
|
+
if (model?.capabilities?.includes("embeddings"))
|
|
130
|
+
return true;
|
|
131
|
+
return /amazon\.titan-embed/.test(modelId);
|
|
132
|
+
}
|
|
133
|
+
static supportsImageGeneration(modelId) {
|
|
134
|
+
const model = this.findModel(modelId);
|
|
135
|
+
if (model?.capabilities?.includes("image_generation"))
|
|
136
|
+
return true;
|
|
137
|
+
return /amazon\.titan-image-generator|stability\.stable-diffusion/.test(modelId);
|
|
138
|
+
}
|
|
139
|
+
/**
|
|
140
|
+
* Check if a model supports audio input.
|
|
141
|
+
*/
|
|
142
|
+
static supportsAudio(_modelId) {
|
|
143
|
+
return false;
|
|
144
|
+
}
|
|
145
|
+
/**
|
|
146
|
+
* Get input modalities for a model.
|
|
147
|
+
*/
|
|
148
|
+
static getInputModalities(modelId) {
|
|
149
|
+
const modalities = ["text"];
|
|
150
|
+
if ((/anthropic\.claude/.test(modelId) || /amazon\.nova/.test(modelId)) &&
|
|
151
|
+
this.supportsVision(modelId)) {
|
|
152
|
+
modalities.push("image");
|
|
153
|
+
modalities.push("pdf");
|
|
154
|
+
}
|
|
155
|
+
return modalities;
|
|
156
|
+
}
|
|
157
|
+
/**
|
|
158
|
+
* Get output modalities for a model.
|
|
159
|
+
*/
|
|
160
|
+
static getOutputModalities(_modelId) {
|
|
161
|
+
return ["text"];
|
|
162
|
+
}
|
|
163
|
+
/**
|
|
164
|
+
* Get all capabilities for a model.
|
|
165
|
+
*/
|
|
166
|
+
static getCapabilities(modelId) {
|
|
167
|
+
const capabilities = [];
|
|
168
|
+
if (/anthropic\.claude/.test(modelId)) {
|
|
169
|
+
capabilities.push("streaming");
|
|
170
|
+
}
|
|
171
|
+
if (this.supportsTools(modelId)) {
|
|
172
|
+
capabilities.push("function_calling");
|
|
173
|
+
}
|
|
174
|
+
if (/claude-3-7|nova/.test(modelId)) {
|
|
175
|
+
capabilities.push("reasoning");
|
|
176
|
+
}
|
|
177
|
+
if (/claude-3\.5|claude-3-7|nova/.test(modelId)) {
|
|
178
|
+
capabilities.push("batch");
|
|
179
|
+
capabilities.push("citations");
|
|
180
|
+
}
|
|
181
|
+
return capabilities;
|
|
182
|
+
}
|
|
183
|
+
static getPricing(modelId) {
|
|
184
|
+
// Try registry first
|
|
185
|
+
const registryPricing = PricingRegistry.getPricing(modelId, "bedrock");
|
|
186
|
+
if (registryPricing)
|
|
187
|
+
return registryPricing;
|
|
188
|
+
// Fallback to built-in pricing
|
|
189
|
+
const family = this.getModelFamily(modelId);
|
|
190
|
+
const prices = PRICES[family];
|
|
191
|
+
return {
|
|
192
|
+
text_tokens: {
|
|
193
|
+
standard: {
|
|
194
|
+
input_per_million: prices.input,
|
|
195
|
+
output_per_million: prices.output
|
|
196
|
+
},
|
|
197
|
+
batch: {
|
|
198
|
+
input_per_million: prices.input * 0.5,
|
|
199
|
+
output_per_million: prices.output * 0.5
|
|
200
|
+
}
|
|
201
|
+
}
|
|
202
|
+
};
|
|
203
|
+
}
|
|
204
|
+
/**
|
|
205
|
+
* Get input price per million tokens.
|
|
206
|
+
*/
|
|
207
|
+
static getInputPrice(modelId) {
|
|
208
|
+
const family = this.getModelFamily(modelId);
|
|
209
|
+
return PRICES[family].input;
|
|
210
|
+
}
|
|
211
|
+
/**
|
|
212
|
+
* Get output price per million tokens.
|
|
213
|
+
*/
|
|
214
|
+
static getOutputPrice(modelId) {
|
|
215
|
+
const family = this.getModelFamily(modelId);
|
|
216
|
+
return PRICES[family].output;
|
|
217
|
+
}
|
|
218
|
+
/**
|
|
219
|
+
* Format model ID as display name.
|
|
220
|
+
*/
|
|
221
|
+
static formatDisplayName(modelId) {
|
|
222
|
+
return modelId
|
|
223
|
+
.replace(/-/g, " ")
|
|
224
|
+
.split(".")
|
|
225
|
+
.pop()
|
|
226
|
+
.split(" ")
|
|
227
|
+
.map((word) => word.charAt(0).toUpperCase() + word.slice(1))
|
|
228
|
+
.join(" ");
|
|
229
|
+
}
|
|
230
|
+
static findModel(modelId) {
|
|
231
|
+
return ModelRegistry.find(modelId, "bedrock");
|
|
232
|
+
}
|
|
233
|
+
}
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Bedrock Chat Handler
|
|
3
|
+
*
|
|
4
|
+
* Executes chat requests against the Bedrock Converse API.
|
|
5
|
+
*/
|
|
6
|
+
import { ChatRequest, ChatResponse } from "../Provider.js";
|
|
7
|
+
import { BedrockConfig } from "./config.js";
|
|
8
|
+
/**
 * Type surface of the Bedrock chat handler. Only the constructor and
 * `execute` are public; everything else is an implementation detail.
 */
export declare class BedrockChat {
    private readonly config;
    private readonly authMode;
    private readonly baseUrl;
    /**
     * @param config Bedrock provider configuration.
     */
    constructor(config: BedrockConfig);
    /**
     * Send one chat request to the Bedrock Converse API.
     *
     * @param request Provider-neutral chat request.
     * @returns The provider-neutral chat response.
     */
    execute(request: ChatRequest): Promise<ChatResponse>;
    /** Produces the request headers for the configured auth mode. */
    private buildHeaders;
    /** Converts a Bedrock response into the NodeLLM response format. */
    private parseResponse;
}
|
|
26
|
+
//# sourceMappingURL=Chat.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Chat.d.ts","sourceRoot":"","sources":["../../../src/providers/bedrock/Chat.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,WAAW,EAAE,YAAY,EAAS,MAAM,gBAAgB,CAAC;AAElE,OAAO,EAAE,aAAa,EAA6C,MAAM,aAAa,CAAC;AAYvF,qBAAa,WAAW;IACtB,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAgB;IACvC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAqB;IAC9C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;gBAErB,MAAM,EAAE,aAAa;IAMjC;;OAEG;IACG,OAAO,CAAC,OAAO,EAAE,WAAW,GAAG,OAAO,CAAC,YAAY,CAAC;IA6E1D;;OAEG;IACH,OAAO,CAAC,YAAY;IA6CpB;;OAEG;IACH,OAAO,CAAC,aAAa;CAiDtB"}
|
|
@@ -0,0 +1,170 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Bedrock Chat Handler
|
|
3
|
+
*
|
|
4
|
+
* Executes chat requests against the Bedrock Converse API.
|
|
5
|
+
*/
|
|
6
|
+
import { validateBedrockConfig, getBedrockEndpoint } from "./config.js";
|
|
7
|
+
import { buildConverseRequest } from "./mapper.js";
|
|
8
|
+
import { signRequest } from "../../utils/AwsSigV4.js";
|
|
9
|
+
import { ModelRegistry } from "../../models/ModelRegistry.js";
|
|
10
|
+
import { fetchWithTimeout } from "../../utils/fetch.js";
|
|
11
|
+
import { logger } from "../../utils/logger.js";
|
|
12
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
13
|
+
// Chat Handler
|
|
14
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
15
|
+
export class BedrockChat {
|
|
16
|
+
config;
|
|
17
|
+
authMode;
|
|
18
|
+
baseUrl;
|
|
19
|
+
constructor(config) {
|
|
20
|
+
this.config = config;
|
|
21
|
+
this.authMode = validateBedrockConfig(config);
|
|
22
|
+
this.baseUrl = getBedrockEndpoint(config.region);
|
|
23
|
+
}
|
|
24
|
+
/**
|
|
25
|
+
* Execute a chat request against Bedrock Converse API.
|
|
26
|
+
*/
|
|
27
|
+
async execute(request) {
|
|
28
|
+
const modelId = request.model;
|
|
29
|
+
const url = `${this.baseUrl}/model/${modelId}/converse`;
|
|
30
|
+
// Build the Bedrock request body
|
|
31
|
+
const guardrail = this.config.guardrailIdentifier && this.config.guardrailVersion
|
|
32
|
+
? {
|
|
33
|
+
guardrailIdentifier: this.config.guardrailIdentifier,
|
|
34
|
+
guardrailVersion: this.config.guardrailVersion
|
|
35
|
+
}
|
|
36
|
+
: undefined;
|
|
37
|
+
const body = buildConverseRequest(request.messages, request.tools, {
|
|
38
|
+
maxTokens: request.max_tokens,
|
|
39
|
+
temperature: request.temperature,
|
|
40
|
+
thinking: request.thinking,
|
|
41
|
+
guardrail,
|
|
42
|
+
additionalModelRequestFields: request.additionalModelRequestFields
|
|
43
|
+
});
|
|
44
|
+
const bodyJson = JSON.stringify(body);
|
|
45
|
+
// Build headers based on auth mode
|
|
46
|
+
const headers = this.buildHeaders(url, bodyJson, request.headers);
|
|
47
|
+
logger.logRequest("Bedrock", "POST", url, body);
|
|
48
|
+
// Make the request
|
|
49
|
+
const response = await fetchWithTimeout(url, {
|
|
50
|
+
method: "POST",
|
|
51
|
+
headers,
|
|
52
|
+
body: bodyJson
|
|
53
|
+
}, request.requestTimeout ?? this.config.requestTimeout);
|
|
54
|
+
if (!response.ok) {
|
|
55
|
+
const errorText = await response.text();
|
|
56
|
+
logger.logResponse("Bedrock", response.status, response.statusText, errorText);
|
|
57
|
+
let message = errorText;
|
|
58
|
+
// Improve clarity for known AWS errors
|
|
59
|
+
if (errorText.includes("INVALID_PAYMENT_INSTRUMENT")) {
|
|
60
|
+
message =
|
|
61
|
+
"Billing setup incomplete for AWS Marketplace models. Ensure a credit card is set as default payment method.";
|
|
62
|
+
}
|
|
63
|
+
else if (errorText.includes("AccessDeniedException") &&
|
|
64
|
+
errorText.includes("model access")) {
|
|
65
|
+
message =
|
|
66
|
+
"Access denied for this model. Ensure you have requested and been granted access in the AWS Bedrock console (Model Access section).";
|
|
67
|
+
}
|
|
68
|
+
else if (errorText.includes("ThrottlingException")) {
|
|
69
|
+
message = "Bedrock API throttling. Too many requests. Please retry with backoff.";
|
|
70
|
+
}
|
|
71
|
+
else if (errorText.includes("ValidationException")) {
|
|
72
|
+
message = `Bedrock validation error: ${errorText}`;
|
|
73
|
+
}
|
|
74
|
+
throw new Error(`Bedrock API error (${response.status}): ${message}`);
|
|
75
|
+
}
|
|
76
|
+
const json = (await response.json());
|
|
77
|
+
logger.logResponse("Bedrock", response.status, response.statusText, json);
|
|
78
|
+
const result = this.parseResponse(json);
|
|
79
|
+
if (result.usage) {
|
|
80
|
+
result.usage = ModelRegistry.calculateCost(result.usage, modelId, "bedrock");
|
|
81
|
+
}
|
|
82
|
+
return result;
|
|
83
|
+
}
|
|
84
|
+
/**
|
|
85
|
+
* Build request headers based on auth mode.
|
|
86
|
+
*/
|
|
87
|
+
buildHeaders(url, body, additionalHeaders) {
|
|
88
|
+
const headers = {
|
|
89
|
+
"Content-Type": "application/json",
|
|
90
|
+
Accept: "application/json",
|
|
91
|
+
...additionalHeaders
|
|
92
|
+
};
|
|
93
|
+
if (this.authMode === "apiKey") {
|
|
94
|
+
// Simple Bearer token auth
|
|
95
|
+
headers["Authorization"] = `Bearer ${this.config.apiKey}`;
|
|
96
|
+
}
|
|
97
|
+
else {
|
|
98
|
+
// SigV4 signing
|
|
99
|
+
const credentials = {
|
|
100
|
+
accessKeyId: this.config.accessKeyId,
|
|
101
|
+
secretAccessKey: this.config.secretAccessKey,
|
|
102
|
+
sessionToken: this.config.sessionToken
|
|
103
|
+
};
|
|
104
|
+
const signedHeaders = signRequest({
|
|
105
|
+
method: "POST",
|
|
106
|
+
url,
|
|
107
|
+
body,
|
|
108
|
+
credentials,
|
|
109
|
+
region: this.config.region,
|
|
110
|
+
service: "bedrock"
|
|
111
|
+
});
|
|
112
|
+
// Merge signed headers
|
|
113
|
+
headers["host"] = signedHeaders.host;
|
|
114
|
+
headers["x-amz-date"] = signedHeaders["x-amz-date"];
|
|
115
|
+
headers["x-amz-content-sha256"] = signedHeaders["x-amz-content-sha256"];
|
|
116
|
+
headers["Authorization"] = signedHeaders.authorization;
|
|
117
|
+
if (signedHeaders["x-amz-security-token"]) {
|
|
118
|
+
headers["x-amz-security-token"] = signedHeaders["x-amz-security-token"];
|
|
119
|
+
}
|
|
120
|
+
}
|
|
121
|
+
return headers;
|
|
122
|
+
}
|
|
123
|
+
/**
|
|
124
|
+
* Parse Bedrock response to NodeLLM format.
|
|
125
|
+
*/
|
|
126
|
+
parseResponse(response) {
|
|
127
|
+
const message = response.output.message;
|
|
128
|
+
let content = null;
|
|
129
|
+
let thinkingText = null;
|
|
130
|
+
const toolCalls = [];
|
|
131
|
+
// Process content blocks
|
|
132
|
+
for (const block of message.content) {
|
|
133
|
+
if (block.text) {
|
|
134
|
+
content = content ? content + block.text : block.text;
|
|
135
|
+
}
|
|
136
|
+
if (block.reasoningContent?.text) {
|
|
137
|
+
thinkingText = thinkingText
|
|
138
|
+
? thinkingText + block.reasoningContent.text
|
|
139
|
+
: block.reasoningContent.text;
|
|
140
|
+
}
|
|
141
|
+
if (block.toolUse) {
|
|
142
|
+
toolCalls.push({
|
|
143
|
+
id: block.toolUse.toolUseId,
|
|
144
|
+
type: "function",
|
|
145
|
+
function: {
|
|
146
|
+
name: block.toolUse.name,
|
|
147
|
+
arguments: JSON.stringify(block.toolUse.input)
|
|
148
|
+
}
|
|
149
|
+
});
|
|
150
|
+
}
|
|
151
|
+
}
|
|
152
|
+
// Build usage info
|
|
153
|
+
const usage = {
|
|
154
|
+
input_tokens: response.usage.inputTokens,
|
|
155
|
+
output_tokens: response.usage.outputTokens,
|
|
156
|
+
total_tokens: response.usage.totalTokens,
|
|
157
|
+
cached_tokens: response.usage.cacheReadInputTokens,
|
|
158
|
+
cache_creation_tokens: response.usage.cacheWriteInputTokens
|
|
159
|
+
};
|
|
160
|
+
return {
|
|
161
|
+
content,
|
|
162
|
+
thinking: thinkingText ? { text: thinkingText } : undefined,
|
|
163
|
+
reasoning: thinkingText || undefined, // Keep deprecated field for compat
|
|
164
|
+
tool_calls: toolCalls.length > 0 ? toolCalls : undefined,
|
|
165
|
+
usage,
|
|
166
|
+
finish_reason: response.stopReason,
|
|
167
|
+
metadata: response.trace ? { trace: response.trace } : undefined
|
|
168
|
+
};
|
|
169
|
+
}
|
|
170
|
+
}
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Bedrock Embeddings Handler
|
|
3
|
+
*
|
|
4
|
+
* Executes embedding requests against the Bedrock InvokeModel API.
|
|
5
|
+
*/
|
|
6
|
+
import { EmbeddingRequest, EmbeddingResponse } from "../Provider.js";
|
|
7
|
+
import { BedrockConfig } from "./config.js";
|
|
8
|
+
/**
 * Type surface of the Bedrock embeddings handler. Only the constructor and
 * `execute` are public.
 */
export declare class BedrockEmbeddings {
    private readonly config;
    private readonly authMode;
    private readonly baseUrl;
    /**
     * @param config Bedrock provider configuration.
     */
    constructor(config: BedrockConfig);
    /**
     * Send an embedding request to the Bedrock InvokeModel API.
     *
     * @param request Provider-neutral embedding request.
     * @returns The provider-neutral embedding response.
     */
    execute(request: EmbeddingRequest): Promise<EmbeddingResponse>;
    /** Produces the request headers for the configured auth mode. */
    private buildHeaders;
}
|
|
22
|
+
//# sourceMappingURL=Embeddings.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Embeddings.d.ts","sourceRoot":"","sources":["../../../src/providers/bedrock/Embeddings.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,gBAAgB,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACrE,OAAO,EAAE,aAAa,EAA6C,MAAM,aAAa,CAAC;AAwBvF,qBAAa,iBAAiB;IAC5B,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAgB;IACvC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAqB;IAC9C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;gBAErB,MAAM,EAAE,aAAa;IAMjC;;OAEG;IACG,OAAO,CAAC,OAAO,EAAE,gBAAgB,GAAG,OAAO,CAAC,iBAAiB,CAAC;IAqDpE;;OAEG;IACH,OAAO,CAAC,YAAY;CAoCrB"}
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Bedrock Embeddings Handler
|
|
3
|
+
*
|
|
4
|
+
* Executes embedding requests against the Bedrock InvokeModel API.
|
|
5
|
+
*/
|
|
6
|
+
import { validateBedrockConfig, getBedrockEndpoint } from "./config.js";
|
|
7
|
+
import { signRequest } from "../../utils/AwsSigV4.js";
|
|
8
|
+
import { fetchWithTimeout } from "../../utils/fetch.js";
|
|
9
|
+
import { logger } from "../../utils/logger.js";
|
|
10
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
11
|
+
// Embeddings Handler
|
|
12
|
+
// ─────────────────────────────────────────────────────────────────────────────
|
|
13
|
+
export class BedrockEmbeddings {
|
|
14
|
+
config;
|
|
15
|
+
authMode;
|
|
16
|
+
baseUrl;
|
|
17
|
+
constructor(config) {
|
|
18
|
+
this.config = config;
|
|
19
|
+
this.authMode = validateBedrockConfig(config);
|
|
20
|
+
this.baseUrl = getBedrockEndpoint(config.region);
|
|
21
|
+
}
|
|
22
|
+
/**
|
|
23
|
+
* Execute an embedding request against Bedrock InvokeModel API.
|
|
24
|
+
*/
|
|
25
|
+
async execute(request) {
|
|
26
|
+
const modelId = request.model ?? "amazon.titan-embed-text-v2:0";
|
|
27
|
+
const url = `${this.baseUrl}/model/${modelId}/invoke`;
|
|
28
|
+
// Handle single vs multiple inputs (Titan only supports one at a time via InvokeModel)
|
|
29
|
+
const inputs = Array.isArray(request.input) ? request.input : [request.input];
|
|
30
|
+
const results = [];
|
|
31
|
+
let totalTokens = 0;
|
|
32
|
+
// Bedrock InvokeModel API for Titan embeddings processes one text at a time.
|
|
33
|
+
// We iterate through inputs and collect embeddings.
|
|
34
|
+
for (const text of inputs) {
|
|
35
|
+
const body = {
|
|
36
|
+
inputText: text,
|
|
37
|
+
// Titan V2 supports 256, 512, 1024 dimensions. NodeLLM doesn't have a standardized field for this yet,
|
|
38
|
+
// so we use the model's default (typically 1024 for V2) unless passed in headers/custom.
|
|
39
|
+
normalize: true
|
|
40
|
+
};
|
|
41
|
+
const bodyJson = JSON.stringify(body);
|
|
42
|
+
const headers = this.buildHeaders(url, bodyJson);
|
|
43
|
+
logger.logRequest("BedrockEmbeddings", "POST", url, body);
|
|
44
|
+
const response = await fetchWithTimeout(url, {
|
|
45
|
+
method: "POST",
|
|
46
|
+
headers,
|
|
47
|
+
body: bodyJson
|
|
48
|
+
}, request.requestTimeout ?? this.config.requestTimeout);
|
|
49
|
+
if (!response.ok) {
|
|
50
|
+
const errorText = await response.text();
|
|
51
|
+
logger.logResponse("BedrockEmbeddings", response.status, response.statusText, errorText);
|
|
52
|
+
throw new Error(`Bedrock Embeddings error (${response.status}): ${errorText}`);
|
|
53
|
+
}
|
|
54
|
+
const json = (await response.json());
|
|
55
|
+
results.push(json.embedding);
|
|
56
|
+
totalTokens += json.inputTextTokenCount;
|
|
57
|
+
}
|
|
58
|
+
return {
|
|
59
|
+
vectors: results,
|
|
60
|
+
model: modelId,
|
|
61
|
+
input_tokens: totalTokens,
|
|
62
|
+
dimensions: results[0]?.length || 0
|
|
63
|
+
};
|
|
64
|
+
}
|
|
65
|
+
/**
|
|
66
|
+
* Build request headers based on auth mode.
|
|
67
|
+
*/
|
|
68
|
+
buildHeaders(url, body) {
|
|
69
|
+
const headers = {
|
|
70
|
+
"Content-Type": "application/json",
|
|
71
|
+
Accept: "application/json"
|
|
72
|
+
};
|
|
73
|
+
if (this.authMode === "apiKey") {
|
|
74
|
+
headers["Authorization"] = `Bearer ${this.config.apiKey}`;
|
|
75
|
+
}
|
|
76
|
+
else {
|
|
77
|
+
const credentials = {
|
|
78
|
+
accessKeyId: this.config.accessKeyId,
|
|
79
|
+
secretAccessKey: this.config.secretAccessKey,
|
|
80
|
+
sessionToken: this.config.sessionToken
|
|
81
|
+
};
|
|
82
|
+
const signedHeaders = signRequest({
|
|
83
|
+
method: "POST",
|
|
84
|
+
url,
|
|
85
|
+
body: body,
|
|
86
|
+
credentials,
|
|
87
|
+
region: this.config.region,
|
|
88
|
+
service: "bedrock"
|
|
89
|
+
});
|
|
90
|
+
headers["host"] = signedHeaders.host;
|
|
91
|
+
headers["x-amz-date"] = signedHeaders["x-amz-date"];
|
|
92
|
+
headers["x-amz-content-sha256"] = signedHeaders["x-amz-content-sha256"];
|
|
93
|
+
headers["Authorization"] = signedHeaders.authorization;
|
|
94
|
+
if (signedHeaders["x-amz-security-token"]) {
|
|
95
|
+
headers["x-amz-security-token"] = signedHeaders["x-amz-security-token"];
|
|
96
|
+
}
|
|
97
|
+
}
|
|
98
|
+
return headers;
|
|
99
|
+
}
|
|
100
|
+
}
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Bedrock Image Generation Handler
|
|
3
|
+
*
|
|
4
|
+
* Supports Amazon Titan Image Generator and Stability.ai Stable Diffusion models.
|
|
5
|
+
*/
|
|
6
|
+
import { ImageRequest, ImageResponse } from "../Provider.js";
|
|
7
|
+
import { BedrockConfig } from "./config.js";
|
|
8
|
+
/**
 * Type surface of the Bedrock image generation handler. Only the constructor
 * and `execute` are public.
 */
export declare class BedrockImage {
    private readonly config;
    private readonly baseUrl;
    /**
     * @param config Bedrock provider configuration.
     */
    constructor(config: BedrockConfig);
    /**
     * Run an image generation request.
     *
     * @param request Provider-neutral image request.
     * @returns The provider-neutral image response.
     */
    execute(request: ImageRequest): Promise<ImageResponse>;
    /** Produces the request body expected by the targeted model. */
    private buildRequestBody;
    /** Interprets the model-specific response. */
    private parseResponse;
    /** Splits a size string such as "1024x1024" into height and width. */
    private parseSize;
    /** Produces SigV4-signed request headers. */
    private buildHeaders;
}
|
|
33
|
+
//# sourceMappingURL=Image.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"Image.d.ts","sourceRoot":"","sources":["../../../src/providers/bedrock/Image.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,YAAY,EAAE,aAAa,EAAE,MAAM,gBAAgB,CAAC;AAC7D,OAAO,EAAE,aAAa,EAAsB,MAAM,aAAa,CAAC;AAKhE,qBAAa,YAAY;IACvB,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAgB;IACvC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;gBAErB,MAAM,EAAE,aAAa;IAKjC;;OAEG;IACG,OAAO,CAAC,OAAO,EAAE,YAAY,GAAG,OAAO,CAAC,aAAa,CAAC;IA8B5D;;OAEG;IACH,OAAO,CAAC,gBAAgB;IAuCxB;;OAEG;IACH,OAAO,CAAC,aAAa;IAwBrB;;OAEG;IACH,OAAO,CAAC,SAAS;IAejB;;OAEG;IACH,OAAO,CAAC,YAAY;CAsCrB"}
|