@librechat/agents 3.0.0-rc9 → 3.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (195) hide show
  1. package/dist/cjs/agents/AgentContext.cjs +6 -2
  2. package/dist/cjs/agents/AgentContext.cjs.map +1 -1
  3. package/dist/cjs/graphs/Graph.cjs +23 -2
  4. package/dist/cjs/graphs/Graph.cjs.map +1 -1
  5. package/dist/cjs/graphs/MultiAgentGraph.cjs +5 -5
  6. package/dist/cjs/graphs/MultiAgentGraph.cjs.map +1 -1
  7. package/dist/cjs/instrumentation.cjs +21 -0
  8. package/dist/cjs/instrumentation.cjs.map +1 -0
  9. package/dist/cjs/llm/anthropic/index.cjs +21 -2
  10. package/dist/cjs/llm/anthropic/index.cjs.map +1 -1
  11. package/dist/cjs/llm/google/index.cjs +3 -0
  12. package/dist/cjs/llm/google/index.cjs.map +1 -1
  13. package/dist/cjs/llm/google/utils/common.cjs +13 -0
  14. package/dist/cjs/llm/google/utils/common.cjs.map +1 -1
  15. package/dist/cjs/llm/ollama/index.cjs +3 -0
  16. package/dist/cjs/llm/ollama/index.cjs.map +1 -1
  17. package/dist/cjs/llm/openai/index.cjs +18 -3
  18. package/dist/cjs/llm/openai/index.cjs.map +1 -1
  19. package/dist/cjs/llm/openai/utils/index.cjs +6 -1
  20. package/dist/cjs/llm/openai/utils/index.cjs.map +1 -1
  21. package/dist/cjs/llm/openrouter/index.cjs +5 -1
  22. package/dist/cjs/llm/openrouter/index.cjs.map +1 -1
  23. package/dist/cjs/llm/vertexai/index.cjs +1 -1
  24. package/dist/cjs/llm/vertexai/index.cjs.map +1 -1
  25. package/dist/cjs/main.cjs +8 -2
  26. package/dist/cjs/main.cjs.map +1 -1
  27. package/dist/cjs/messages/cache.cjs +49 -0
  28. package/dist/cjs/messages/cache.cjs.map +1 -0
  29. package/dist/cjs/messages/content.cjs +53 -0
  30. package/dist/cjs/messages/content.cjs.map +1 -0
  31. package/dist/cjs/messages/core.cjs +5 -1
  32. package/dist/cjs/messages/core.cjs.map +1 -1
  33. package/dist/cjs/messages/format.cjs +50 -59
  34. package/dist/cjs/messages/format.cjs.map +1 -1
  35. package/dist/cjs/messages/prune.cjs +28 -0
  36. package/dist/cjs/messages/prune.cjs.map +1 -1
  37. package/dist/cjs/run.cjs +57 -5
  38. package/dist/cjs/run.cjs.map +1 -1
  39. package/dist/cjs/stream.cjs +7 -0
  40. package/dist/cjs/stream.cjs.map +1 -1
  41. package/dist/cjs/tools/ToolNode.cjs +2 -0
  42. package/dist/cjs/tools/ToolNode.cjs.map +1 -1
  43. package/dist/cjs/tools/search/firecrawl.cjs +3 -1
  44. package/dist/cjs/tools/search/firecrawl.cjs.map +1 -1
  45. package/dist/cjs/tools/search/rerankers.cjs +8 -6
  46. package/dist/cjs/tools/search/rerankers.cjs.map +1 -1
  47. package/dist/cjs/tools/search/search.cjs +5 -5
  48. package/dist/cjs/tools/search/search.cjs.map +1 -1
  49. package/dist/cjs/tools/search/serper-scraper.cjs +132 -0
  50. package/dist/cjs/tools/search/serper-scraper.cjs.map +1 -0
  51. package/dist/cjs/tools/search/tool.cjs +46 -9
  52. package/dist/cjs/tools/search/tool.cjs.map +1 -1
  53. package/dist/cjs/utils/handlers.cjs +70 -0
  54. package/dist/cjs/utils/handlers.cjs.map +1 -0
  55. package/dist/cjs/utils/misc.cjs +8 -1
  56. package/dist/cjs/utils/misc.cjs.map +1 -1
  57. package/dist/cjs/utils/title.cjs +54 -25
  58. package/dist/cjs/utils/title.cjs.map +1 -1
  59. package/dist/esm/agents/AgentContext.mjs +6 -2
  60. package/dist/esm/agents/AgentContext.mjs.map +1 -1
  61. package/dist/esm/graphs/Graph.mjs +23 -2
  62. package/dist/esm/graphs/Graph.mjs.map +1 -1
  63. package/dist/esm/graphs/MultiAgentGraph.mjs +5 -5
  64. package/dist/esm/graphs/MultiAgentGraph.mjs.map +1 -1
  65. package/dist/esm/instrumentation.mjs +19 -0
  66. package/dist/esm/instrumentation.mjs.map +1 -0
  67. package/dist/esm/llm/anthropic/index.mjs +21 -2
  68. package/dist/esm/llm/anthropic/index.mjs.map +1 -1
  69. package/dist/esm/llm/google/index.mjs +3 -0
  70. package/dist/esm/llm/google/index.mjs.map +1 -1
  71. package/dist/esm/llm/google/utils/common.mjs +13 -0
  72. package/dist/esm/llm/google/utils/common.mjs.map +1 -1
  73. package/dist/esm/llm/ollama/index.mjs +3 -0
  74. package/dist/esm/llm/ollama/index.mjs.map +1 -1
  75. package/dist/esm/llm/openai/index.mjs +18 -3
  76. package/dist/esm/llm/openai/index.mjs.map +1 -1
  77. package/dist/esm/llm/openai/utils/index.mjs +6 -1
  78. package/dist/esm/llm/openai/utils/index.mjs.map +1 -1
  79. package/dist/esm/llm/openrouter/index.mjs +5 -1
  80. package/dist/esm/llm/openrouter/index.mjs.map +1 -1
  81. package/dist/esm/llm/vertexai/index.mjs +1 -1
  82. package/dist/esm/llm/vertexai/index.mjs.map +1 -1
  83. package/dist/esm/main.mjs +5 -2
  84. package/dist/esm/main.mjs.map +1 -1
  85. package/dist/esm/messages/cache.mjs +47 -0
  86. package/dist/esm/messages/cache.mjs.map +1 -0
  87. package/dist/esm/messages/content.mjs +51 -0
  88. package/dist/esm/messages/content.mjs.map +1 -0
  89. package/dist/esm/messages/core.mjs +5 -1
  90. package/dist/esm/messages/core.mjs.map +1 -1
  91. package/dist/esm/messages/format.mjs +50 -58
  92. package/dist/esm/messages/format.mjs.map +1 -1
  93. package/dist/esm/messages/prune.mjs +28 -0
  94. package/dist/esm/messages/prune.mjs.map +1 -1
  95. package/dist/esm/run.mjs +57 -5
  96. package/dist/esm/run.mjs.map +1 -1
  97. package/dist/esm/stream.mjs +7 -0
  98. package/dist/esm/stream.mjs.map +1 -1
  99. package/dist/esm/tools/ToolNode.mjs +2 -0
  100. package/dist/esm/tools/ToolNode.mjs.map +1 -1
  101. package/dist/esm/tools/search/firecrawl.mjs +3 -1
  102. package/dist/esm/tools/search/firecrawl.mjs.map +1 -1
  103. package/dist/esm/tools/search/rerankers.mjs +8 -6
  104. package/dist/esm/tools/search/rerankers.mjs.map +1 -1
  105. package/dist/esm/tools/search/search.mjs +5 -5
  106. package/dist/esm/tools/search/search.mjs.map +1 -1
  107. package/dist/esm/tools/search/serper-scraper.mjs +129 -0
  108. package/dist/esm/tools/search/serper-scraper.mjs.map +1 -0
  109. package/dist/esm/tools/search/tool.mjs +46 -9
  110. package/dist/esm/tools/search/tool.mjs.map +1 -1
  111. package/dist/esm/utils/handlers.mjs +68 -0
  112. package/dist/esm/utils/handlers.mjs.map +1 -0
  113. package/dist/esm/utils/misc.mjs +8 -2
  114. package/dist/esm/utils/misc.mjs.map +1 -1
  115. package/dist/esm/utils/title.mjs +54 -25
  116. package/dist/esm/utils/title.mjs.map +1 -1
  117. package/dist/types/agents/AgentContext.d.ts +4 -1
  118. package/dist/types/instrumentation.d.ts +1 -0
  119. package/dist/types/llm/anthropic/index.d.ts +3 -0
  120. package/dist/types/llm/google/index.d.ts +1 -0
  121. package/dist/types/llm/ollama/index.d.ts +1 -0
  122. package/dist/types/llm/openai/index.d.ts +4 -0
  123. package/dist/types/llm/openrouter/index.d.ts +4 -2
  124. package/dist/types/llm/vertexai/index.d.ts +1 -1
  125. package/dist/types/messages/cache.d.ts +8 -0
  126. package/dist/types/messages/content.d.ts +7 -0
  127. package/dist/types/messages/format.d.ts +22 -25
  128. package/dist/types/messages/index.d.ts +2 -0
  129. package/dist/types/run.d.ts +2 -1
  130. package/dist/types/tools/search/firecrawl.d.ts +2 -1
  131. package/dist/types/tools/search/rerankers.d.ts +4 -1
  132. package/dist/types/tools/search/search.d.ts +1 -2
  133. package/dist/types/tools/search/serper-scraper.d.ts +59 -0
  134. package/dist/types/tools/search/tool.d.ts +25 -4
  135. package/dist/types/tools/search/types.d.ts +31 -1
  136. package/dist/types/types/graph.d.ts +3 -1
  137. package/dist/types/types/messages.d.ts +4 -0
  138. package/dist/types/utils/handlers.d.ts +34 -0
  139. package/dist/types/utils/index.d.ts +1 -0
  140. package/dist/types/utils/misc.d.ts +1 -0
  141. package/package.json +6 -2
  142. package/src/agents/AgentContext.ts +8 -0
  143. package/src/graphs/Graph.ts +31 -2
  144. package/src/graphs/MultiAgentGraph.ts +5 -5
  145. package/src/instrumentation.ts +22 -0
  146. package/src/llm/anthropic/index.ts +23 -2
  147. package/src/llm/anthropic/llm.spec.ts +1 -1
  148. package/src/llm/google/index.ts +4 -0
  149. package/src/llm/google/utils/common.ts +14 -0
  150. package/src/llm/ollama/index.ts +3 -0
  151. package/src/llm/openai/index.ts +17 -4
  152. package/src/llm/openai/utils/index.ts +7 -1
  153. package/src/llm/openrouter/index.ts +15 -6
  154. package/src/llm/vertexai/index.ts +2 -2
  155. package/src/messages/cache.test.ts +262 -0
  156. package/src/messages/cache.ts +56 -0
  157. package/src/messages/content.test.ts +362 -0
  158. package/src/messages/content.ts +63 -0
  159. package/src/messages/core.ts +5 -2
  160. package/src/messages/format.ts +65 -71
  161. package/src/messages/formatMessage.test.ts +418 -2
  162. package/src/messages/index.ts +2 -0
  163. package/src/messages/prune.ts +51 -0
  164. package/src/run.ts +82 -10
  165. package/src/scripts/ant_web_search.ts +1 -1
  166. package/src/scripts/handoff-test.ts +1 -1
  167. package/src/scripts/multi-agent-chain.ts +4 -4
  168. package/src/scripts/multi-agent-conditional.ts +4 -4
  169. package/src/scripts/multi-agent-document-review-chain.ts +4 -4
  170. package/src/scripts/multi-agent-parallel.ts +10 -8
  171. package/src/scripts/multi-agent-sequence.ts +3 -3
  172. package/src/scripts/multi-agent-supervisor.ts +5 -3
  173. package/src/scripts/multi-agent-test.ts +2 -2
  174. package/src/scripts/search.ts +5 -1
  175. package/src/scripts/simple.ts +8 -0
  176. package/src/scripts/test-custom-prompt-key.ts +4 -4
  177. package/src/scripts/test-handoff-input.ts +3 -3
  178. package/src/scripts/test-multi-agent-list-handoff.ts +2 -2
  179. package/src/scripts/tools.ts +4 -1
  180. package/src/specs/agent-handoffs.test.ts +889 -0
  181. package/src/stream.ts +9 -2
  182. package/src/tools/search/firecrawl.ts +5 -2
  183. package/src/tools/search/jina-reranker.test.ts +126 -0
  184. package/src/tools/search/rerankers.ts +11 -5
  185. package/src/tools/search/search.ts +6 -8
  186. package/src/tools/search/serper-scraper.ts +155 -0
  187. package/src/tools/search/tool.ts +49 -8
  188. package/src/tools/search/types.ts +46 -0
  189. package/src/types/graph.ts +6 -1
  190. package/src/types/messages.ts +4 -0
  191. package/src/utils/handlers.ts +107 -0
  192. package/src/utils/index.ts +2 -1
  193. package/src/utils/llmConfig.ts +35 -1
  194. package/src/utils/misc.ts +33 -21
  195. package/src/utils/title.ts +80 -40
@@ -0,0 +1,362 @@
1
+ import {
2
+ HumanMessage,
3
+ AIMessage,
4
+ SystemMessage,
5
+ } from '@langchain/core/messages';
6
+ import { formatContentStrings } from './content';
7
+ import { ContentTypes } from '@/common';
8
+
9
+ describe('formatContentStrings', () => {
10
+ describe('Human messages', () => {
11
+ it('should convert human message with all text blocks to string', () => {
12
+ const messages = [
13
+ new HumanMessage({
14
+ content: [
15
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Hello' },
16
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'World' },
17
+ ],
18
+ }),
19
+ ];
20
+
21
+ const result = formatContentStrings(messages);
22
+
23
+ expect(result).toHaveLength(1);
24
+ expect(result[0].content).toBe('Hello\nWorld');
25
+ });
26
+
27
+ it('should not convert human message with mixed content types (text + image)', () => {
28
+ const messages = [
29
+ new HumanMessage({
30
+ content: [
31
+ { type: ContentTypes.TEXT, text: 'what do you see' },
32
+ {
33
+ type: 'image_url',
34
+ image_url: {
35
+ url: '_SOME_BASE64_DATA=',
36
+ detail: 'auto',
37
+ },
38
+ },
39
+ ],
40
+ }),
41
+ ];
42
+
43
+ const result = formatContentStrings(messages);
44
+
45
+ expect(result).toHaveLength(1);
46
+ expect(result[0].content).toEqual([
47
+ { type: ContentTypes.TEXT, text: 'what do you see' },
48
+ {
49
+ type: 'image_url',
50
+ image_url: {
51
+ url: '_SOME_BASE64_DATA=',
52
+ detail: 'auto',
53
+ },
54
+ },
55
+ ]);
56
+ });
57
+
58
+ it('should leave string content unchanged', () => {
59
+ const messages = [
60
+ new HumanMessage({
61
+ content: 'Hello World',
62
+ }),
63
+ ];
64
+
65
+ const result = formatContentStrings(messages);
66
+
67
+ expect(result).toHaveLength(1);
68
+ expect(result[0].content).toBe('Hello World');
69
+ });
70
+
71
+ it('should handle empty text blocks', () => {
72
+ const messages = [
73
+ new HumanMessage({
74
+ content: [
75
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Hello' },
76
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: '' },
77
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'World' },
78
+ ],
79
+ }),
80
+ ];
81
+
82
+ const result = formatContentStrings(messages);
83
+
84
+ expect(result).toHaveLength(1);
85
+ expect(result[0].content).toBe('Hello\n\nWorld');
86
+ });
87
+
88
+ it('should handle null/undefined text values', () => {
89
+ const messages = [
90
+ new HumanMessage({
91
+ content: [
92
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Hello' },
93
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: null },
94
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: undefined },
95
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'World' },
96
+ ],
97
+ }),
98
+ ];
99
+
100
+ const result = formatContentStrings(messages);
101
+
102
+ expect(result).toHaveLength(1);
103
+ expect(result[0].content).toBe('Hello\n\n\nWorld');
104
+ });
105
+ });
106
+
107
+ describe('AI messages', () => {
108
+ it('should convert AI message with all text blocks to string', () => {
109
+ const messages = [
110
+ new AIMessage({
111
+ content: [
112
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Hello' },
113
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'World' },
114
+ ],
115
+ }),
116
+ ];
117
+
118
+ const result = formatContentStrings(messages);
119
+
120
+ expect(result).toHaveLength(1);
121
+ expect(result[0].content).toBe('Hello\nWorld');
122
+ expect(result[0].getType()).toBe('ai');
123
+ });
124
+
125
+ it('should not convert AI message with mixed content types', () => {
126
+ const messages = [
127
+ new AIMessage({
128
+ content: [
129
+ {
130
+ type: ContentTypes.TEXT,
131
+ [ContentTypes.TEXT]: 'Here is an image',
132
+ },
133
+ {
134
+ type: ContentTypes.TOOL_CALL,
135
+ tool_call: { name: 'generate_image' },
136
+ },
137
+ ],
138
+ }),
139
+ ];
140
+
141
+ const result = formatContentStrings(messages);
142
+
143
+ expect(result).toHaveLength(1);
144
+ expect(result[0].content).toEqual([
145
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Here is an image' },
146
+ { type: ContentTypes.TOOL_CALL, tool_call: { name: 'generate_image' } },
147
+ ]);
148
+ });
149
+ });
150
+
151
+ describe('System messages', () => {
152
+ it('should convert System message with all text blocks to string', () => {
153
+ const messages = [
154
+ new SystemMessage({
155
+ content: [
156
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'System' },
157
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Message' },
158
+ ],
159
+ }),
160
+ ];
161
+
162
+ const result = formatContentStrings(messages);
163
+
164
+ expect(result).toHaveLength(1);
165
+ expect(result[0].content).toBe('System\nMessage');
166
+ expect(result[0].getType()).toBe('system');
167
+ });
168
+ });
169
+
170
+ describe('Mixed message types', () => {
171
+ it('should process all valid message types in mixed array', () => {
172
+ const messages = [
173
+ new HumanMessage({
174
+ content: [
175
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Human' },
176
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Message' },
177
+ ],
178
+ }),
179
+ new AIMessage({
180
+ content: [
181
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'AI' },
182
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Response' },
183
+ ],
184
+ }),
185
+ new SystemMessage({
186
+ content: [
187
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'System' },
188
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: 'Prompt' },
189
+ ],
190
+ }),
191
+ ];
192
+
193
+ const result = formatContentStrings(messages);
194
+
195
+ expect(result).toHaveLength(3);
196
+ // All messages should be converted
197
+ expect(result[0].content).toBe('Human\nMessage');
198
+ expect(result[0].getType()).toBe('human');
199
+
200
+ expect(result[1].content).toBe('AI\nResponse');
201
+ expect(result[1].getType()).toBe('ai');
202
+
203
+ expect(result[2].content).toBe('System\nPrompt');
204
+ expect(result[2].getType()).toBe('system');
205
+ });
206
+ });
207
+
208
+ describe('Edge cases', () => {
209
+ it('should handle empty array', () => {
210
+ const result = formatContentStrings([]);
211
+ expect(result).toEqual([]);
212
+ });
213
+
214
+ it('should handle messages with non-array content', () => {
215
+ const messages = [
216
+ new HumanMessage({
217
+ content: 'This is a string content',
218
+ }),
219
+ ];
220
+
221
+ const result = formatContentStrings(messages);
222
+
223
+ expect(result).toHaveLength(1);
224
+ expect(result[0].content).toBe('This is a string content');
225
+ });
226
+
227
+ it('should trim the final concatenated string', () => {
228
+ const messages = [
229
+ new HumanMessage({
230
+ content: [
231
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: ' Hello ' },
232
+ { type: ContentTypes.TEXT, [ContentTypes.TEXT]: ' World ' },
233
+ ],
234
+ }),
235
+ ];
236
+
237
+ const result = formatContentStrings(messages);
238
+
239
+ expect(result).toHaveLength(1);
240
+ expect(result[0].content).toBe('Hello \n World');
241
+ });
242
+ });
243
+
244
+ describe('Real-world scenarios', () => {
245
+ it('should handle the exact scenario from the issue', () => {
246
+ const messages = [
247
+ new HumanMessage({
248
+ content: [
249
+ {
250
+ type: 'text',
251
+ text: 'hi there',
252
+ },
253
+ ],
254
+ }),
255
+ new AIMessage({
256
+ content: [
257
+ {
258
+ type: 'text',
259
+ text: 'Hi Danny! How can I help you today?',
260
+ },
261
+ ],
262
+ }),
263
+ new HumanMessage({
264
+ content: [
265
+ {
266
+ type: 'text',
267
+ text: 'what do you see',
268
+ },
269
+ {
270
+ type: 'image_url',
271
+ image_url: {
272
+ url: '_SOME_BASE64_DATA=',
273
+ detail: 'auto',
274
+ },
275
+ },
276
+ ],
277
+ }),
278
+ ];
279
+
280
+ const result = formatContentStrings(messages);
281
+
282
+ expect(result).toHaveLength(3);
283
+
284
+ // First human message (all text) should be converted
285
+ expect(result[0].content).toBe('hi there');
286
+ expect(result[0].getType()).toBe('human');
287
+
288
+ // AI message (all text) should now also be converted
289
+ expect(result[1].content).toBe('Hi Danny! How can I help you today?');
290
+ expect(result[1].getType()).toBe('ai');
291
+
292
+ // Third message (mixed content) should remain unchanged
293
+ expect(result[2].content).toEqual([
294
+ {
295
+ type: 'text',
296
+ text: 'what do you see',
297
+ },
298
+ {
299
+ type: 'image_url',
300
+ image_url: {
301
+ url: '_SOME_BASE64_DATA=',
302
+ detail: 'auto',
303
+ },
304
+ },
305
+ ]);
306
+ });
307
+
308
+ it('should handle messages with tool calls', () => {
309
+ const messages = [
310
+ new HumanMessage({
311
+ content: [
312
+ {
313
+ type: ContentTypes.TEXT,
314
+ [ContentTypes.TEXT]: 'Please use the calculator',
315
+ },
316
+ {
317
+ type: ContentTypes.TOOL_CALL,
318
+ tool_call: { name: 'calculator', args: '{"a": 1, "b": 2}' },
319
+ },
320
+ ],
321
+ }),
322
+ new AIMessage({
323
+ content: [
324
+ {
325
+ type: ContentTypes.TEXT,
326
+ [ContentTypes.TEXT]: 'I will calculate that for you',
327
+ },
328
+ {
329
+ type: ContentTypes.TOOL_CALL,
330
+ tool_call: { name: 'calculator', args: '{"a": 1, "b": 2}' },
331
+ },
332
+ ],
333
+ }),
334
+ ];
335
+
336
+ const result = formatContentStrings(messages);
337
+
338
+ expect(result).toHaveLength(2);
339
+ // Should not convert because not all blocks are text
340
+ expect(result[0].content).toEqual([
341
+ {
342
+ type: ContentTypes.TEXT,
343
+ [ContentTypes.TEXT]: 'Please use the calculator',
344
+ },
345
+ {
346
+ type: ContentTypes.TOOL_CALL,
347
+ tool_call: { name: 'calculator', args: '{"a": 1, "b": 2}' },
348
+ },
349
+ ]);
350
+ expect(result[1].content).toEqual([
351
+ {
352
+ type: ContentTypes.TEXT,
353
+ [ContentTypes.TEXT]: 'I will calculate that for you',
354
+ },
355
+ {
356
+ type: ContentTypes.TOOL_CALL,
357
+ tool_call: { name: 'calculator', args: '{"a": 1, "b": 2}' },
358
+ },
359
+ ]);
360
+ });
361
+ });
362
+ });
@@ -0,0 +1,63 @@
1
+ import { ContentTypes } from '@/common';
2
+ import type { BaseMessage } from '@langchain/core/messages';
3
+
4
+ /**
5
+ * Formats an array of messages for LangChain, making sure all content fields are strings
6
+ * @param {Array<HumanMessage | AIMessage | SystemMessage | ToolMessage>} payload - The array of messages to format.
7
+ * @returns {Array<HumanMessage | AIMessage | SystemMessage | ToolMessage>} - The array of formatted LangChain messages, including ToolMessages for tool calls.
8
+ */
9
+ export const formatContentStrings = (
10
+ payload: Array<BaseMessage>
11
+ ): Array<BaseMessage> => {
12
+ // Create a new array to store the processed messages
13
+ const result: Array<BaseMessage> = [];
14
+
15
+ for (const message of payload) {
16
+ const messageType = message.getType();
17
+ const isValidMessage =
18
+ messageType === 'human' ||
19
+ messageType === 'ai' ||
20
+ messageType === 'system';
21
+
22
+ if (!isValidMessage) {
23
+ result.push(message);
24
+ continue;
25
+ }
26
+
27
+ // If content is already a string, add as-is
28
+ if (typeof message.content === 'string') {
29
+ result.push(message);
30
+ continue;
31
+ }
32
+
33
+ // If content is not an array, add as-is
34
+ if (!Array.isArray(message.content)) {
35
+ result.push(message);
36
+ continue;
37
+ }
38
+
39
+ // Check if all content blocks are text type
40
+ const allTextBlocks = message.content.every(
41
+ (block) => block.type === ContentTypes.TEXT
42
+ );
43
+
44
+ // Only convert to string if all blocks are text type
45
+ if (!allTextBlocks) {
46
+ result.push(message);
47
+ continue;
48
+ }
49
+
50
+ // Reduce text types to a single string
51
+ const content = message.content.reduce((acc, curr) => {
52
+ if (curr.type === ContentTypes.TEXT) {
53
+ return `${acc}${curr[ContentTypes.TEXT] || ''}\n`;
54
+ }
55
+ return acc;
56
+ }, '');
57
+
58
+ message.content = content.trim();
59
+ result.push(message);
60
+ }
61
+
62
+ return result;
63
+ };
@@ -321,12 +321,15 @@ export function convertMessagesToContent(
321
321
  const id = (message as ToolMessage).tool_call_id;
322
322
  const output = (message as ToolMessage).content;
323
323
  const tool_call = toolCallMap.get(id);
324
-
324
+ if (currentAIMessageIndex === -1) {
325
+ processedContent.push({ type: 'text', text: '' });
326
+ currentAIMessageIndex = processedContent.length - 1;
327
+ }
328
+ const contentPart = processedContent[currentAIMessageIndex];
325
329
  processedContent.push({
326
330
  type: 'tool_call',
327
331
  tool_call: Object.assign({}, tool_call, { output }),
328
332
  });
329
- const contentPart = processedContent[currentAIMessageIndex];
330
333
  const tool_call_ids = contentPart.tool_call_ids || [];
331
334
  tool_call_ids.push(id);
332
335
  contentPart.tool_call_ids = tool_call_ids;
@@ -17,28 +17,28 @@ import type {
17
17
  } from '@/types';
18
18
  import { Providers, ContentTypes } from '@/common';
19
19
 
20
- interface VisionMessageParams {
20
+ interface MediaMessageParams {
21
21
  message: {
22
22
  role: string;
23
23
  content: string;
24
24
  name?: string;
25
25
  [key: string]: any;
26
26
  };
27
- image_urls: MessageContentImageUrl[];
27
+ mediaParts: MessageContentComplex[];
28
28
  endpoint?: Providers;
29
29
  }
30
30
 
31
31
  /**
32
- * Formats a message to OpenAI Vision API payload format.
32
+ * Formats a message with media content (images, documents, videos, audios) to API payload format.
33
33
  *
34
- * @param {VisionMessageParams} params - The parameters for formatting.
35
- * @returns {Object} - The formatted message.
34
+ * @param params - The parameters for formatting.
35
+ * @returns - The formatted message.
36
36
  */
37
- export const formatVisionMessage = ({
37
+ export const formatMediaMessage = ({
38
38
  message,
39
- image_urls,
40
39
  endpoint,
41
- }: VisionMessageParams): {
40
+ mediaParts,
41
+ }: MediaMessageParams): {
42
42
  role: string;
43
43
  content: MessageContentComplex[];
44
44
  name?: string;
@@ -57,7 +57,7 @@ export const formatVisionMessage = ({
57
57
 
58
58
  if (endpoint === Providers.ANTHROPIC) {
59
59
  result.content = [
60
- ...image_urls,
60
+ ...mediaParts,
61
61
  { type: ContentTypes.TEXT, text: message.content },
62
62
  ] as MessageContentComplex[];
63
63
  return result;
@@ -65,7 +65,7 @@ export const formatVisionMessage = ({
65
65
 
66
66
  result.content = [
67
67
  { type: ContentTypes.TEXT, text: message.content },
68
- ...image_urls,
68
+ ...mediaParts,
69
69
  ] as MessageContentComplex[];
70
70
 
71
71
  return result;
@@ -78,6 +78,9 @@ interface MessageInput {
78
78
  text?: string;
79
79
  content?: string | MessageContentComplex[];
80
80
  image_urls?: MessageContentImageUrl[];
81
+ documents?: MessageContentComplex[];
82
+ videos?: MessageContentComplex[];
83
+ audios?: MessageContentComplex[];
81
84
  lc_id?: string[];
82
85
  [key: string]: any;
83
86
  }
@@ -100,14 +103,14 @@ interface FormattedMessage {
100
103
  /**
101
104
  * Formats a message to OpenAI payload format based on the provided options.
102
105
  *
103
- * @param {FormatMessageParams} params - The parameters for formatting.
104
- * @returns {FormattedMessage | HumanMessage | AIMessage | SystemMessage} - The formatted message.
106
+ * @param params - The parameters for formatting.
107
+ * @returns - The formatted message.
105
108
  */
106
109
  export const formatMessage = ({
107
110
  message,
108
111
  userName,
109
- assistantName,
110
112
  endpoint,
113
+ assistantName,
111
114
  langChain = false,
112
115
  }: FormatMessageParams):
113
116
  | FormattedMessage
@@ -135,21 +138,7 @@ export const formatMessage = ({
135
138
  content,
136
139
  };
137
140
 
138
- const { image_urls } = message;
139
- if (Array.isArray(image_urls) && image_urls.length > 0 && role === 'user') {
140
- return formatVisionMessage({
141
- message: {
142
- ...formattedMessage,
143
- content:
144
- typeof formattedMessage.content === 'string'
145
- ? formattedMessage.content
146
- : '',
147
- },
148
- image_urls,
149
- endpoint,
150
- });
151
- }
152
-
141
+ // Set name fields first
153
142
  if (_name != null && _name) {
154
143
  formattedMessage.name = _name;
155
144
  }
@@ -179,6 +168,45 @@ export const formatMessage = ({
179
168
  }
180
169
  }
181
170
 
171
+ const { image_urls, documents, videos, audios } = message;
172
+ const mediaParts: MessageContentComplex[] = [];
173
+
174
+ if (Array.isArray(documents) && documents.length > 0) {
175
+ mediaParts.push(...documents);
176
+ }
177
+
178
+ if (Array.isArray(videos) && videos.length > 0) {
179
+ mediaParts.push(...videos);
180
+ }
181
+
182
+ if (Array.isArray(audios) && audios.length > 0) {
183
+ mediaParts.push(...audios);
184
+ }
185
+
186
+ if (Array.isArray(image_urls) && image_urls.length > 0) {
187
+ mediaParts.push(...image_urls);
188
+ }
189
+
190
+ if (mediaParts.length > 0 && role === 'user') {
191
+ const mediaMessage = formatMediaMessage({
192
+ message: {
193
+ ...formattedMessage,
194
+ content:
195
+ typeof formattedMessage.content === 'string'
196
+ ? formattedMessage.content
197
+ : '',
198
+ },
199
+ mediaParts,
200
+ endpoint,
201
+ });
202
+
203
+ if (!langChain) {
204
+ return mediaMessage;
205
+ }
206
+
207
+ return new HumanMessage(mediaMessage);
208
+ }
209
+
182
210
  if (!langChain) {
183
211
  return formattedMessage;
184
212
  }
@@ -195,9 +223,9 @@ export const formatMessage = ({
195
223
  /**
196
224
  * Formats an array of messages for LangChain.
197
225
  *
198
- * @param {Array<MessageInput>} messages - The array of messages to format.
199
- * @param {Omit<FormatMessageParams, 'message' | 'langChain'>} formatOptions - The options for formatting each message.
200
- * @returns {Array<HumanMessage | AIMessage | SystemMessage>} - The array of formatted LangChain messages.
226
+ * @param messages - The array of messages to format.
227
+ * @param formatOptions - The options for formatting each message.
228
+ * @returns - The array of formatted LangChain messages.
201
229
  */
202
230
  export const formatLangChainMessages = (
203
231
  messages: Array<MessageInput>,
@@ -228,8 +256,8 @@ interface LangChainMessage {
228
256
  /**
229
257
  * Formats a LangChain message object by merging properties from `lc_kwargs` or `kwargs` and `additional_kwargs`.
230
258
  *
231
- * @param {LangChainMessage} message - The message object to format.
232
- * @returns {Record<string, any>} The formatted LangChain message.
259
+ * @param message - The message object to format.
260
+ * @returns - The formatted LangChain message.
233
261
  */
234
262
  export const formatFromLangChain = (
235
263
  message: LangChainMessage
@@ -357,10 +385,10 @@ function formatAssistantMessage(
357
385
  /**
358
386
  * Formats an array of messages for LangChain, handling tool calls and creating ToolMessage instances.
359
387
  *
360
- * @param {TPayload} payload - The array of messages to format.
361
- * @param {Record<number, number>} [indexTokenCountMap] - Optional map of message indices to token counts.
362
- * @param {Set<string>} [tools] - Optional set of tool names that are allowed in the request.
363
- * @returns {Object} - Object containing formatted messages and updated indexTokenCountMap if provided.
388
+ * @param payload - The array of messages to format.
389
+ * @param indexTokenCountMap - Optional map of message indices to token counts.
390
+ * @param tools - Optional set of tool names that are allowed in the request.
391
+ * @returns - Object containing formatted messages and updated indexTokenCountMap if provided.
364
392
  */
365
393
  export const formatAgentMessages = (
366
394
  payload: TPayload,
@@ -537,40 +565,6 @@ export const formatAgentMessages = (
537
565
  };
538
566
  };
539
567
 
540
- /**
541
- * Formats an array of messages for LangChain, making sure all content fields are strings
542
- * @param {Array<HumanMessage | AIMessage | SystemMessage | ToolMessage>} payload - The array of messages to format.
543
- * @returns {Array<HumanMessage | AIMessage | SystemMessage | ToolMessage>} - The array of formatted LangChain messages, including ToolMessages for tool calls.
544
- */
545
- export const formatContentStrings = (
546
- payload: Array<BaseMessage>
547
- ): Array<BaseMessage> => {
548
- // Create a copy of the payload to avoid modifying the original
549
- const result = [...payload];
550
-
551
- for (const message of result) {
552
- if (typeof message.content === 'string') {
553
- continue;
554
- }
555
-
556
- if (!Array.isArray(message.content)) {
557
- continue;
558
- }
559
-
560
- // Reduce text types to a single string, ignore all other types
561
- const content = message.content.reduce((acc, curr) => {
562
- if (curr.type === ContentTypes.TEXT) {
563
- return `${acc}${curr[ContentTypes.TEXT] || ''}\n`;
564
- }
565
- return acc;
566
- }, '');
567
-
568
- message.content = content.trim();
569
- }
570
-
571
- return result;
572
- };
573
-
574
568
  /**
575
569
  * Adds a value at key 0 for system messages and shifts all key indices by one in an indexTokenCountMap.
576
570
  * This is useful when adding a system message at the beginning of a conversation.