npm - symposium - Versions diffs - 0.13.8 → 0.14.0 - Mend

symposium 0.13.8 → 0.14.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.

Files changed (6) hide show

package/Agent.js CHANGED Viewed

@@ -88,6 +88,17 @@ export default class Agent {
 			this.callbacks[i + '-' + thread.id].push(callback);
 		}
+		const model = Symposium.getModelByName(thread.state.model);
+		if (!model.supports_audio) {
+			for (let c of content) {
+				if (c.type === 'audio' && !c.content?.transcription) {
+					const words = await this.getPromptWordsForTranscription(thread);
+					const prompt = words.length ? 'Possibili parole usate: ' + words.join(', ') : null;
+					c.content.transcription = await Symposium.transcribe(c.content, prompt);
+				}
+			}
+		}
 		await this.log('user_message', content);
 		thread.addMessage('user', content);
@@ -205,19 +216,6 @@ export default class Agent {
 	async generateCompletion(thread, options = {}, retry_counter = 1) {
 		try {
 			const model = Symposium.getModelByName(thread.state.model);
-			for (let message of thread.messages) {
-				for (let c of message.content) {
-					if (c.type === 'audio' && !model.supports_audio) {
-						const words = await this.getPromptWordsForTranscription(thread);
-						const prompt = words.length ? 'Possibili parole usate: ' + words.join(', ') : null;
-						const transcribed = await Symposium.transcribe(c.content, prompt);
-						c.type = 'text';
-						c.content = '[voice message] ' + transcribed;
-					}
-				}
-			}
 			const messages = await model.generate(thread, await this.getFunctions(), options);
 			return model.supports_functions ? messages : messages.map(m => this.parseFunctions(m));
 		} catch (error) {

package/Symposium.js CHANGED Viewed

@@ -85,17 +85,17 @@ export default class Symposium {
 		let file;
 		switch (audio.type) {
 			case 'url':
-				if (!audio.url)
+				if (!audio.data)
 					throw new Error('Audio URL is required');
-				if (audio.url.startsWith('/')) { // Local path
+				if (audio.data.startsWith('/')) { // Local path
 					// Get with fs
-					if (!fs.existsSync(audio.url))
-						throw new Error('Audio file does not exist at the specified path: ' + audio.url);
+					if (!fs.existsSync(audio.data))
+						throw new Error('Audio file does not exist at the specified path: ' + audio.data);
-					file = fs.readFileSync(audio.url);
+					file = fs.readFileSync(audio.data);
 				} else {
-					file = await fetch(audio.url).then(res => res.blob());
+					file = await fetch(audio.data).then(res => res.blob());
 				}
 				file = new File([file], 'audio.' + this.getExtFromMime(file.type), {type: file.type});

package/models/AnthropicModel.js CHANGED Viewed

@@ -148,6 +148,17 @@ export default class AnthropicModel extends Model {
 							}
 							break;
+						case 'audio':
+							if (c.content.transcription) {
+								content.push({
+									type: 'text',
+									text: '[transcribed] ' + c.content.transcription,
+								});
+							} else {
+								throw new Error('Audio content is not supported by this model');
+							}
+							break;
 						default:
 							throw new Error('Message type "' + c.type + '" unsupported by this model');
 					}

package/models/GroqModel.js CHANGED Viewed

@@ -158,6 +158,19 @@ export default class GroqModel extends Model {
 					}
 					break;
+				case 'audio':
+					if (c.content.transcription) {
+						messages.push({
+							role: message.role,
+							content: '[transcribed] ' + c.content.transcription,
+							name: message.name,
+						});
+					} else {
+						throw new Error('Audio content is not supported by this model');
+					}
+					break;
 				default:
 					throw new Error('Message type unsupported by this model');
 			}

package/models/OpenAIModel.js CHANGED Viewed

@@ -140,24 +140,34 @@ export default class OpenAIModel extends Model {
 					break;
 				case 'audio':
-					if (c.content.type !== 'base64')
-						throw new Error('Audio content must be base64 encoded for this model');
-					if (!['audio/mpeg', 'audio/wav'].includes(c.content.mime))
-						throw new Error('Audio content must have a valid MIME type');
+					if (this.supports_audio) {
+						if (c.content.type !== 'base64')
+							throw new Error('Audio content must be base64 encoded for this model');
+						if (!['audio/mpeg', 'audio/wav'].includes(c.content.mime))
+							throw new Error('Audio content must have a valid MIME type');
-					messages.push({
-						role,
-						content: [
-							{
-								type: 'input_audio',
-								input_audio: {
-									data: c.content.data,
-									format: c.content.mime === 'audio/mpeg' ? 'mp3' : 'wav',
+						messages.push({
+							role,
+							content: [
+								{
+									type: 'input_audio',
+									input_audio: {
+										data: c.content.data,
+										format: c.content.mime === 'audio/mpeg' ? 'mp3' : 'wav',
+									},
 								},
-							},
-						],
-						name: message.name,
-					});
+							],
+							name: message.name,
+						});
+					} else if (c.content.transcription) {
+						messages.push({
+							role,
+							content: '[transcribed] ' + c.content.transcription,
+							name: message.name,
+						});
+					} else{
+						throw new Error('Audio content is not supported by this model');
+					}
 					break;
 				case 'function':

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "type": "module",
   "name": "symposium",
-  "version": "0.13.8",
+  "version": "0.14.0",
   "description": "Agents",
   "main": "index.js",
   "author": "Domenico Giambra",