npm - @supertone/supertone - Versions diffs - 0.1.2 → 0.1.4 - Mend

@supertone/supertone 0.1.2 → 0.1.4

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (52)

package/README.md +4 -4
package/custom_test/realtime_tts_player.ts +120 -16
package/custom_test/test_pronunciation_dictionary.ts +227 -0
package/custom_test/test_real_api.ts +580 -0
package/custom_test/test_text_utils_chunk_text_punctuation.ts +55 -0
package/dist/commonjs/lib/config.d.ts +2 -2
package/dist/commonjs/lib/config.d.ts.map +1 -1
package/dist/commonjs/lib/config.js +2 -2
package/dist/commonjs/lib/config.js.map +1 -1
package/dist/commonjs/lib/custom_utils/index.d.ts +1 -0
package/dist/commonjs/lib/custom_utils/index.d.ts.map +1 -1
package/dist/commonjs/lib/custom_utils/index.js +5 -1
package/dist/commonjs/lib/custom_utils/index.js.map +1 -1
package/dist/commonjs/lib/custom_utils/pronunciation_utils.d.ts +24 -0
package/dist/commonjs/lib/custom_utils/pronunciation_utils.d.ts.map +1 -0
package/dist/commonjs/lib/custom_utils/pronunciation_utils.js +145 -0
package/dist/commonjs/lib/custom_utils/pronunciation_utils.js.map +1 -0
package/dist/commonjs/lib/custom_utils/text_utils.d.ts +1 -1
package/dist/commonjs/lib/custom_utils/text_utils.d.ts.map +1 -1
package/dist/commonjs/lib/custom_utils/text_utils.js +21 -4
package/dist/commonjs/lib/custom_utils/text_utils.js.map +1 -1
package/dist/commonjs/sdk/texttospeech.d.ts +17 -6
package/dist/commonjs/sdk/texttospeech.d.ts.map +1 -1
package/dist/commonjs/sdk/texttospeech.js +48 -25
package/dist/commonjs/sdk/texttospeech.js.map +1 -1
package/dist/esm/lib/config.d.ts +2 -2
package/dist/esm/lib/config.d.ts.map +1 -1
package/dist/esm/lib/config.js +2 -2
package/dist/esm/lib/config.js.map +1 -1
package/dist/esm/lib/custom_utils/index.d.ts +1 -0
package/dist/esm/lib/custom_utils/index.d.ts.map +1 -1
package/dist/esm/lib/custom_utils/index.js +2 -0
package/dist/esm/lib/custom_utils/index.js.map +1 -1
package/dist/esm/lib/custom_utils/pronunciation_utils.d.ts +24 -0
package/dist/esm/lib/custom_utils/pronunciation_utils.d.ts.map +1 -0
package/dist/esm/lib/custom_utils/pronunciation_utils.js +140 -0
package/dist/esm/lib/custom_utils/pronunciation_utils.js.map +1 -0
package/dist/esm/lib/custom_utils/text_utils.d.ts +1 -1
package/dist/esm/lib/custom_utils/text_utils.d.ts.map +1 -1
package/dist/esm/lib/custom_utils/text_utils.js +21 -4
package/dist/esm/lib/custom_utils/text_utils.js.map +1 -1
package/dist/esm/sdk/texttospeech.d.ts +17 -6
package/dist/esm/sdk/texttospeech.d.ts.map +1 -1
package/dist/esm/sdk/texttospeech.js +49 -26
package/dist/esm/sdk/texttospeech.js.map +1 -1
package/jsr.json +1 -1
package/package.json +1 -1
package/src/lib/config.ts +41 -41
package/src/lib/custom_utils/index.ts +7 -0
package/src/lib/custom_utils/pronunciation_utils.ts +193 -0
package/src/lib/custom_utils/text_utils.ts +25 -4
package/src/sdk/texttospeech.ts +99 -68

package/custom_test/test_real_api.ts CHANGED Viewed

@@ -1084,6 +1084,235 @@ async function testCreateSpeechJapaneseNoSpaces(
 	}
 }
+/**
+ * Test TTS with Arabic text and Arabic punctuation marks (؟ ؛ ۔)
+ * This tests multilingual sentence punctuation support added in fix/text_utils
+ */
+async function testCreateSpeechArabicPunctuation(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("🇸🇦 Arabic Text with Arabic Punctuation Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Arabic text with Arabic punctuation marks (؟ ؛ ۔ ،)
+		// Text length: ~350 characters (exceeds 300 char limit)
+		const arabicText =
+			"مرحبا بكم في اختبار تقنية تحويل النص إلى كلام؟ " +
+			"هذا النظام يدعم اللغة العربية بشكل كامل؛ " +
+			"يمكنه التعرف على علامات الترقيم العربية مثل علامة الاستفهام وعلامة الفاصلة المنقوطة۔ " +
+			"تقنية الذكاء الاصطناعي تتطور بسرعة كبيرة، " +
+			"والآن يمكننا تحويل النصوص الطويلة إلى كلام طبيعي؟ " +
+			"هذا الاختبار يتحقق من أن النظام يقسم النص بشكل صحيح عند علامات الترقيم العربية؛ " +
+			"نأمل أن يعمل كل شيء بشكل مثالي۔";
+		const actualLength = arabicText.length;
+		console.log(
+			`  📏 Text length: ${actualLength} characters (Arabic with Arabic punctuation)`
+		);
+		console.log(`  🔧 Expected behavior: Sentence-based chunking with Arabic punctuation (؟ ؛ ۔)`);
+		console.log("  ⚠️  This test consumes credits!");
+		if (actualLength <= 300) {
+			console.log(`  ❌ Text length ${actualLength} is <= 300, test may not trigger chunking`);
+		}
+		const response = await client.textToSpeech.createSpeech({
+			voiceId,
+			apiConvertTextToSpeechUsingCharacterRequest: {
+				text: arabicText,
+				language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.Ar,
+				outputFormat:
+					models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+				style: "neutral",
+				model: models.APIConvertTextToSpeechUsingCharacterRequestModel.SonaSpeech2,
+			},
+		});
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			console.log(
+				`  ✅ Arabic punctuation chunking TTS success: ${audioData.length} bytes`
+			);
+			console.log(`  🎯 Arabic text with Arabic punctuation processed correctly!`);
+			const outputFile = "test_arabic_punctuation_speech_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile}`);
+			const estimatedChunks = Math.ceil(actualLength / 300);
+			console.log(`  📊 Estimated chunks: ${estimatedChunks}`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Arabic punctuation chunking");
+		return [false, e];
+	}
+}
+/**
+ * Test TTS with Hindi text and Devanagari punctuation marks (। ॥)
+ * This tests multilingual sentence punctuation support added in fix/text_utils
+ */
+async function testCreateSpeechHindiPunctuation(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("🇮🇳 Hindi Text with Devanagari Punctuation Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Hindi text with Devanagari punctuation marks (। ॥)
+		// Text length: ~380 characters (exceeds 300 char limit)
+		const hindiText =
+			"नमस्ते और स्वागत है आपका इस परीक्षण में। " +
+			"यह प्रणाली हिंदी भाषा का पूर्ण समर्थन करती है। " +
+			"देवनागरी लिपि में पूर्ण विराम और दोहरा दंड जैसे विराम चिह्न होते हैं॥ " +
+			"कृत्रिम बुद्धिमत्ता की तकनीक बहुत तेजी से विकसित हो रही है। " +
+			"अब हम लंबे पाठों को स्वाभाविक वाणी में बदल सकते हैं। " +
+			"यह परीक्षण जांचता है कि सिस्टम हिंदी विराम चिह्नों पर सही ढंग से पाठ को विभाजित करता है। " +
+			"हमें आशा है कि सब कुछ ठीक से काम करेगा॥";
+		const actualLength = hindiText.length;
+		console.log(
+			`  📏 Text length: ${actualLength} characters (Hindi with Devanagari punctuation)`
+		);
+		console.log(`  🔧 Expected behavior: Sentence-based chunking with Devanagari punctuation (। ॥)`);
+		console.log("  ⚠️  This test consumes credits!");
+		if (actualLength <= 300) {
+			console.log(`  ❌ Text length ${actualLength} is <= 300, test may not trigger chunking`);
+		}
+		const response = await client.textToSpeech.createSpeech({
+			voiceId,
+			apiConvertTextToSpeechUsingCharacterRequest: {
+				text: hindiText,
+				language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.Hi,
+				outputFormat:
+					models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+				style: "neutral",
+				model: models.APIConvertTextToSpeechUsingCharacterRequestModel.SonaSpeech2,
+			},
+		});
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			console.log(
+				`  ✅ Hindi punctuation chunking TTS success: ${audioData.length} bytes`
+			);
+			console.log(`  🎯 Hindi text with Devanagari punctuation processed correctly!`);
+			const outputFile = "test_hindi_punctuation_speech_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile}`);
+			const estimatedChunks = Math.ceil(actualLength / 300);
+			console.log(`  📊 Estimated chunks: ${estimatedChunks}`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Hindi punctuation chunking");
+		return [false, e];
+	}
+}
+/**
+ * Test TTS with ellipsis punctuation marks (… ‥)
+ * This tests multilingual sentence punctuation support added in fix/text_utils
+ */
+async function testCreateSpeechEllipsisPunctuation(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("⏳ Text with Ellipsis Punctuation Test (… ‥)");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Text with ellipsis punctuation marks (… ‥)
+		// Text length: ~380 characters (exceeds 300 char limit)
+		const ellipsisText =
+			"Sometimes we need to pause and think… " +
+			"The ellipsis character is used to indicate a trailing thought or a pause in speech… " +
+			"This test verifies that the text chunking system correctly handles Unicode ellipsis characters‥ " +
+			"There are actually multiple types of ellipsis in Unicode… " +
+			"The horizontal ellipsis U+2026 and the two dot leader U+2025 are both supported‥ " +
+			"When processing long texts the SDK should split at these punctuation marks… " +
+			"This ensures natural pauses in the generated speech output‥ " +
+			"Let us verify that everything works correctly…";
+		const actualLength = ellipsisText.length;
+		console.log(
+			`  📏 Text length: ${actualLength} characters (with ellipsis punctuation)`
+		);
+		console.log(`  🔧 Expected behavior: Sentence-based chunking with ellipsis (… ‥)`);
+		console.log("  ⚠️  This test consumes credits!");
+		if (actualLength <= 300) {
+			console.log(`  ❌ Text length ${actualLength} is <= 300, test may not trigger chunking`);
+		}
+		const response = await client.textToSpeech.createSpeech({
+			voiceId,
+			apiConvertTextToSpeechUsingCharacterRequest: {
+				text: ellipsisText,
+				language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.En,
+				outputFormat:
+					models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+				style: "neutral",
+				model: models.APIConvertTextToSpeechUsingCharacterRequestModel.SonaSpeech1,
+			},
+		});
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			console.log(
+				`  ✅ Ellipsis punctuation chunking TTS success: ${audioData.length} bytes`
+			);
+			console.log(`  🎯 Text with ellipsis punctuation processed correctly!`);
+			const outputFile = "test_ellipsis_punctuation_speech_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile}`);
+			const estimatedChunks = Math.ceil(actualLength / 300);
+			console.log(`  📊 Estimated chunks: ${estimatedChunks}`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Ellipsis punctuation chunking");
+		return [false, e];
+	}
+}
 /**
  * Test TTS streaming with long text
  */
@@ -2387,6 +2616,304 @@ async function testCreateSpeechWithChunking(
 	}
 }
+// =============================================================================
+// Pronunciation Dictionary Tests
+// =============================================================================
+/**
+ * Test TTS with pronunciation dictionary (basic test with partial_match=true/false)
+ */
+async function testCreateSpeechWithPronunciationDictionary(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("📖 TTS with Pronunciation Dictionary Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Test text with abbreviations and special terms
+		const testText =
+			"The CEO of OpenAI announced that GPT models are improving. Dr. Smith from MIT said AI research is accelerating.";
+		// Pronunciation dictionary with both partial_match=true and partial_match=false cases
+		const pronunciationDictionary = [
+			// partial_match=false: exact word boundary match
+			{ text: "CEO", pronunciation: "Chief Executive Officer", partial_match: false },
+			{ text: "MIT", pronunciation: "Massachusetts Institute of Technology", partial_match: false },
+			{ text: "AI", pronunciation: "Artificial Intelligence", partial_match: false },
+			// partial_match=true: substring match (will match "OpenAI" -> "OpenArtificial Intelligence")
+			{ text: "GPT", pronunciation: "Generative Pre-trained Transformer", partial_match: true },
+			{ text: "Dr.", pronunciation: "Doctor", partial_match: true },
+		];
+		console.log(`  🔍 Original text: "${testText}"`);
+		console.log(`  📖 Pronunciation dictionary entries: ${pronunciationDictionary.length}`);
+		console.log(`     - partial_match=false: CEO, MIT, AI (word boundary match)`);
+		console.log(`     - partial_match=true: GPT, Dr. (substring match)`);
+		console.log("  ⚠️  This test consumes credits!");
+		const response = await client.textToSpeech.createSpeech(
+			{
+				voiceId,
+				apiConvertTextToSpeechUsingCharacterRequest: {
+					text: testText,
+					language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.En,
+					outputFormat:
+						models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+					style: "neutral",
+					model: "sona_speech_1",
+				},
+			},
+			{
+				pronunciationDictionary,
+			}
+		);
+		console.log(`  ✅ TTS with pronunciation dictionary success`);
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			const outputFile = "test_pronunciation_dictionary_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile} (${audioData.length} bytes)`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Pronunciation dictionary TTS");
+		return [false, e];
+	}
+}
+/**
+ * Test TTS with pronunciation dictionary causing text to exceed 300 chars (triggers chunking)
+ */
+async function testCreateSpeechWithPronunciationDictionaryLongText(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("📖 TTS with Pronunciation Dictionary + Long Text Chunking Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Short original text (~200 chars) that will exceed 300 chars after pronunciation dictionary expansion
+		const testText =
+			"AI and ML are revolutionizing tech. The CEO of OpenAI discussed GPT advancements. " +
+			"Dr. Kim from MIT explained how NLP and CV work together. AWS and GCP provide cloud AI services.";
+		// Pronunciation dictionary that expands abbreviations significantly
+		const pronunciationDictionary = [
+			// partial_match=false: exact word boundary matches
+			{ text: "AI", pronunciation: "Artificial Intelligence", partial_match: false },
+			{ text: "ML", pronunciation: "Machine Learning", partial_match: false },
+			{ text: "CEO", pronunciation: "Chief Executive Officer", partial_match: false },
+			{ text: "MIT", pronunciation: "Massachusetts Institute of Technology", partial_match: false },
+			{ text: "NLP", pronunciation: "Natural Language Processing", partial_match: false },
+			{ text: "CV", pronunciation: "Computer Vision", partial_match: false },
+			{ text: "AWS", pronunciation: "Amazon Web Services", partial_match: false },
+			{ text: "GCP", pronunciation: "Google Cloud Platform", partial_match: false },
+			// partial_match=true: substring matches
+			{ text: "GPT", pronunciation: "Generative Pre-trained Transformer", partial_match: true },
+			{ text: "Dr.", pronunciation: "Doctor", partial_match: true },
+			{ text: "tech", pronunciation: "technology", partial_match: true },
+		];
+		const originalLength = testText.length;
+		console.log(`  🔍 Original text length: ${originalLength} characters (under 300)`);
+		console.log(`  📖 Pronunciation dictionary entries: ${pronunciationDictionary.length}`);
+		console.log(`     - partial_match=false: AI, ML, CEO, MIT, NLP, CV, AWS, GCP`);
+		console.log(`     - partial_match=true: GPT, Dr., tech`);
+		console.log(`  🔧 Expected: Text will expand to 300+ chars, triggering auto-chunking`);
+		console.log("  ⚠️  This test consumes credits!");
+		const response = await client.textToSpeech.createSpeech(
+			{
+				voiceId,
+				apiConvertTextToSpeechUsingCharacterRequest: {
+					text: testText,
+					language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.En,
+					outputFormat:
+						models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+					style: "neutral",
+					model: "sona_speech_1",
+				},
+			},
+			{
+				pronunciationDictionary,
+			}
+		);
+		console.log(`  ✅ TTS with pronunciation dictionary + long text chunking success`);
+		console.log(`  🎯 Auto-chunking was triggered after pronunciation expansion!`);
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			const outputFile = "test_pronunciation_dictionary_long_text_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile} (${audioData.length} bytes)`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Pronunciation dictionary long text TTS");
+		return [false, e];
+	}
+}
+/**
+ * Test TTS streaming with pronunciation dictionary
+ */
+async function testStreamSpeechWithPronunciationDictionary(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("📡 TTS Streaming with Pronunciation Dictionary Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		const testText =
+			"The API documentation explains how to use the SDK. " +
+			"Dr. Lee from NASA discussed the new AI system.";
+		const pronunciationDictionary = [
+			{ text: "API", pronunciation: "Application Programming Interface", partial_match: false },
+			{ text: "SDK", pronunciation: "Software Development Kit", partial_match: false },
+			{ text: "NASA", pronunciation: "National Aeronautics and Space Administration", partial_match: false },
+			{ text: "AI", pronunciation: "Artificial Intelligence", partial_match: false },
+			{ text: "Dr.", pronunciation: "Doctor", partial_match: true },
+		];
+		console.log(`  🔍 Original text: "${testText}"`);
+		console.log(`  📖 Pronunciation dictionary entries: ${pronunciationDictionary.length}`);
+		console.log("  ⚠️  This test consumes credits!");
+		const response = await client.textToSpeech.streamSpeech(
+			{
+				voiceId,
+				apiConvertTextToSpeechUsingCharacterRequest: {
+					text: testText,
+					language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.En,
+					outputFormat:
+						models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+				},
+			},
+			{
+				pronunciationDictionary,
+			}
+		);
+		console.log(`  ✅ Stream with pronunciation dictionary started successfully`);
+		// Consume the stream and save to file
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			const outputFile = "test_pronunciation_dictionary_stream_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile} (${audioData.length} bytes)`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Pronunciation dictionary streaming TTS");
+		return [false, e];
+	}
+}
+/**
+ * Test TTS streaming with pronunciation dictionary + long text (triggers chunking)
+ */
+async function testStreamSpeechWithPronunciationDictionaryLongText(
+	voiceId: string | null
+): Promise<[boolean, any]> {
+	console.log("📡 TTS Streaming with Pronunciation Dictionary + Long Text Test");
+	if (!voiceId) {
+		console.log("  ⚠️  No voice ID available");
+		return [false, null];
+	}
+	try {
+		const { Supertone } = await import("../src/index.js");
+		const models = await import("../src/models/index.js");
+		const client = new Supertone({ apiKey: API_KEY });
+		// Short text that will expand after pronunciation dictionary
+		const testText =
+			"AI is everywhere. ML powers many apps. The CEO spoke about GPT. " +
+			"Dr. Smith from MIT and UCLA collaborated on NLP research. AWS and GCP offer AI services.";
+		const pronunciationDictionary = [
+			{ text: "AI", pronunciation: "Artificial Intelligence", partial_match: false },
+			{ text: "ML", pronunciation: "Machine Learning", partial_match: false },
+			{ text: "CEO", pronunciation: "Chief Executive Officer", partial_match: false },
+			{ text: "MIT", pronunciation: "Massachusetts Institute of Technology", partial_match: false },
+			{ text: "UCLA", pronunciation: "University of California Los Angeles", partial_match: false },
+			{ text: "NLP", pronunciation: "Natural Language Processing", partial_match: false },
+			{ text: "AWS", pronunciation: "Amazon Web Services", partial_match: false },
+			{ text: "GCP", pronunciation: "Google Cloud Platform", partial_match: false },
+			{ text: "GPT", pronunciation: "Generative Pre-trained Transformer", partial_match: true },
+			{ text: "Dr.", pronunciation: "Doctor", partial_match: true },
+		];
+		console.log(`  🔍 Original text length: ${testText.length} characters`);
+		console.log(`  📖 Pronunciation dictionary entries: ${pronunciationDictionary.length}`);
+		console.log(`  🔧 Expected: Text will expand to 300+ chars, triggering stream chunking`);
+		console.log("  ⚠️  This test consumes credits!");
+		const response = await client.textToSpeech.streamSpeech(
+			{
+				voiceId,
+				apiConvertTextToSpeechUsingCharacterRequest: {
+					text: testText,
+					language: models.APIConvertTextToSpeechUsingCharacterRequestLanguage.En,
+					outputFormat:
+						models.APIConvertTextToSpeechUsingCharacterRequestOutputFormat.Wav,
+				},
+			},
+			{
+				pronunciationDictionary,
+			}
+		);
+		console.log(`  ✅ Stream with pronunciation dictionary + long text started successfully`);
+		console.log(`  🎯 Stream chunking was triggered after pronunciation expansion!`);
+		if (response.result) {
+			const audioData = await extractAudioData(response);
+			const outputFile = "test_pronunciation_dictionary_stream_long_text_output.wav";
+			fs.writeFileSync(outputFile, audioData);
+			console.log(`  💾 Audio saved: ${outputFile} (${audioData.length} bytes)`);
+		}
+		return [true, response];
+	} catch (e: any) {
+		logDetailedError(e, "Pronunciation dictionary streaming long text TTS");
+		return [false, e];
+	}
+}
 /**
  * Main test execution
  */
@@ -2569,6 +3096,21 @@ async function main(): Promise<boolean> {
 		[success, result] = await testCreateSpeechJapaneseNoSpaces(voiceIdForTTS);
 		testResults["create_speech_japanese_no_spaces"] = success;
+		// 6.5 Multilingual Punctuation Tests (fix/text_utils)
+		console.log("\n🌍 Multilingual Punctuation Chunking Tests");
+		console.log("-".repeat(60));
+		console.log("⚠️  These tests verify multilingual sentence punctuation support!");
+		console.log("");
+		[success, result] = await testCreateSpeechArabicPunctuation(voiceIdForTTS);
+		testResults["create_speech_arabic_punctuation"] = success;
+		[success, result] = await testCreateSpeechHindiPunctuation(voiceIdForTTS);
+		testResults["create_speech_hindi_punctuation"] = success;
+		[success, result] = await testCreateSpeechEllipsisPunctuation(voiceIdForTTS);
+		testResults["create_speech_ellipsis_punctuation"] = success;
 		[success, result] = await testStreamSpeechLongText(voiceIdForTTS);
 		testResults["stream_speech_long_text"] = success;
@@ -2621,6 +3163,32 @@ async function main(): Promise<boolean> {
 		[success, result] = await testStreamSpeechLongTextMp3(voiceIdForTTS);
 		testResults["stream_speech_long_text_mp3"] = success;
+		// 10. Pronunciation Dictionary Tests
+		console.log("\n📖 Pronunciation Dictionary Tests");
+		console.log("-".repeat(60));
+		console.log("⚠️  These tests consume credits!");
+		console.log("");
+		[success, result] = await testCreateSpeechWithPronunciationDictionary(
+			voiceIdForTTS
+		);
+		testResults["create_speech_pronunciation_dictionary"] = success;
+		[success, result] = await testCreateSpeechWithPronunciationDictionaryLongText(
+			voiceIdForTTS
+		);
+		testResults["create_speech_pronunciation_dictionary_long_text"] = success;
+		[success, result] = await testStreamSpeechWithPronunciationDictionary(
+			voiceIdForTTS
+		);
+		testResults["stream_speech_pronunciation_dictionary"] = success;
+		[success, result] = await testStreamSpeechWithPronunciationDictionaryLongText(
+			voiceIdForTTS
+		);
+		testResults["stream_speech_pronunciation_dictionary_long_text"] = success;
 	}
 	// Results Summary
@@ -2681,6 +3249,9 @@ async function main(): Promise<boolean> {
 	console.log(
 		"  • TTS Chunking Strategies: Word-based (no punctuation), Character-based (Japanese)"
 	);
+	console.log(
+		"  • Multilingual Punctuation: Arabic (؟ ؛ ۔), Hindi (। ॥), Ellipsis (… ‥)"
+	);
 	console.log(
 		"  • TTS with Voice Settings: createSpeechWithVoiceSettings, predictDurationWithVoiceSettings, streamSpeechWithVoiceSettings"
 	);
@@ -2693,6 +3264,15 @@ async function main(): Promise<boolean> {
 	console.log(
 		"  • Custom Features: Auto-chunking in createSpeech/streamSpeech (transparent)"
 	);
+	console.log(
+		"  • Pronunciation Dictionary: createSpeech/streamSpeech with pronunciationDictionary option"
+	);
+	console.log(
+		"    - partial_match=false (word boundary) and partial_match=true (substring)"
+	);
+	console.log(
+		"    - Long text chunking after pronunciation expansion"
+	);
 	console.log("");
 	console.log("🤖 New Model & Language Tests:");
 	console.log(

package/custom_test/test_text_utils_chunk_text_punctuation.ts ADDED Viewed

@@ -0,0 +1,55 @@
+#!/usr/bin/env node
+/**
+ * Smoke test for multilingual sentence punctuation splitting in chunkText().
+ *
+ * Run:
+ *   npx ts-node custom_test/test_text_utils_chunk_text_punctuation.ts
+ *   # or after build:
+ *   node dist/custom_test/test_text_utils_chunk_text_punctuation.js
+ */
+import { chunkText } from "../src/lib/custom_utils/text_utils.js";
+function assertSplits(
+	text: string,
+	expectedChunks: string[],
+	maxLength: number
+): void {
+	const got = chunkText(text, maxLength);
+	const passed = JSON.stringify(got) === JSON.stringify(expectedChunks);
+	if (!passed) {
+		throw new Error(
+			`\ntext=${JSON.stringify(text)}\nexpected=${JSON.stringify(expectedChunks)}\ngot=${JSON.stringify(got)}`
+		);
+	}
+}
+function main(): void {
+	// English / many EU languages
+	assertSplits("Hello. World!", ["Hello. ", "World!"], 8);
+	// Korean (mostly ASCII punctuation in practice, plus ellipsis)
+	assertSplits("안...반가… 네.", ["안...", "반가… ", "네."], 4);
+	// Japanese
+	assertSplits(
+		"こんにちは。元気ですか？はい！",
+		["こんにちは。", "元気ですか？", "はい！"],
+		6
+	);
+	// Arabic (short samples to avoid max_length merge issues)
+	assertSplits("مر؟ نعم۔", ["مر؟ ", "نعم۔"], 5);
+	// Hindi
+	assertSplits("हाँ। नहीं॥", ["हाँ। ", "नहीं॥"], 6);
+	// Greek question mark (U+037E)
+	assertSplits("Γεια;Καλά.", ["Γεια;", "Καλά."], 5);
+	console.log("OK: chunkText punctuation smoke test passed");
+}
+main();

package/dist/commonjs/lib/config.d.ts CHANGED Viewed

@@ -31,8 +31,8 @@ export declare function serverURLFromOptions(options: SDKOptions): URL | null;
 export declare const SDK_METADATA: {
     readonly language: "typescript";
     readonly openapiDocVersion: "0.8.69";
-    readonly sdkVersion: "0.1.2";
+    readonly sdkVersion: "0.1.4";
     readonly genVersion: "2.686.7";
-    readonly userAgent: "speakeasy-sdk/typescript 0.1.2 2.686.7 0.8.69 @supertone/supertone";
+    readonly userAgent: "speakeasy-sdk/typescript 0.1.4 2.686.7 0.8.69 @supertone/supertone";
 };
 //# sourceMappingURL=config.d.ts.map

package/dist/commonjs/lib/config.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"config.d.ts","sourceRoot":"","sources":["../../../src/lib/config.ts"],"names":[],"mappings":"AAIA,OAAO,EAAE,UAAU,EAAE,MAAM,WAAW,CAAC;AACvC,OAAO,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AACrC,OAAO,EAAE,WAAW,EAAE,MAAM,cAAc,CAAC;AAG3C;;GAEG;AACH,eAAO,MAAM,UAAU,uCAKb,CAAC;AAEX,MAAM,MAAM,UAAU,GAAG;IACvB,MAAM,CAAC,EAAE,MAAM,GAAG,CAAC,MAAM,OAAO,CAAC,MAAM,CAAC,CAAC,GAAG,SAAS,CAAC;IAEtD,UAAU,CAAC,EAAE,UAAU,CAAC;IACxB;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,WAAW,CAAC,EAAE,WAAW,CAAC;IAC1B,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB,CAAC;AAEF,wBAAgB,oBAAoB,CAAC,OAAO,EAAE,UAAU,GAAG,GAAG,GAAG,IAAI,CAepE;AAED,eAAO,MAAM,YAAY;;;;;;CAOf,CAAC"}
1	+ {"version":3,"file":"config.d.ts","sourceRoot":"","sources":["../../../src/lib/config.ts"],"names":[],"mappings":"AAIA,OAAO,EAAE,UAAU,EAAE,MAAM,WAAW,CAAC;AACvC,OAAO,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AACrC,OAAO,EAAE,WAAW,EAAE,MAAM,cAAc,CAAC;AAG3C;;GAEG;AACH,eAAO,MAAM,UAAU,uCAKb,CAAC;AAEX,MAAM,MAAM,UAAU,GAAG;IACxB,MAAM,CAAC,EAAE,MAAM,GAAG,CAAC,MAAM,OAAO,CAAC,MAAM,CAAC,CAAC,GAAG,SAAS,CAAC;IAEtD,UAAU,CAAC,EAAE,UAAU,CAAC;IACxB;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAC/B;;OAEG;IACH,WAAW,CAAC,EAAE,WAAW,CAAC;IAC1B,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,WAAW,CAAC,EAAE,MAAM,CAAC;CACrB,CAAC;AAEF,wBAAgB,oBAAoB,CAAC,OAAO,EAAE,UAAU,GAAG,GAAG,GAAG,IAAI,CAepE;AAED,eAAO,MAAM,YAAY;;;;;;CAOf,CAAC"}