PyPI - deva-tts - Versions diffs - 0.1.0__py3-none-any.whl - Mend

deva-tts 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

deva_tts/__init__.py +8 -0
deva_tts/engine.py +155 -0
deva_tts/utils.py +10 -0
deva_tts-0.1.0.dist-info/METADATA +10 -0
deva_tts-0.1.0.dist-info/RECORD +7 -0
deva_tts-0.1.0.dist-info/WHEEL +5 -0
deva_tts-0.1.0.dist-info/top_level.txt +1 -0

deva_tts/__init__.py ADDED Viewed

@@ -0,0 +1,8 @@
+"""Public entry points of the deva_tts streaming text-to-speech package."""
+from .engine import (
+    feed_chunk,
+    set_voice,
+    start_engine,
+    stop_engine,
+)
+# Names re-exported from the engine module; this is the whole public API.
+__all__ = [
+    "start_engine",
+    "stop_engine",
+    "feed_chunk",
+    "set_voice",
+]

deva_tts/engine.py ADDED Viewed

@@ -0,0 +1,155 @@
+import asyncio
+import re
+import edge_tts
+import pyaudio
+import miniaudio
+from .utils import clean_text
+import aiohttp
+# Tasks created by start_engine(); stop_engine() awaits every entry.
+_background_tasks = []
+# Voice name handed to edge_tts.Communicate; replaced through set_voice().
+_VOICE = "en-US-EmmaMultilingualNeural"
+# Format shared by the MP3 decoder output and the playback stream:
+# 24000 Hz, one channel (samples are signed 16-bit, see paInt16 below).
+OUTPUT_SAMPLE_RATE = 24000
+CHANNELS = 1
+# Initialize PyAudio
+# NOTE: this runs at import time, so importing the module opens an output
+# stream; audio_playback() closes it and terminates PyAudio when it exits.
+p = pyaudio.PyAudio()
+audio_stream = p.open(
+    format=pyaudio.paInt16,
+    channels=CHANNELS,
+    rate=OUTPUT_SAMPLE_RATE,
+    output=True
+)
+# Hand-off queues between the pipeline stages:
+#   feed_chunk -> _chunk_queue -> text_parser -> _sentence_queue
+#   -> tts_worker -> _pcm_queue -> audio_playback
+# A None item on a queue is the end-of-stream marker for the consuming stage.
+_chunk_queue = asyncio.Queue()
+_sentence_queue = asyncio.Queue()
+_pcm_queue = asyncio.Queue()
+_DEFAULT_VOICE = "en-US-EmmaMultilingualNeural"
+def set_voice(voice: str = _DEFAULT_VOICE) -> None:
+    """Select the voice used for all subsequent synthesis requests.
+    Args:
+        voice: edge-tts voice name, e.g. ``"en-US-EmmaMultilingualNeural"``.
+    If edge_tts rejects the name with ``ValueError``, a warning is printed
+    and the engine really does fall back to the default voice, so the
+    printed message and the resulting state agree.
+    """
+    global _VOICE
+    try:
+        # Building a Communicate object is only a validity probe here; the
+        # instance itself is not needed, so it is not kept.
+        edge_tts.Communicate("hello", voice)
+    except ValueError:
+        print(f"[INVALID VOICE NAME] : {voice}")
+        print("falling back to default voice")
+        _VOICE = _DEFAULT_VOICE
+    else:
+        _VOICE = voice
+async def feed_chunk(chunk):
+    """Queue one piece of streamed text for sentence parsing.
+    Args:
+        chunk: text fragment to speak. ``None`` and ``""`` are ignored.
+    text_parser() treats any falsy item on the chunk queue as the
+    end-of-stream marker, so an empty fragment must never be enqueued from
+    here; shutting the pipeline down is stop_engine()'s job.
+    """
+    # `chunk != None or chunk != ""` is true for every value, which let empty
+    # fragments through and ended parsing early. Both cases are rejected now.
+    if chunk is None or chunk == "":
+        return
+    await _chunk_queue.put(chunk)
+async def text_parser():
+    """Split streamed text chunks into sentence batches for the TTS worker.
+    Reads chunks from ``_chunk_queue`` until a falsy item (the end-of-stream
+    marker) arrives. Complete sentences are cleaned with clean_text() and
+    queued on ``_sentence_queue`` in batches whose size grows from 1 to 5, so
+    the first audio starts quickly while later requests carry more text.
+    On shutdown any pending sentences and any unterminated tail text are
+    flushed, then ``None`` is queued to tell the worker to stop.
+    """
+    # Lazy prefix up to the first run of terminators that is followed by
+    # whitespace or the end of the buffer. Unlike `[^.!?]+[.!?]`, this still
+    # matches when the text contains "...", "3.14" or "!!" before the real
+    # sentence end, so the buffer can no longer get stuck.
+    sentence_end = re.compile(r'.+?[.!?]+(?=\s|$)', re.DOTALL)
+    buffer = ""
+    pending = []
+    target = 1
+    async def emit(sentences):
+        # Never queue an empty request; the worker would send it to the service.
+        text = " ".join(sentences).strip()
+        if text:
+            await _sentence_queue.put(text)
+    while True:
+        chunk = await _chunk_queue.get()
+        _chunk_queue.task_done()
+        if not chunk:
+            break
+        buffer += chunk
+        while True:
+            match = sentence_end.match(buffer)
+            if not match:
+                break
+            sentence = clean_text(match.group().strip())
+            # Only leading whitespace is dropped: a trailing space separates
+            # the last word from the next chunk and must survive.
+            buffer = buffer[match.end():].lstrip()
+            if not sentence:
+                continue
+            pending.append(sentence)
+            if len(pending) >= target:
+                print(f"[parser] sentence found: {sentence}")
+                await emit(pending[:target])
+                pending = pending[target:]
+                if target < 5:
+                    target += 1
+    # Text without closing punctuation is still part of what was fed in.
+    tail = clean_text(buffer.strip())
+    if tail:
+        pending.append(tail)
+    await emit(pending)
+    await _sentence_queue.put(None)
+async def tts_worker():
+    """Turn queued sentences into PCM audio for the playback stage.
+    For each item from ``_sentence_queue`` the text is synthesized with
+    edge_tts using the current ``_VOICE``, the MP3 stream is decoded with
+    miniaudio to signed 16-bit PCM at ``OUTPUT_SAMPLE_RATE``/``CHANNELS``,
+    and the bytes are queued on ``_pcm_queue``. A ``None`` item ends the loop.
+    Exactly one ``None`` is forwarded to ``_pcm_queue`` however the worker
+    ends (marker received, cancellation, or an unexpected exception), so the
+    playback stage is always released.
+    """
+    try:
+        while True:
+            sentence = await _sentence_queue.get()
+            try:
+                if sentence is None:
+                    break
+                if not sentence.strip():
+                    # Nothing to speak; do not send an empty request.
+                    continue
+                print(f"[TTS] generating audio for: {sentence}")
+                communicate = edge_tts.Communicate(sentence, _VOICE)
+                # bytearray grows in place; repeated bytes += copies each time.
+                mp3_buffer = bytearray()
+                async for chunk in communicate.stream():
+                    if chunk["type"] == "audio":
+                        mp3_buffer += chunk["data"]
+                if mp3_buffer:
+                    decoded = miniaudio.decode(
+                        bytes(mp3_buffer),
+                        output_format=miniaudio.SampleFormat.SIGNED16,
+                        nchannels=CHANNELS,
+                        sample_rate=OUTPUT_SAMPLE_RATE
+                    )
+                    await _pcm_queue.put(bytes(decoded.samples))
+            except aiohttp.client_exceptions.WSServerHandshakeError as e:
+                # Handshake rejected: report it and move on to the next sentence.
+                print(f"{e.status} : ")
+                if e.status == 403:
+                    print("="*60 + "\n")
+                    print(f"status : {e.status}")
+                    print("="*60)
+                    print("[DEVA_TTS_ERROR] CONNECTION BLOCKED")
+                    print("="*60)
+                    print("To fix this instantly, run this command in your terminal:")
+                    print("\n    python -m pip install --upgrade edge-tts\n")
+                    print("="*60 + "\n")
+                else:
+                    print("\n[DEVA_TTS] network error")
+            except asyncio.CancelledError:
+                # NOTE(review): cancellation during synthesis is absorbed so the
+                # worker ends normally, as before; confirm this is intended.
+                print("\n[TTS] Download violently interrupted. Shutting down worker.")
+                break
+            finally:
+                _sentence_queue.task_done()
+    finally:
+        await _pcm_queue.put(None)
+async def audio_playback():
+    """Play queued PCM segments on the module-level output stream.
+    Segments are taken from ``_pcm_queue`` and written to ``audio_stream`` in
+    8192-byte slices through the default executor, so the blocking write does
+    not stall the event loop. A ``None`` item ends playback. When the
+    coroutine ends for any reason the stream is stopped and closed and
+    PyAudio is terminated.
+    """
+    loop = asyncio.get_running_loop()
+    chunk_size = 8192
+    try:
+        while True:
+            pcm_data = await _pcm_queue.get()
+            try:
+                # Only None marks end-of-stream; an empty segment is skipped
+                # so it cannot cut off the audio that follows it.
+                if pcm_data is None:
+                    break
+                if not pcm_data:
+                    continue
+                print(f"[Player] Playing back sentence audio segment ({len(pcm_data)} bytes)...")
+                for start in range(0, len(pcm_data), chunk_size):
+                    sliced_data = pcm_data[start:start + chunk_size]
+                    await loop.run_in_executor(None, audio_stream.write, sliced_data)
+            finally:
+                _pcm_queue.task_done()
+    except asyncio.CancelledError:
+        print("stoping the process")
+    finally:
+        print("\n[System] Shutting down audio streams...")
+        audio_stream.stop_stream()
+        audio_stream.close()
+        p.terminate()
+        print("[System] Done.")
+async def start_engine():
+    """Start the parser, TTS and playback stages as background tasks.
+    Must be awaited inside a running event loop; each created task is
+    recorded in ``_background_tasks`` so stop_engine() can wait for it.
+    """
+    print("the engine is starting....")
+    # Same creation order as the data flow: text -> speech -> playback.
+    for stage in (text_parser, tts_worker, audio_playback):
+        _background_tasks.append(asyncio.create_task(stage()))
+async def stop_engine():
+    """Signal end-of-stream and wait for every pipeline stage to finish.
+    ``None`` is queued on ``_chunk_queue`` as the end-of-stream marker, then
+    all tasks recorded by start_engine() are awaited. An exception raised by
+    a stage propagates to the caller.
+    """
+    await _chunk_queue.put(None)
+    try:
+        await asyncio.gather(*_background_tasks)
+    finally:
+        # Drop the awaited tasks so a later call does not wait on them again
+        # or re-raise an error that was already reported.
+        _background_tasks.clear()

deva_tts/utils.py ADDED Viewed

@@ -0,0 +1,10 @@
+import re
+import emoji
+def clean_text(text: str) -> str:
+    """Return *text* with markup characters, emoji and URLs removed.
+    The three removals run in this order: the characters `` ` * # ~ | ``,
+    then emoji (via ``emoji.replace_emoji``), then ``http(s)://`` and
+    ``www.`` links. Nothing else (including whitespace) is normalized.
+    """
+    without_markup = re.sub(r'[`*#~|]', '', text)
+    without_emoji = emoji.replace_emoji(without_markup, '')
+    return re.sub(r'https?://\S+|www\.\S+', '', without_emoji)

deva_tts-0.1.0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,10 @@
+Metadata-Version: 2.4
+Name: deva_tts
+Version: 0.1.0
+Summary: A real-time, streaming text-to-speech engine.
+Requires-Dist: edge-tts
+Requires-Dist: pyaudio
+Requires-Dist: miniaudio
+Requires-Dist: emoji
+Dynamic: requires-dist
+Dynamic: summary

deva_tts-0.1.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,7 @@
+deva_tts/__init__.py,sha256=6L9qJJvIJYaRupkD7QCKnGm74c9PHfl8JmyCRUQmsFU,160
+deva_tts/engine.py,sha256=8FnSUI9i4y4fsCFeO3mhRUmWK4kLn_e2MI8xmA8f3j0,5223
+deva_tts/utils.py,sha256=rkhUIYd25NAP33hXXYFL9kNHTUfzWDm4TUeCtLDOwmg,219
+deva_tts-0.1.0.dist-info/METADATA,sha256=SaBI7i6r9wjaOno_NDhlTXrSWEZWB7OWPg_yGH4traI,250
+deva_tts-0.1.0.dist-info/WHEEL,sha256=aeYiig01lYGDzBgS8HxWXOg3uV61G9ijOsup-k9o1sk,91
+deva_tts-0.1.0.dist-info/top_level.txt,sha256=Lq8h-sBoyHMN0UhjFspiP7T_p5FjmOv0LaVC89RC-ZU,9
+deva_tts-0.1.0.dist-info/RECORD,,

deva_tts-0.1.0.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,5 @@
+Wheel-Version: 1.0
+Generator: setuptools (82.0.1)
+Root-Is-Purelib: true
+Tag: py3-none-any

deva_tts-0.1.0.dist-info/top_level.txt ADDED Viewed

@@ -0,0 +1 @@
+deva_tts