livekit-plugins-elevenlabs 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- livekit/plugins/elevenlabs/tts.py +10 -4
- livekit/plugins/elevenlabs/version.py +1 -1
- {livekit_plugins_elevenlabs-0.1.2.dist-info → livekit_plugins_elevenlabs-0.1.3.dist-info}/METADATA +1 -1
- livekit_plugins_elevenlabs-0.1.3.dist-info/RECORD +8 -0
- livekit_plugins_elevenlabs-0.1.2.dist-info/RECORD +0 -8
- {livekit_plugins_elevenlabs-0.1.2.dist-info → livekit_plugins_elevenlabs-0.1.3.dist-info}/WHEEL +0 -0
- {livekit_plugins_elevenlabs-0.1.2.dist-info → livekit_plugins_elevenlabs-0.1.3.dist-info}/top_level.txt +0 -0
@@ -63,6 +63,8 @@ class TTSOptions:
|
|
63
63
|
voice: Voice
|
64
64
|
model_id: TTSModels
|
65
65
|
base_url: str
|
66
|
+
sample_rate: int
|
67
|
+
latency: int
|
66
68
|
|
67
69
|
|
68
70
|
class TTS(tts.TTS):
|
@@ -73,6 +75,8 @@ class TTS(tts.TTS):
|
|
73
75
|
model_id: TTSModels = "eleven_multilingual_v2",
|
74
76
|
api_key: Optional[str] = None,
|
75
77
|
base_url: Optional[str] = None,
|
78
|
+
sample_rate: int = 24000,
|
79
|
+
latency: int = 2,
|
76
80
|
) -> None:
|
77
81
|
super().__init__(streaming_supported=True)
|
78
82
|
api_key = api_key or os.environ.get("ELEVEN_API_KEY")
|
@@ -85,6 +89,8 @@ class TTS(tts.TTS):
|
|
85
89
|
model_id=model_id,
|
86
90
|
api_key=api_key,
|
87
91
|
base_url=base_url or API_BASE_URL_V1,
|
92
|
+
sample_rate=sample_rate,
|
93
|
+
latency=latency,
|
88
94
|
)
|
89
95
|
|
90
96
|
async def list_voices(self) -> List[Voice]:
|
@@ -134,11 +140,9 @@ class SynthesizeStream(tts.SynthesizeStream):
|
|
134
140
|
self,
|
135
141
|
session: aiohttp.ClientSession,
|
136
142
|
config: TTSOptions,
|
137
|
-
latency: int = 2, # [1-4] the higher the more optimized for streaming latency
|
138
143
|
):
|
139
144
|
self._config = config
|
140
145
|
self._session = session
|
141
|
-
self._latency = latency
|
142
146
|
|
143
147
|
self._queue = asyncio.Queue[str]()
|
144
148
|
self._event_queue = asyncio.Queue[tts.SynthesisEvent]()
|
@@ -157,7 +161,7 @@ class SynthesizeStream(tts.SynthesizeStream):
|
|
157
161
|
base_url = self._config.base_url
|
158
162
|
voice_id = self._config.voice.id
|
159
163
|
model_id = self._config.model_id
|
160
|
-
return f"{base_url}/text-to-speech/{voice_id}/stream-input?model_id={model_id}&output_format=
|
164
|
+
return f"{base_url}/text-to-speech/{voice_id}/stream-input?model_id={model_id}&output_format=pcm_{self._config.sample_rate}&optimize_streaming_latency={self._config.latency}"
|
161
165
|
|
162
166
|
def push_text(self, token: str) -> None:
|
163
167
|
if self._closed:
|
@@ -265,7 +269,7 @@ class SynthesizeStream(tts.SynthesizeStream):
|
|
265
269
|
data = base64.b64decode(msg["audio"])
|
266
270
|
audio_frame = rtc.AudioFrame(
|
267
271
|
data=data,
|
268
|
-
sample_rate=
|
272
|
+
sample_rate=self._config.sample_rate,
|
269
273
|
num_channels=1,
|
270
274
|
samples_per_channel=len(data) // 2,
|
271
275
|
)
|
@@ -277,6 +281,8 @@ class SynthesizeStream(tts.SynthesizeStream):
|
|
277
281
|
)
|
278
282
|
elif msg.get("isFinal"):
|
279
283
|
break
|
284
|
+
else:
|
285
|
+
logging.error(f"Unhandled message from ElevenLabs: {msg}")
|
280
286
|
|
281
287
|
async def flush(self) -> None:
|
282
288
|
self._queue.put_nowait(self._text + " ")
|
@@ -0,0 +1,8 @@
|
|
1
|
+
livekit/plugins/elevenlabs/__init__.py,sha256=-FQ-hnTqqbaVFa0sEu8CwInVp9vzkt-nRWkd34ruFFk,977
|
2
|
+
livekit/plugins/elevenlabs/models.py,sha256=g46mCMMHP3x3qtHmybHHMcid1UwmjKCcF0T4IWjMjWE,163
|
3
|
+
livekit/plugins/elevenlabs/tts.py,sha256=xfx22n3T85vyu0dAjObaPzaaJC7dFewU2ZLa47cIZhg,10160
|
4
|
+
livekit/plugins/elevenlabs/version.py,sha256=tpb8RDeB0haxcQ6bcP2ohrPerLn7AiijcHoutd5FqYg,600
|
5
|
+
livekit_plugins_elevenlabs-0.1.3.dist-info/METADATA,sha256=7f-98TJdfwIqJDHrICrppAo1o0gywcA8LoHWd-ETcAw,1360
|
6
|
+
livekit_plugins_elevenlabs-0.1.3.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
|
7
|
+
livekit_plugins_elevenlabs-0.1.3.dist-info/top_level.txt,sha256=OoDok3xUmXbZRvOrfvvXB-Juu4DX79dlq188E19YHoo,8
|
8
|
+
livekit_plugins_elevenlabs-0.1.3.dist-info/RECORD,,
|
@@ -1,8 +0,0 @@
|
|
1
|
-
livekit/plugins/elevenlabs/__init__.py,sha256=-FQ-hnTqqbaVFa0sEu8CwInVp9vzkt-nRWkd34ruFFk,977
|
2
|
-
livekit/plugins/elevenlabs/models.py,sha256=g46mCMMHP3x3qtHmybHHMcid1UwmjKCcF0T4IWjMjWE,163
|
3
|
-
livekit/plugins/elevenlabs/tts.py,sha256=kGFh5yCdAxss97wf-Z3mfQtxs7V8wXJmmnKlsOGTe30,9975
|
4
|
-
livekit/plugins/elevenlabs/version.py,sha256=S3xxF-H96nScSv_7l7IUvROJ0avu9oz5Gm6j673md_Y,600
|
5
|
-
livekit_plugins_elevenlabs-0.1.2.dist-info/METADATA,sha256=1R3mr6tpE6KWEyzseGy80VOifmjSdcv9vasuIKDk-Hs,1360
|
6
|
-
livekit_plugins_elevenlabs-0.1.2.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
|
7
|
-
livekit_plugins_elevenlabs-0.1.2.dist-info/top_level.txt,sha256=OoDok3xUmXbZRvOrfvvXB-Juu4DX79dlq188E19YHoo,8
|
8
|
-
livekit_plugins_elevenlabs-0.1.2.dist-info/RECORD,,
|
{livekit_plugins_elevenlabs-0.1.2.dist-info → livekit_plugins_elevenlabs-0.1.3.dist-info}/WHEEL
RENAMED
File without changes
|
File without changes
|