webscout 8.2.7__py3-none-any.whl → 8.2.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of webscout might be problematic. Click here for more details.
- webscout/AIauto.py +1 -1
- webscout/AIutel.py +298 -249
- webscout/Extra/Act.md +309 -0
- webscout/Extra/GitToolkit/__init__.py +10 -0
- webscout/Extra/GitToolkit/gitapi/README.md +110 -0
- webscout/Extra/GitToolkit/gitapi/__init__.py +12 -0
- webscout/Extra/GitToolkit/gitapi/repository.py +195 -0
- webscout/Extra/GitToolkit/gitapi/user.py +96 -0
- webscout/Extra/GitToolkit/gitapi/utils.py +62 -0
- webscout/Extra/YTToolkit/README.md +375 -0
- webscout/Extra/YTToolkit/YTdownloader.py +957 -0
- webscout/Extra/YTToolkit/__init__.py +3 -0
- webscout/Extra/YTToolkit/transcriber.py +476 -0
- webscout/Extra/YTToolkit/ytapi/README.md +44 -0
- webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
- webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
- webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
- webscout/Extra/YTToolkit/ytapi/extras.py +118 -0
- webscout/Extra/YTToolkit/ytapi/https.py +88 -0
- webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
- webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
- webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
- webscout/Extra/YTToolkit/ytapi/query.py +40 -0
- webscout/Extra/YTToolkit/ytapi/stream.py +63 -0
- webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
- webscout/Extra/YTToolkit/ytapi/video.py +232 -0
- webscout/Extra/__init__.py +7 -0
- webscout/Extra/autocoder/__init__.py +9 -0
- webscout/Extra/autocoder/autocoder.py +1105 -0
- webscout/Extra/autocoder/autocoder_utiles.py +332 -0
- webscout/Extra/gguf.md +430 -0
- webscout/Extra/gguf.py +684 -0
- webscout/Extra/tempmail/README.md +488 -0
- webscout/Extra/tempmail/__init__.py +28 -0
- webscout/Extra/tempmail/async_utils.py +141 -0
- webscout/Extra/tempmail/base.py +161 -0
- webscout/Extra/tempmail/cli.py +187 -0
- webscout/Extra/tempmail/emailnator.py +84 -0
- webscout/Extra/tempmail/mail_tm.py +361 -0
- webscout/Extra/tempmail/temp_mail_io.py +292 -0
- webscout/Extra/weather.md +281 -0
- webscout/Extra/weather.py +194 -0
- webscout/Extra/weather_ascii.py +76 -0
- webscout/Litlogger/Readme.md +175 -0
- webscout/Litlogger/__init__.py +67 -0
- webscout/Litlogger/core/__init__.py +6 -0
- webscout/Litlogger/core/level.py +23 -0
- webscout/Litlogger/core/logger.py +165 -0
- webscout/Litlogger/handlers/__init__.py +12 -0
- webscout/Litlogger/handlers/console.py +33 -0
- webscout/Litlogger/handlers/file.py +143 -0
- webscout/Litlogger/handlers/network.py +173 -0
- webscout/Litlogger/styles/__init__.py +7 -0
- webscout/Litlogger/styles/colors.py +249 -0
- webscout/Litlogger/styles/formats.py +458 -0
- webscout/Litlogger/styles/text.py +87 -0
- webscout/Litlogger/utils/__init__.py +6 -0
- webscout/Litlogger/utils/detectors.py +153 -0
- webscout/Litlogger/utils/formatters.py +200 -0
- webscout/Provider/AI21.py +177 -0
- webscout/Provider/AISEARCH/DeepFind.py +254 -0
- webscout/Provider/AISEARCH/Perplexity.py +359 -0
- webscout/Provider/AISEARCH/README.md +279 -0
- webscout/Provider/AISEARCH/__init__.py +9 -0
- webscout/Provider/AISEARCH/felo_search.py +228 -0
- webscout/Provider/AISEARCH/genspark_search.py +350 -0
- webscout/Provider/AISEARCH/hika_search.py +198 -0
- webscout/Provider/AISEARCH/iask_search.py +436 -0
- webscout/Provider/AISEARCH/monica_search.py +246 -0
- webscout/Provider/AISEARCH/scira_search.py +324 -0
- webscout/Provider/AISEARCH/webpilotai_search.py +281 -0
- webscout/Provider/Aitopia.py +316 -0
- webscout/Provider/AllenAI.py +440 -0
- webscout/Provider/Andi.py +228 -0
- webscout/Provider/Blackboxai.py +673 -0
- webscout/Provider/ChatGPTClone.py +237 -0
- webscout/Provider/ChatGPTGratis.py +194 -0
- webscout/Provider/ChatSandbox.py +342 -0
- webscout/Provider/Cloudflare.py +324 -0
- webscout/Provider/Cohere.py +208 -0
- webscout/Provider/Deepinfra.py +340 -0
- webscout/Provider/ExaAI.py +261 -0
- webscout/Provider/ExaChat.py +358 -0
- webscout/Provider/Flowith.py +217 -0
- webscout/Provider/FreeGemini.py +250 -0
- webscout/Provider/Gemini.py +169 -0
- webscout/Provider/GithubChat.py +370 -0
- webscout/Provider/GizAI.py +295 -0
- webscout/Provider/Glider.py +225 -0
- webscout/Provider/Groq.py +801 -0
- webscout/Provider/HF_space/__init__.py +0 -0
- webscout/Provider/HF_space/qwen_qwen2.py +206 -0
- webscout/Provider/HeckAI.py +285 -0
- webscout/Provider/HuggingFaceChat.py +469 -0
- webscout/Provider/Hunyuan.py +283 -0
- webscout/Provider/Jadve.py +291 -0
- webscout/Provider/Koboldai.py +384 -0
- webscout/Provider/LambdaChat.py +411 -0
- webscout/Provider/Llama3.py +259 -0
- webscout/Provider/MCPCore.py +315 -0
- webscout/Provider/Marcus.py +198 -0
- webscout/Provider/Nemotron.py +218 -0
- webscout/Provider/Netwrck.py +270 -0
- webscout/Provider/OLLAMA.py +396 -0
- webscout/Provider/OPENAI/BLACKBOXAI.py +735 -0
- webscout/Provider/OPENAI/Cloudflare.py +378 -0
- webscout/Provider/OPENAI/FreeGemini.py +282 -0
- webscout/Provider/OPENAI/NEMOTRON.py +244 -0
- webscout/Provider/OPENAI/README.md +1253 -0
- webscout/Provider/OPENAI/__init__.py +36 -0
- webscout/Provider/OPENAI/ai4chat.py +293 -0
- webscout/Provider/OPENAI/api.py +810 -0
- webscout/Provider/OPENAI/base.py +249 -0
- webscout/Provider/OPENAI/c4ai.py +373 -0
- webscout/Provider/OPENAI/chatgpt.py +556 -0
- webscout/Provider/OPENAI/chatgptclone.py +488 -0
- webscout/Provider/OPENAI/chatsandbox.py +172 -0
- webscout/Provider/OPENAI/deepinfra.py +319 -0
- webscout/Provider/OPENAI/e2b.py +1356 -0
- webscout/Provider/OPENAI/exaai.py +411 -0
- webscout/Provider/OPENAI/exachat.py +443 -0
- webscout/Provider/OPENAI/flowith.py +162 -0
- webscout/Provider/OPENAI/freeaichat.py +359 -0
- webscout/Provider/OPENAI/glider.py +323 -0
- webscout/Provider/OPENAI/groq.py +361 -0
- webscout/Provider/OPENAI/heckai.py +307 -0
- webscout/Provider/OPENAI/llmchatco.py +335 -0
- webscout/Provider/OPENAI/mcpcore.py +383 -0
- webscout/Provider/OPENAI/multichat.py +376 -0
- webscout/Provider/OPENAI/netwrck.py +356 -0
- webscout/Provider/OPENAI/opkfc.py +496 -0
- webscout/Provider/OPENAI/scirachat.py +471 -0
- webscout/Provider/OPENAI/sonus.py +303 -0
- webscout/Provider/OPENAI/standardinput.py +433 -0
- webscout/Provider/OPENAI/textpollinations.py +339 -0
- webscout/Provider/OPENAI/toolbaz.py +413 -0
- webscout/Provider/OPENAI/typefully.py +355 -0
- webscout/Provider/OPENAI/typegpt.py +358 -0
- webscout/Provider/OPENAI/uncovrAI.py +462 -0
- webscout/Provider/OPENAI/utils.py +307 -0
- webscout/Provider/OPENAI/venice.py +425 -0
- webscout/Provider/OPENAI/wisecat.py +381 -0
- webscout/Provider/OPENAI/writecream.py +163 -0
- webscout/Provider/OPENAI/x0gpt.py +378 -0
- webscout/Provider/OPENAI/yep.py +356 -0
- webscout/Provider/OpenGPT.py +209 -0
- webscout/Provider/Openai.py +496 -0
- webscout/Provider/PI.py +429 -0
- webscout/Provider/Perplexitylabs.py +415 -0
- webscout/Provider/QwenLM.py +254 -0
- webscout/Provider/Reka.py +214 -0
- webscout/Provider/StandardInput.py +290 -0
- webscout/Provider/TTI/AiForce/README.md +159 -0
- webscout/Provider/TTI/AiForce/__init__.py +22 -0
- webscout/Provider/TTI/AiForce/async_aiforce.py +224 -0
- webscout/Provider/TTI/AiForce/sync_aiforce.py +245 -0
- webscout/Provider/TTI/FreeAIPlayground/README.md +99 -0
- webscout/Provider/TTI/FreeAIPlayground/__init__.py +9 -0
- webscout/Provider/TTI/FreeAIPlayground/async_freeaiplayground.py +181 -0
- webscout/Provider/TTI/FreeAIPlayground/sync_freeaiplayground.py +180 -0
- webscout/Provider/TTI/ImgSys/README.md +174 -0
- webscout/Provider/TTI/ImgSys/__init__.py +23 -0
- webscout/Provider/TTI/ImgSys/async_imgsys.py +202 -0
- webscout/Provider/TTI/ImgSys/sync_imgsys.py +195 -0
- webscout/Provider/TTI/MagicStudio/README.md +101 -0
- webscout/Provider/TTI/MagicStudio/__init__.py +2 -0
- webscout/Provider/TTI/MagicStudio/async_magicstudio.py +111 -0
- webscout/Provider/TTI/MagicStudio/sync_magicstudio.py +109 -0
- webscout/Provider/TTI/Nexra/README.md +155 -0
- webscout/Provider/TTI/Nexra/__init__.py +22 -0
- webscout/Provider/TTI/Nexra/async_nexra.py +286 -0
- webscout/Provider/TTI/Nexra/sync_nexra.py +258 -0
- webscout/Provider/TTI/PollinationsAI/README.md +146 -0
- webscout/Provider/TTI/PollinationsAI/__init__.py +23 -0
- webscout/Provider/TTI/PollinationsAI/async_pollinations.py +311 -0
- webscout/Provider/TTI/PollinationsAI/sync_pollinations.py +265 -0
- webscout/Provider/TTI/README.md +128 -0
- webscout/Provider/TTI/__init__.py +12 -0
- webscout/Provider/TTI/aiarta/README.md +134 -0
- webscout/Provider/TTI/aiarta/__init__.py +2 -0
- webscout/Provider/TTI/aiarta/async_aiarta.py +482 -0
- webscout/Provider/TTI/aiarta/sync_aiarta.py +440 -0
- webscout/Provider/TTI/artbit/README.md +100 -0
- webscout/Provider/TTI/artbit/__init__.py +22 -0
- webscout/Provider/TTI/artbit/async_artbit.py +155 -0
- webscout/Provider/TTI/artbit/sync_artbit.py +148 -0
- webscout/Provider/TTI/fastflux/README.md +129 -0
- webscout/Provider/TTI/fastflux/__init__.py +22 -0
- webscout/Provider/TTI/fastflux/async_fastflux.py +261 -0
- webscout/Provider/TTI/fastflux/sync_fastflux.py +252 -0
- webscout/Provider/TTI/huggingface/README.md +114 -0
- webscout/Provider/TTI/huggingface/__init__.py +22 -0
- webscout/Provider/TTI/huggingface/async_huggingface.py +199 -0
- webscout/Provider/TTI/huggingface/sync_huggingface.py +195 -0
- webscout/Provider/TTI/piclumen/README.md +161 -0
- webscout/Provider/TTI/piclumen/__init__.py +23 -0
- webscout/Provider/TTI/piclumen/async_piclumen.py +268 -0
- webscout/Provider/TTI/piclumen/sync_piclumen.py +233 -0
- webscout/Provider/TTI/pixelmuse/README.md +79 -0
- webscout/Provider/TTI/pixelmuse/__init__.py +4 -0
- webscout/Provider/TTI/pixelmuse/async_pixelmuse.py +249 -0
- webscout/Provider/TTI/pixelmuse/sync_pixelmuse.py +182 -0
- webscout/Provider/TTI/talkai/README.md +139 -0
- webscout/Provider/TTI/talkai/__init__.py +4 -0
- webscout/Provider/TTI/talkai/async_talkai.py +229 -0
- webscout/Provider/TTI/talkai/sync_talkai.py +207 -0
- webscout/Provider/TTS/README.md +192 -0
- webscout/Provider/TTS/__init__.py +9 -0
- webscout/Provider/TTS/base.py +159 -0
- webscout/Provider/TTS/deepgram.py +156 -0
- webscout/Provider/TTS/elevenlabs.py +111 -0
- webscout/Provider/TTS/gesserit.py +128 -0
- webscout/Provider/TTS/murfai.py +113 -0
- webscout/Provider/TTS/parler.py +111 -0
- webscout/Provider/TTS/speechma.py +580 -0
- webscout/Provider/TTS/sthir.py +94 -0
- webscout/Provider/TTS/streamElements.py +333 -0
- webscout/Provider/TTS/utils.py +280 -0
- webscout/Provider/TeachAnything.py +229 -0
- webscout/Provider/TextPollinationsAI.py +308 -0
- webscout/Provider/TwoAI.py +280 -0
- webscout/Provider/TypliAI.py +305 -0
- webscout/Provider/UNFINISHED/ChatHub.py +209 -0
- webscout/Provider/UNFINISHED/Youchat.py +330 -0
- webscout/Provider/UNFINISHED/liner_api_request.py +263 -0
- webscout/Provider/UNFINISHED/oivscode.py +351 -0
- webscout/Provider/UNFINISHED/test_lmarena.py +119 -0
- webscout/Provider/Venice.py +258 -0
- webscout/Provider/VercelAI.py +253 -0
- webscout/Provider/WiseCat.py +233 -0
- webscout/Provider/WrDoChat.py +370 -0
- webscout/Provider/Writecream.py +246 -0
- webscout/Provider/WritingMate.py +269 -0
- webscout/Provider/__init__.py +172 -0
- webscout/Provider/ai4chat.py +149 -0
- webscout/Provider/akashgpt.py +335 -0
- webscout/Provider/asksteve.py +220 -0
- webscout/Provider/cerebras.py +290 -0
- webscout/Provider/chatglm.py +215 -0
- webscout/Provider/cleeai.py +213 -0
- webscout/Provider/copilot.py +425 -0
- webscout/Provider/elmo.py +283 -0
- webscout/Provider/freeaichat.py +285 -0
- webscout/Provider/geminiapi.py +208 -0
- webscout/Provider/granite.py +235 -0
- webscout/Provider/hermes.py +266 -0
- webscout/Provider/julius.py +223 -0
- webscout/Provider/koala.py +170 -0
- webscout/Provider/learnfastai.py +325 -0
- webscout/Provider/llama3mitril.py +215 -0
- webscout/Provider/llmchat.py +258 -0
- webscout/Provider/llmchatco.py +306 -0
- webscout/Provider/lmarena.py +198 -0
- webscout/Provider/meta.py +801 -0
- webscout/Provider/multichat.py +364 -0
- webscout/Provider/samurai.py +223 -0
- webscout/Provider/scira_chat.py +299 -0
- webscout/Provider/scnet.py +243 -0
- webscout/Provider/searchchat.py +292 -0
- webscout/Provider/sonus.py +258 -0
- webscout/Provider/talkai.py +194 -0
- webscout/Provider/toolbaz.py +353 -0
- webscout/Provider/turboseek.py +266 -0
- webscout/Provider/typefully.py +202 -0
- webscout/Provider/typegpt.py +289 -0
- webscout/Provider/uncovr.py +368 -0
- webscout/Provider/x0gpt.py +299 -0
- webscout/Provider/yep.py +389 -0
- webscout/__init__.py +4 -2
- webscout/cli.py +3 -28
- webscout/conversation.py +35 -35
- webscout/litagent/Readme.md +276 -0
- webscout/litagent/__init__.py +29 -0
- webscout/litagent/agent.py +455 -0
- webscout/litagent/constants.py +60 -0
- webscout/litprinter/__init__.py +59 -0
- webscout/scout/README.md +402 -0
- webscout/scout/__init__.py +8 -0
- webscout/scout/core/__init__.py +7 -0
- webscout/scout/core/crawler.py +140 -0
- webscout/scout/core/scout.py +568 -0
- webscout/scout/core/search_result.py +96 -0
- webscout/scout/core/text_analyzer.py +63 -0
- webscout/scout/core/text_utils.py +277 -0
- webscout/scout/core/web_analyzer.py +52 -0
- webscout/scout/element.py +460 -0
- webscout/scout/parsers/__init__.py +69 -0
- webscout/scout/parsers/html5lib_parser.py +172 -0
- webscout/scout/parsers/html_parser.py +236 -0
- webscout/scout/parsers/lxml_parser.py +178 -0
- webscout/scout/utils.py +37 -0
- webscout/swiftcli/Readme.md +323 -0
- webscout/swiftcli/__init__.py +95 -0
- webscout/swiftcli/core/__init__.py +7 -0
- webscout/swiftcli/core/cli.py +297 -0
- webscout/swiftcli/core/context.py +104 -0
- webscout/swiftcli/core/group.py +241 -0
- webscout/swiftcli/decorators/__init__.py +28 -0
- webscout/swiftcli/decorators/command.py +221 -0
- webscout/swiftcli/decorators/options.py +220 -0
- webscout/swiftcli/decorators/output.py +252 -0
- webscout/swiftcli/exceptions.py +21 -0
- webscout/swiftcli/plugins/__init__.py +9 -0
- webscout/swiftcli/plugins/base.py +135 -0
- webscout/swiftcli/plugins/manager.py +262 -0
- webscout/swiftcli/utils/__init__.py +59 -0
- webscout/swiftcli/utils/formatting.py +252 -0
- webscout/swiftcli/utils/parsing.py +267 -0
- webscout/version.py +1 -1
- webscout/webscout_search.py +2 -182
- webscout/webscout_search_async.py +1 -179
- webscout/zeroart/README.md +89 -0
- webscout/zeroart/__init__.py +135 -0
- webscout/zeroart/base.py +66 -0
- webscout/zeroart/effects.py +101 -0
- webscout/zeroart/fonts.py +1239 -0
- {webscout-8.2.7.dist-info → webscout-8.2.8.dist-info}/METADATA +115 -60
- webscout-8.2.8.dist-info/RECORD +334 -0
- {webscout-8.2.7.dist-info → webscout-8.2.8.dist-info}/WHEEL +1 -1
- webscout-8.2.7.dist-info/RECORD +0 -26
- {webscout-8.2.7.dist-info → webscout-8.2.8.dist-info}/entry_points.txt +0 -0
- {webscout-8.2.7.dist-info → webscout-8.2.8.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.2.7.dist-info → webscout-8.2.8.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,159 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Base class for TTS providers with common functionality.
|
|
3
|
+
"""
|
|
4
|
+
import os
|
|
5
|
+
import tempfile
|
|
6
|
+
from pathlib import Path
|
|
7
|
+
from typing import Generator, Optional
|
|
8
|
+
from webscout.AIbase import TTSProvider
|
|
9
|
+
|
|
10
|
+
class BaseTTSProvider(TTSProvider):
    """
    Base class for TTS providers with common functionality.

    This class implements common methods like save_audio and stream_audio
    that can be used by all TTS providers. ``stream_audio`` calls
    ``self.tts(text, voice=..., verbose=...)``, which is not defined in this
    class and has to be supplied by the concrete provider (or a parent class).
    """

    def __init__(self):
        """Initialize the base TTS provider.

        Creates a fresh scratch directory (prefix ``webscout_tts_``) and
        stores its path in ``self.temp_dir``. Nothing in this class removes
        the directory afterwards.
        """
        self.temp_dir = tempfile.mkdtemp(prefix="webscout_tts_")

    @staticmethod
    def _default_destination(suffix: str) -> str:
        """Return an unused ``tts_audio_<timestamp><suffix>`` path in the current directory."""
        import time

        stem = os.path.join(os.getcwd(), f"tts_audio_{int(time.time())}")
        candidate = f"{stem}{suffix}"
        counter = 1
        # The timestamp has one-second resolution, so two saves in the same
        # second would otherwise overwrite each other; add a numeric suffix.
        while os.path.exists(candidate):
            candidate = f"{stem}_{counter}{suffix}"
            counter += 1
        return candidate

    def save_audio(self, audio_file: str, destination: Optional[str] = None, verbose: bool = False) -> str:
        """
        Save audio to a specific destination.

        Args:
            audio_file (str): Path to the source audio file
            destination (str, optional): Destination file path, or an existing
                directory to copy into. Defaults to a timestamped file in the
                current directory.
            verbose (bool, optional): Whether to print debug information. Defaults to False.

        Returns:
            str: Path to the saved audio file. When ``destination`` is an
                existing directory this is the file created inside it.

        Raises:
            FileNotFoundError: If the audio file doesn't exist
        """
        import shutil

        source_path = Path(audio_file)
        if not source_path.exists():
            raise FileNotFoundError(f"Audio file not found: {audio_file}")

        if destination is None:
            destination = self._default_destination(source_path.suffix)

        # Ensure the destination's parent directory exists
        os.makedirs(os.path.dirname(os.path.abspath(destination)), exist_ok=True)

        # copy2 returns the path it actually wrote, which differs from
        # ``destination`` when that argument names an existing directory.
        saved_path = shutil.copy2(source_path, destination)

        if verbose:
            print(f"[debug] Audio saved to {saved_path}")

        return saved_path

    def stream_audio(self, text: str, voice: Optional[str] = None, chunk_size: int = 1024, verbose: bool = False) -> Generator[bytes, None, None]:
        """
        Stream audio in chunks.

        The whole audio file is generated first via ``self.tts`` and then read
        back from disk piece by piece.

        Args:
            text (str): The text to convert to speech
            voice (str, optional): The voice to use; passed to ``self.tts`` unchanged.
            chunk_size (int, optional): Size of audio chunks to yield. Defaults to 1024.
            verbose (bool, optional): Whether to print debug information. Defaults to False.

        Yields:
            bytes: Audio data chunks of at most ``chunk_size`` bytes
        """
        # Generate the audio file
        audio_file = self.tts(text, voice=voice, verbose=verbose)

        # Stream the file in chunks; an empty read marks end of file
        with open(audio_file, 'rb') as f:
            while chunk := f.read(chunk_size):
                yield chunk
|
|
81
|
+
|
|
82
|
+
|
|
83
|
+
class AsyncBaseTTSProvider:
    """
    Base class for async TTS providers with common functionality.

    This class implements common async methods like save_audio and stream_audio
    that can be used by all async TTS providers. ``stream_audio`` awaits
    ``self.tts(text, voice=..., verbose=...)``, which is not defined in this
    class and has to be supplied by the concrete provider.
    """

    def __init__(self):
        """Initialize the async base TTS provider.

        Creates a fresh scratch directory (prefix ``webscout_tts_``) and
        stores its path in ``self.temp_dir``. Nothing in this class removes
        the directory afterwards.
        """
        self.temp_dir = tempfile.mkdtemp(prefix="webscout_tts_")

    @staticmethod
    def _default_destination(suffix: str) -> str:
        """Return an unused ``tts_audio_<timestamp><suffix>`` path in the current directory."""
        import time

        stem = os.path.join(os.getcwd(), f"tts_audio_{int(time.time())}")
        candidate = f"{stem}{suffix}"
        counter = 1
        # The timestamp has one-second resolution, so two saves in the same
        # second would otherwise overwrite each other; add a numeric suffix.
        while os.path.exists(candidate):
            candidate = f"{stem}_{counter}{suffix}"
            counter += 1
        return candidate

    async def save_audio(self, audio_file: str, destination: Optional[str] = None, verbose: bool = False) -> str:
        """
        Save audio to a specific destination asynchronously.

        Args:
            audio_file (str): Path to the source audio file
            destination (str, optional): Destination file path, or an existing
                directory to copy into. Defaults to a timestamped file in the
                current directory.
            verbose (bool, optional): Whether to print debug information. Defaults to False.

        Returns:
            str: Path to the saved audio file. When ``destination`` is an
                existing directory this is the file created inside it.

        Raises:
            FileNotFoundError: If the audio file doesn't exist
        """
        import asyncio
        import shutil

        source_path = Path(audio_file)
        if not source_path.exists():
            raise FileNotFoundError(f"Audio file not found: {audio_file}")

        if destination is None:
            destination = self._default_destination(source_path.suffix)

        # Ensure the destination's parent directory exists
        os.makedirs(os.path.dirname(os.path.abspath(destination)), exist_ok=True)

        # Run the copy in a worker thread so the event loop is not blocked.
        # copy2 returns the path it actually wrote, which differs from
        # ``destination`` when that argument names an existing directory.
        saved_path = await asyncio.to_thread(shutil.copy2, source_path, destination)

        if verbose:
            print(f"[debug] Audio saved to {saved_path}")

        return saved_path

    async def stream_audio(self, text: str, voice: Optional[str] = None, chunk_size: int = 1024, verbose: bool = False):
        """
        Stream audio in chunks asynchronously.

        The whole audio file is generated first by awaiting ``self.tts`` and is
        then read back from disk piece by piece with ``aiofiles``.

        Args:
            text (str): The text to convert to speech
            voice (str, optional): The voice to use; passed to ``self.tts`` unchanged.
            chunk_size (int, optional): Size of audio chunks to yield. Defaults to 1024.
            verbose (bool, optional): Whether to print debug information. Defaults to False.

        Yields:
            bytes: Audio data chunks of at most ``chunk_size`` bytes

        Raises:
            ImportError: If the optional ``aiofiles`` package is not installed
        """
        # aiofiles is imported lazily so the class can be used without it
        # as long as streaming is never requested.
        try:
            import aiofiles
        except ImportError as exc:
            raise ImportError("The 'aiofiles' package is required for async streaming. Install it with 'pip install aiofiles'.") from exc

        # Generate the audio file
        audio_file = await self.tts(text, voice=voice, verbose=verbose)

        # Stream the file in chunks; an empty read marks end of file
        async with aiofiles.open(audio_file, 'rb') as f:
            while chunk := await f.read(chunk_size):
                yield chunk
|
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import base64
|
|
5
|
+
import tempfile
|
|
6
|
+
from io import BytesIO
|
|
7
|
+
from webscout import exceptions
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from webscout.litagent import LitAgent
|
|
10
|
+
from . import utils
|
|
11
|
+
from .base import BaseTTSProvider
|
|
12
|
+
|
|
13
|
+
class DeepgramTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the DeepgramTTS API.

    The input text is split into sentences, each sentence is sent to the
    endpoint in its own request (concurrently), and the decoded audio pieces
    are concatenated in sentence order into one ``.mp3`` file inside
    ``self.temp_dir``.
    """
    # Request headers. The User-Agent is chosen once, when the class body is
    # executed, and is therefore shared by every instance.
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Maps the public voice name to the model identifier sent in the payload.
    all_voices: dict[str, str] = {
        "Asteria": "aura-asteria-en", "Arcas": "aura-arcas-en", "Luna": "aura-luna-en",
        "Zeus": "aura-zeus-en", "Orpheus": "aura-orpheus-en", "Angus": "aura-angus-en",
        "Athena": "aura-athena-en", "Helios": "aura-helios-en", "Hera": "aura-hera-en",
        "Orion": "aura-orion-en", "Perseus": "aura-perseus-en", "Stella": "aura-stella-en"
    }

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """Initializes the DeepgramTTS TTS client.

        Args:
            timeout (int): Per-request timeout passed to ``requests`` (default: 20)
            proxies (dict, optional): Proxy mapping applied to the session when given
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Asteria", verbose: bool = True) -> str:
        """
        Converts text to speech using the DeepgramTTS API and saves it to a file.

        Args:
            text (str): The text to convert to speech
            voice (str): The voice to use for TTS; must be a key of
                ``all_voices`` (default: "Asteria"). The previous default,
                "Brian", is not a Deepgram voice and always failed validation.
            verbose (bool): Whether to print progress messages (default: True)

        Returns:
            str: Path to the generated audio file

        Raises:
            AssertionError: If the specified voice is not available
            RuntimeError: If any chunk cannot be generated or the audio
                cannot be written; the underlying error is chained as the cause
        """
        # Raised explicitly rather than via ``assert`` so the check still runs
        # under ``python -O``; the exception type is unchanged for callers.
        if voice not in self.all_voices:
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        url = "https://deepgram.com/api/ttsAudioGeneration"
        model = self.all_voices[voice]

        # Split text into sentences using the utils module
        sentences = utils.split_sentences(text)
        if verbose:
            for index, sen in enumerate(sentences):
                print(f"[debug] Sentence {index}: {sen}")

        def generate_audio_for_chunk(part_text: str, part_number: int):
            """
            Generate audio for a single chunk of text.

            Makes up to three attempts, pausing one second between them.

            Args:
                part_text (str): The text chunk to convert
                part_number (int): The chunk number for ordering

            Returns:
                tuple: (part_number, audio_data)

            Raises:
                requests.RequestException: If the final attempt hits an API error
                RuntimeError: If every attempt succeeded at HTTP level but
                    returned no ``data`` field
            """
            max_retries = 3

            for attempt in range(1, max_retries + 1):
                try:
                    response = self.session.post(
                        url=url,
                        headers=self.headers,
                        json={"text": part_text, "model": model},
                        stream=True,
                        timeout=self.timeout
                    )
                    response.raise_for_status()
                    response_data = response.json().get('data')
                except requests.RequestException as e:
                    if verbose:
                        print(f"[debug] Error processing chunk {part_number}: {str(e)}. Attempt {attempt}/{max_retries}")
                    if attempt == max_retries:
                        raise
                else:
                    if response_data:
                        # The endpoint returns the audio base64-encoded under "data"
                        audio_data = base64.b64decode(response_data)
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, audio_data

                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Attempt {attempt}/{max_retries}")

                # Back off before the next attempt; no point waiting after the last one
                if attempt < max_retries:
                    time.sleep(1)

            raise RuntimeError(f"Failed to generate audio for chunk {part_number} after {max_retries} attempts")

        try:
            # Using ThreadPoolExecutor to handle requests concurrently
            with ThreadPoolExecutor() as executor:
                futures = {
                    executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                    for chunk_num, sentence in enumerate(sentences, start=1)
                }

                # Results arrive in completion order; key them by chunk number
                # so they can be written out in sentence order afterwards.
                audio_chunks = {}

                for future in as_completed(futures):
                    chunk_num = futures[future]
                    try:
                        part_number, audio_data = future.result()
                    except Exception as e:
                        raise RuntimeError(f"Failed to generate audio for chunk {chunk_num}: {str(e)}") from e
                    audio_chunks[part_number] = audio_data

            # Combine all audio chunks in order. NamedTemporaryFile creates the
            # file atomically (unlike the deprecated tempfile.mktemp) and
            # delete=False keeps it on disk for the caller.
            with tempfile.NamedTemporaryFile(suffix=".mp3", dir=self.temp_dir, delete=False) as f:
                for chunk_num in sorted(audio_chunks):
                    f.write(audio_chunks[chunk_num])
                filename = f.name

            if verbose:
                print(f"[debug] Audio saved to {filename}")
            return str(filename)

        except Exception as e:
            if verbose:
                print(f"[debug] Failed to generate audio: {str(e)}")
            raise RuntimeError(f"Failed to generate audio: {str(e)}") from e
|
|
148
|
+
|
|
149
|
+
# Example usage
|
|
150
|
+
if __name__ == "__main__":
    # Manual smoke test: synthesize a short multi-sentence sample with the
    # "Asteria" voice and report where the resulting file was written.
    client = DeepgramTTS()
    sample_text = (
        "This is a test of the DeepgramTTS text-to-speech API. "
        "It supports multiple sentences. Let's see how it works!"
    )

    print("[debug] Generating audio...")
    output_path = client.tts(sample_text, voice="Asteria")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import tempfile
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from webscout import exceptions
|
|
7
|
+
from webscout.litagent import LitAgent
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from . import utils
|
|
10
|
+
from .base import BaseTTSProvider
|
|
11
|
+
|
|
12
|
+
class ElevenlabsTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the ElevenlabsTTS API.

    The text is split with ``utils.split_sentences``; every sentence is sent
    as its own request from a thread pool and the returned audio payloads are
    concatenated in sentence order into a single ``.mp3`` file.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Voice display name -> voice id used in the request URL.
    all_voices: dict[str, str] = {
        "Brian": "nPczCjzI2devNBz1zQrb",
        "Alice": "Xb7hH8MSUJpSbSDYk0k2",
        "Bill": "pqHfZKP75CvOlQylNhV4",
        "Callum": "N2lVS1w4EtoT3dr4eOWO",
        "Charlie": "IKne3meq5aSn9XLyUdCD",
        "Charlotte": "XB0fDUnXU5powFXDhCwa",
        "Chris": "iP95p4xoKVk53GoZ742B",
        "Daniel": "onwK4e9ZLuTAKqWW03F9",
        "Eric": "cjVigY5qzO86Huf0OWal",
        "George": "JBFqnCBsd6RMkjVDRZzb",
        "Jessica": "cgSgspJ2msm6clMCkdW9",
        "Laura": "FGY2WhTYpPnrIDTdsKH5",
        "Liam": "TX3LPaxmHKxFdv7VOQHJ",
        "Lily": "pFZP5JQG7iQjIQuC4Bku",
        "Matilda": "XrExE9yKIg1WjnnlVkGX",
        "Sarah": "EXAVITQu4vr4xnSDxMaL",
        "Will": "bIHbv24MWmeRgasZH58o",
    }
    # Maximum number of requests attempted per sentence before giving up.
    # Without a bound a permanent error (bad voice id, rate limit, outage)
    # would keep the worker thread retrying forever.
    max_retries: int = 5
    # Seconds to wait between two attempts for the same sentence.
    retry_delay: float = 1.0

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the ElevenlabsTTS TTS client.

        Args:
            timeout: Per-request timeout in seconds.
            proxies: Optional proxy mapping applied to the HTTP session.
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout
        self.params = {'allow_unauthenticated': '1'}

    def tts(self, text: str, voice: str = "Brian", verbose:bool = True) -> str:
        """
        Converts text to speech using the ElevenlabsTTS API and saves it to a file.

        Args:
            text: Text to synthesise.
            voice: Key of ``all_voices`` selecting the voice.
            verbose: When true, print ``[debug]`` progress messages.

        Returns:
            POSIX-style path of the generated ``.mp3`` file.

        Raises:
            AssertionError: If ``voice`` is not a key of ``all_voices``.
            exceptions.FailedToGenerateResponseError: If a sentence could not
                be synthesised within ``max_retries`` attempts.
        """
        assert (
            voice in self.all_voices
        ), f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"

        # The URL only depends on the voice, so build it once.
        url = f'https://api.elevenlabs.io/v1/text-to-speech/{self.all_voices[voice]}'

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            last_error = None
            for attempt in range(1, self.max_retries + 1):
                try:
                    json_data = {'text': part_text, 'model_id': 'eleven_multilingual_v2'}
                    response = self.session.post(url, params=self.params, headers=self.headers, json=json_data, timeout=self.timeout)
                    response.raise_for_status()

                    # raise_for_status() only rejects 4xx/5xx; still insist on 200.
                    if response.status_code == 200:
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, response.content
                    last_error = f"unexpected status code {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                except requests.RequestException as e:
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")
                # No point sleeping after the final attempt.
                if attempt < self.max_retries:
                    time.sleep(self.retry_delay)
            if verbose:
                print(f"[debug] Failed to perform the operation: {last_error}")
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to perform the operation: {last_error}"
            )

        # Dictionary to store results keyed by sentence number
        audio_chunks = {}

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except exceptions.FailedToGenerateResponseError:
                    # A sentence is permanently missing: abort instead of
                    # returning truncated audio, and skip work not yet started.
                    for pending in futures:
                        pending.cancel()
                    raise
                except Exception as e:
                    # Unexpected (non-request) errors stay best-effort.
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                else:
                    audio_chunks[part_number] = audio_data

        # Combine audio chunks in the correct sequence
        combined_audio = BytesIO()
        for part_number in sorted(audio_chunks):
            combined_audio.write(audio_chunks[part_number])
            if verbose:
                print(f"[debug] Added chunk {part_number} to the combined file.")

        # Save the combined audio data to a single file. NamedTemporaryFile
        # creates the file atomically, unlike the deprecated tempfile.mktemp
        # which only returns a name that another process could claim first.
        with tempfile.NamedTemporaryFile(suffix=".mp3", dir=self.temp_dir, delete=False) as f:
            f.write(combined_audio.getvalue())
            filename = pathlib.Path(f.name)
        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
103
|
+
|
|
104
|
+
# Example usage
|
|
105
|
+
if __name__ == "__main__":
    # Smoke test: synthesise a two-sentence sample with the "Brian" voice
    # and report where the resulting file was written.
    sample_text = "This is a test of the ElevenlabsTTS text-to-speech API. It supports multiple sentences and advanced logging."
    provider = ElevenlabsTTS()

    print("[debug] Generating audio...")
    output_path = provider.tts(sample_text, voice="Brian")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import base64
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from webscout import exceptions
|
|
7
|
+
from webscout.litagent import LitAgent
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from . import utils
|
|
10
|
+
from .base import BaseTTSProvider
|
|
11
|
+
|
|
12
|
+
class GesseritTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the GesseritTTS API.

    The text is split with ``utils.split_sentences``; every sentence is sent
    as its own request from a thread pool, the base64 audio in each JSON
    reply is decoded, and the pieces are concatenated in sentence order into
    a single ``.mp3`` file under ``cache_dir``.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Output directory, relative to the current working directory.
    cache_dir = pathlib.Path("./audio_cache")
    # Voice display name -> voice id sent in the request payload.
    all_voices: dict[str, str] = {
        "Emma": "en_us_001",  # Female Voice
        "Liam": "en_us_006",  # Male Voice
        "Noah": "en_us_007",  # Male Voice
        "Oliver": "en_us_009",  # Male Voice
        "Elijah": "en_us_010",  # Male Voice
        "James": "en_male_narration",  # Male Voice
        "Charlie": "en_male_funny",  # Male Voice
        "Sophia": "en_female_emotional",  # Female Voice
        "Cody": "en_male_cody",  # Male Voice
    }
    # Maximum number of requests attempted per sentence before giving up.
    # Without a bound a permanent error would keep the worker retrying forever.
    max_retries: int = 5
    # Seconds to wait between two attempts for the same sentence.
    retry_delay: float = 1.0

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the GesseritTTS TTS client.

        Args:
            timeout: Per-request timeout in seconds.
            proxies: Optional proxy mapping applied to the HTTP session.
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Oliver", verbose:bool = True) -> str:
        """
        Converts text to speech using the GesseritTTS API and saves it to a file.

        Args:
            text: Text to synthesise.
            voice: Key of ``all_voices`` selecting the voice.
            verbose: When true, print ``[debug]`` progress messages.

        Returns:
            POSIX-style path of the generated ``.mp3`` file.

        Raises:
            AssertionError: If ``voice`` is not a key of ``all_voices``.
            exceptions.FailedToGenerateResponseError: If a sentence could not
                be synthesised within ``max_retries`` attempts.
        """
        assert (
            voice in self.all_voices
        ), f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"

        # Nanosecond resolution so two calls within the same second do not
        # overwrite each other's output file.
        filename = self.cache_dir / f"{time.time_ns()}.mp3"

        voice_id = self.all_voices[voice]

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            last_error = None
            for attempt in range(1, self.max_retries + 1):
                try:
                    payload = {
                        "text": part_text,
                        "voice": voice_id
                    }
                    response = self.session.post('https://gesserit.co/api/tiktok-tts', headers=self.headers, json=payload, timeout=self.timeout)
                    response.raise_for_status()

                    # raise_for_status() only rejects 4xx/5xx; still insist on 200.
                    if response.status_code == 200:
                        data = response.json()
                        # "audioUrl" is indexed as "<prefix>,<base64 audio>".
                        audio_base64 = data["audioUrl"].split(",")[1]
                        audio_data = base64.b64decode(audio_base64)
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, audio_data
                    last_error = f"unexpected status code {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                except (requests.RequestException, KeyError, IndexError, TypeError, ValueError) as e:
                    # Besides transport errors, treat a reply that is not the
                    # expected JSON/base64 shape as a failed attempt instead
                    # of silently dropping the sentence.
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")
                # No point sleeping after the final attempt.
                if attempt < self.max_retries:
                    time.sleep(self.retry_delay)
            if verbose:
                print(f"[debug] Failed to perform the operation: {last_error}")
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to perform the operation: {last_error}"
            )

        # Dictionary to store results keyed by sentence number
        audio_chunks = {}

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except exceptions.FailedToGenerateResponseError:
                    # A sentence is permanently missing: abort instead of
                    # returning truncated audio, and skip work not yet started.
                    for pending in futures:
                        pending.cancel()
                    raise
                except Exception as e:
                    # Unexpected errors stay best-effort.
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                else:
                    audio_chunks[part_number] = audio_data

        # Combine audio chunks in the correct sequence
        combined_audio = BytesIO()
        for part_number in sorted(audio_chunks):
            combined_audio.write(audio_chunks[part_number])
            if verbose:
                print(f"[debug] Added chunk {part_number} to the combined file.")

        # Create the audio_cache directory if it doesn't exist. Done once,
        # right before writing, so it also exists when no request was made.
        self.cache_dir.mkdir(parents=True, exist_ok=True)

        # Save the combined audio data to a single file
        with open(filename, 'wb') as f:
            f.write(combined_audio.getvalue())
        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
120
|
+
|
|
121
|
+
# Example usage
|
|
122
|
+
if __name__ == "__main__":
    # Smoke test: synthesise a two-sentence sample with the "Oliver" voice
    # and report where the resulting file was written.
    sample_text = "This is a test of the GesseritTTS text-to-speech API. It supports multiple sentences and advanced logging."
    provider = GesseritTTS()

    print("[debug] Generating audio...")
    output_path = provider.tts(sample_text, voice="Oliver")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,113 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import tempfile
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from urllib.parse import urlencode
|
|
7
|
+
from webscout import exceptions
|
|
8
|
+
from webscout.litagent import LitAgent
|
|
9
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
10
|
+
from . import utils
|
|
11
|
+
from .base import BaseTTSProvider
|
|
12
|
+
|
|
13
|
+
class MurfAITTS(BaseTTSProvider):
    """
    Text-to-speech provider using the MurfAITTS API.

    The text is split with ``utils.split_sentences``; every sentence is
    fetched with its own GET request from a thread pool and the returned
    audio payloads are concatenated in sentence order into a single ``.mp3``
    file.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Voice display name -> voice id sent as the "name" query parameter.
    all_voices: dict[str, str] = {"Hazel": "en-UK-hazel"}
    # Maximum number of requests attempted per sentence before giving up.
    # Without a bound a permanent error would keep the worker retrying forever.
    max_retries: int = 5
    # Seconds to wait between two attempts for the same sentence.
    retry_delay: float = 1.0

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the MurfAITTS TTS client.

        Args:
            timeout: Per-request timeout in seconds.
            proxies: Optional proxy mapping applied to the HTTP session.
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Hazel", verbose:bool = True) -> str:
        """
        Converts text to speech using the MurfAITTS API and saves it to a file.

        Args:
            text: Text to synthesise.
            voice: Key of ``all_voices`` selecting the voice.
            verbose: When true, print ``[debug]`` progress messages.

        Returns:
            POSIX-style path of the generated ``.mp3`` file.

        Raises:
            AssertionError: If ``voice`` is not a key of ``all_voices``.
            exceptions.FailedToGenerateResponseError: If a sentence could not
                be synthesised within ``max_retries`` attempts.
        """
        assert (
            voice in self.all_voices
        ), f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"

        voice_id = self.all_voices[voice]

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            # The query string is identical for every attempt; encode it once.
            params: dict[str, str] = {
                "name": voice_id,
                "text": part_text
            }
            encode_param: str = urlencode(params)
            last_error = None
            for attempt in range(1, self.max_retries + 1):
                try:
                    response = self.session.get(f"https://murf.ai/Prod/anonymous-tts/audio?{encode_param}", headers=self.headers, timeout=self.timeout)
                    response.raise_for_status()

                    # raise_for_status() only rejects 4xx/5xx; still insist on 200.
                    if response.status_code == 200:
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, response.content
                    last_error = f"unexpected status code {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                except requests.RequestException as e:
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")
                # No point sleeping after the final attempt.
                if attempt < self.max_retries:
                    time.sleep(self.retry_delay)
            if verbose:
                print(f"[debug] Failed to perform the operation: {last_error}")
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to perform the operation: {last_error}"
            )

        # Dictionary to store results keyed by sentence number
        audio_chunks = {}

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except exceptions.FailedToGenerateResponseError:
                    # A sentence is permanently missing: abort instead of
                    # returning truncated audio, and skip work not yet started.
                    for pending in futures:
                        pending.cancel()
                    raise
                except Exception as e:
                    # Unexpected (non-request) errors stay best-effort.
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                else:
                    audio_chunks[part_number] = audio_data

        # Combine audio chunks in the correct sequence
        combined_audio = BytesIO()
        for part_number in sorted(audio_chunks):
            combined_audio.write(audio_chunks[part_number])
            if verbose:
                print(f"[debug] Added chunk {part_number} to the combined file.")

        # Save the combined audio data to a single file. NamedTemporaryFile
        # creates the file atomically, unlike the deprecated tempfile.mktemp
        # which only returns a name that another process could claim first.
        with tempfile.NamedTemporaryFile(suffix=".mp3", dir=self.temp_dir, delete=False) as f:
            f.write(combined_audio.getvalue())
            filename = pathlib.Path(f.name)
        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
105
|
+
|
|
106
|
+
# Example usage
|
|
107
|
+
if __name__ == "__main__":
    # Smoke test: synthesise a two-sentence sample with the "Hazel" voice
    # and report where the resulting file was written.
    sample_text = "This is a test of the MurfAITTS text-to-speech API. It supports multiple sentences and advanced logging."
    provider = MurfAITTS()

    print("[debug] Generating audio...")
    output_path = provider.tts(sample_text, voice="Hazel")
    print(f"Audio saved to: {output_path}")
|