webscout 8.2.7__py3-none-any.whl → 8.2.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- webscout/AIauto.py +33 -15
- webscout/AIbase.py +96 -37
- webscout/AIutel.py +703 -250
- webscout/Bard.py +441 -323
- webscout/Extra/Act.md +309 -0
- webscout/Extra/GitToolkit/__init__.py +10 -0
- webscout/Extra/GitToolkit/gitapi/README.md +110 -0
- webscout/Extra/GitToolkit/gitapi/__init__.py +12 -0
- webscout/Extra/GitToolkit/gitapi/repository.py +195 -0
- webscout/Extra/GitToolkit/gitapi/user.py +96 -0
- webscout/Extra/GitToolkit/gitapi/utils.py +62 -0
- webscout/Extra/YTToolkit/README.md +375 -0
- webscout/Extra/YTToolkit/YTdownloader.py +957 -0
- webscout/Extra/YTToolkit/__init__.py +3 -0
- webscout/Extra/YTToolkit/transcriber.py +476 -0
- webscout/Extra/YTToolkit/ytapi/README.md +44 -0
- webscout/Extra/YTToolkit/ytapi/__init__.py +6 -0
- webscout/Extra/YTToolkit/ytapi/channel.py +307 -0
- webscout/Extra/YTToolkit/ytapi/errors.py +13 -0
- webscout/Extra/YTToolkit/ytapi/extras.py +118 -0
- webscout/Extra/YTToolkit/ytapi/https.py +88 -0
- webscout/Extra/YTToolkit/ytapi/patterns.py +61 -0
- webscout/Extra/YTToolkit/ytapi/playlist.py +59 -0
- webscout/Extra/YTToolkit/ytapi/pool.py +8 -0
- webscout/Extra/YTToolkit/ytapi/query.py +40 -0
- webscout/Extra/YTToolkit/ytapi/stream.py +63 -0
- webscout/Extra/YTToolkit/ytapi/utils.py +62 -0
- webscout/Extra/YTToolkit/ytapi/video.py +232 -0
- webscout/Extra/__init__.py +7 -0
- webscout/Extra/autocoder/__init__.py +9 -0
- webscout/Extra/autocoder/autocoder.py +1105 -0
- webscout/Extra/autocoder/autocoder_utiles.py +332 -0
- webscout/Extra/gguf.md +430 -0
- webscout/Extra/gguf.py +684 -0
- webscout/Extra/tempmail/README.md +488 -0
- webscout/Extra/tempmail/__init__.py +28 -0
- webscout/Extra/tempmail/async_utils.py +141 -0
- webscout/Extra/tempmail/base.py +161 -0
- webscout/Extra/tempmail/cli.py +187 -0
- webscout/Extra/tempmail/emailnator.py +84 -0
- webscout/Extra/tempmail/mail_tm.py +361 -0
- webscout/Extra/tempmail/temp_mail_io.py +292 -0
- webscout/Extra/weather.md +281 -0
- webscout/Extra/weather.py +194 -0
- webscout/Extra/weather_ascii.py +76 -0
- webscout/Litlogger/README.md +10 -0
- webscout/Litlogger/__init__.py +15 -0
- webscout/Litlogger/formats.py +4 -0
- webscout/Litlogger/handlers.py +103 -0
- webscout/Litlogger/levels.py +13 -0
- webscout/Litlogger/logger.py +92 -0
- webscout/Provider/AI21.py +177 -0
- webscout/Provider/AISEARCH/DeepFind.py +254 -0
- webscout/Provider/AISEARCH/Perplexity.py +333 -0
- webscout/Provider/AISEARCH/README.md +279 -0
- webscout/Provider/AISEARCH/__init__.py +9 -0
- webscout/Provider/AISEARCH/felo_search.py +202 -0
- webscout/Provider/AISEARCH/genspark_search.py +324 -0
- webscout/Provider/AISEARCH/hika_search.py +186 -0
- webscout/Provider/AISEARCH/iask_search.py +410 -0
- webscout/Provider/AISEARCH/monica_search.py +220 -0
- webscout/Provider/AISEARCH/scira_search.py +298 -0
- webscout/Provider/AISEARCH/webpilotai_search.py +255 -0
- webscout/Provider/Aitopia.py +316 -0
- webscout/Provider/AllenAI.py +440 -0
- webscout/Provider/Andi.py +228 -0
- webscout/Provider/Blackboxai.py +791 -0
- webscout/Provider/ChatGPTClone.py +237 -0
- webscout/Provider/ChatGPTGratis.py +194 -0
- webscout/Provider/ChatSandbox.py +342 -0
- webscout/Provider/Cloudflare.py +324 -0
- webscout/Provider/Cohere.py +208 -0
- webscout/Provider/Deepinfra.py +340 -0
- webscout/Provider/ExaAI.py +261 -0
- webscout/Provider/ExaChat.py +358 -0
- webscout/Provider/Flowith.py +217 -0
- webscout/Provider/FreeGemini.py +250 -0
- webscout/Provider/Gemini.py +169 -0
- webscout/Provider/GithubChat.py +369 -0
- webscout/Provider/GizAI.py +295 -0
- webscout/Provider/Glider.py +225 -0
- webscout/Provider/Groq.py +801 -0
- webscout/Provider/HF_space/__init__.py +0 -0
- webscout/Provider/HF_space/qwen_qwen2.py +206 -0
- webscout/Provider/HeckAI.py +375 -0
- webscout/Provider/HuggingFaceChat.py +469 -0
- webscout/Provider/Hunyuan.py +283 -0
- webscout/Provider/Jadve.py +291 -0
- webscout/Provider/Koboldai.py +384 -0
- webscout/Provider/LambdaChat.py +411 -0
- webscout/Provider/Llama3.py +259 -0
- webscout/Provider/MCPCore.py +315 -0
- webscout/Provider/Marcus.py +198 -0
- webscout/Provider/Nemotron.py +218 -0
- webscout/Provider/Netwrck.py +270 -0
- webscout/Provider/OLLAMA.py +396 -0
- webscout/Provider/OPENAI/BLACKBOXAI.py +766 -0
- webscout/Provider/OPENAI/Cloudflare.py +378 -0
- webscout/Provider/OPENAI/FreeGemini.py +283 -0
- webscout/Provider/OPENAI/NEMOTRON.py +232 -0
- webscout/Provider/OPENAI/Qwen3.py +283 -0
- webscout/Provider/OPENAI/README.md +952 -0
- webscout/Provider/OPENAI/TwoAI.py +357 -0
- webscout/Provider/OPENAI/__init__.py +40 -0
- webscout/Provider/OPENAI/ai4chat.py +293 -0
- webscout/Provider/OPENAI/api.py +969 -0
- webscout/Provider/OPENAI/base.py +249 -0
- webscout/Provider/OPENAI/c4ai.py +373 -0
- webscout/Provider/OPENAI/chatgpt.py +556 -0
- webscout/Provider/OPENAI/chatgptclone.py +494 -0
- webscout/Provider/OPENAI/chatsandbox.py +173 -0
- webscout/Provider/OPENAI/copilot.py +242 -0
- webscout/Provider/OPENAI/deepinfra.py +322 -0
- webscout/Provider/OPENAI/e2b.py +1414 -0
- webscout/Provider/OPENAI/exaai.py +417 -0
- webscout/Provider/OPENAI/exachat.py +444 -0
- webscout/Provider/OPENAI/flowith.py +162 -0
- webscout/Provider/OPENAI/freeaichat.py +359 -0
- webscout/Provider/OPENAI/glider.py +326 -0
- webscout/Provider/OPENAI/groq.py +364 -0
- webscout/Provider/OPENAI/heckai.py +308 -0
- webscout/Provider/OPENAI/llmchatco.py +335 -0
- webscout/Provider/OPENAI/mcpcore.py +389 -0
- webscout/Provider/OPENAI/multichat.py +376 -0
- webscout/Provider/OPENAI/netwrck.py +357 -0
- webscout/Provider/OPENAI/oivscode.py +287 -0
- webscout/Provider/OPENAI/opkfc.py +496 -0
- webscout/Provider/OPENAI/pydantic_imports.py +172 -0
- webscout/Provider/OPENAI/scirachat.py +477 -0
- webscout/Provider/OPENAI/sonus.py +304 -0
- webscout/Provider/OPENAI/standardinput.py +433 -0
- webscout/Provider/OPENAI/textpollinations.py +339 -0
- webscout/Provider/OPENAI/toolbaz.py +413 -0
- webscout/Provider/OPENAI/typefully.py +355 -0
- webscout/Provider/OPENAI/typegpt.py +364 -0
- webscout/Provider/OPENAI/uncovrAI.py +463 -0
- webscout/Provider/OPENAI/utils.py +318 -0
- webscout/Provider/OPENAI/venice.py +431 -0
- webscout/Provider/OPENAI/wisecat.py +387 -0
- webscout/Provider/OPENAI/writecream.py +163 -0
- webscout/Provider/OPENAI/x0gpt.py +365 -0
- webscout/Provider/OPENAI/yep.py +382 -0
- webscout/Provider/OpenGPT.py +209 -0
- webscout/Provider/Openai.py +496 -0
- webscout/Provider/PI.py +429 -0
- webscout/Provider/Perplexitylabs.py +415 -0
- webscout/Provider/QwenLM.py +254 -0
- webscout/Provider/Reka.py +214 -0
- webscout/Provider/StandardInput.py +290 -0
- webscout/Provider/TTI/README.md +82 -0
- webscout/Provider/TTI/__init__.py +7 -0
- webscout/Provider/TTI/aiarta.py +365 -0
- webscout/Provider/TTI/artbit.py +0 -0
- webscout/Provider/TTI/base.py +64 -0
- webscout/Provider/TTI/fastflux.py +200 -0
- webscout/Provider/TTI/magicstudio.py +201 -0
- webscout/Provider/TTI/piclumen.py +203 -0
- webscout/Provider/TTI/pixelmuse.py +225 -0
- webscout/Provider/TTI/pollinations.py +221 -0
- webscout/Provider/TTI/utils.py +11 -0
- webscout/Provider/TTS/README.md +192 -0
- webscout/Provider/TTS/__init__.py +10 -0
- webscout/Provider/TTS/base.py +159 -0
- webscout/Provider/TTS/deepgram.py +156 -0
- webscout/Provider/TTS/elevenlabs.py +111 -0
- webscout/Provider/TTS/gesserit.py +128 -0
- webscout/Provider/TTS/murfai.py +113 -0
- webscout/Provider/TTS/openai_fm.py +129 -0
- webscout/Provider/TTS/parler.py +111 -0
- webscout/Provider/TTS/speechma.py +580 -0
- webscout/Provider/TTS/sthir.py +94 -0
- webscout/Provider/TTS/streamElements.py +333 -0
- webscout/Provider/TTS/utils.py +280 -0
- webscout/Provider/TeachAnything.py +229 -0
- webscout/Provider/TextPollinationsAI.py +308 -0
- webscout/Provider/TwoAI.py +475 -0
- webscout/Provider/TypliAI.py +305 -0
- webscout/Provider/UNFINISHED/ChatHub.py +209 -0
- webscout/Provider/UNFINISHED/Youchat.py +330 -0
- webscout/Provider/UNFINISHED/liner_api_request.py +263 -0
- webscout/Provider/UNFINISHED/puterjs.py +635 -0
- webscout/Provider/UNFINISHED/test_lmarena.py +119 -0
- webscout/Provider/Venice.py +258 -0
- webscout/Provider/VercelAI.py +253 -0
- webscout/Provider/WiseCat.py +233 -0
- webscout/Provider/WrDoChat.py +370 -0
- webscout/Provider/Writecream.py +246 -0
- webscout/Provider/WritingMate.py +269 -0
- webscout/Provider/__init__.py +174 -0
- webscout/Provider/ai4chat.py +174 -0
- webscout/Provider/akashgpt.py +335 -0
- webscout/Provider/asksteve.py +220 -0
- webscout/Provider/cerebras.py +290 -0
- webscout/Provider/chatglm.py +215 -0
- webscout/Provider/cleeai.py +213 -0
- webscout/Provider/copilot.py +425 -0
- webscout/Provider/elmo.py +283 -0
- webscout/Provider/freeaichat.py +285 -0
- webscout/Provider/geminiapi.py +208 -0
- webscout/Provider/granite.py +235 -0
- webscout/Provider/hermes.py +266 -0
- webscout/Provider/julius.py +223 -0
- webscout/Provider/koala.py +170 -0
- webscout/Provider/learnfastai.py +325 -0
- webscout/Provider/llama3mitril.py +215 -0
- webscout/Provider/llmchat.py +258 -0
- webscout/Provider/llmchatco.py +306 -0
- webscout/Provider/lmarena.py +198 -0
- webscout/Provider/meta.py +801 -0
- webscout/Provider/multichat.py +364 -0
- webscout/Provider/oivscode.py +309 -0
- webscout/Provider/samurai.py +224 -0
- webscout/Provider/scira_chat.py +299 -0
- webscout/Provider/scnet.py +243 -0
- webscout/Provider/searchchat.py +292 -0
- webscout/Provider/sonus.py +258 -0
- webscout/Provider/talkai.py +194 -0
- webscout/Provider/toolbaz.py +353 -0
- webscout/Provider/turboseek.py +266 -0
- webscout/Provider/typefully.py +202 -0
- webscout/Provider/typegpt.py +289 -0
- webscout/Provider/uncovr.py +368 -0
- webscout/Provider/x0gpt.py +299 -0
- webscout/Provider/yep.py +389 -0
- webscout/__init__.py +4 -2
- webscout/cli.py +3 -28
- webscout/client.py +70 -0
- webscout/conversation.py +35 -35
- webscout/litagent/Readme.md +276 -0
- webscout/litagent/__init__.py +29 -0
- webscout/litagent/agent.py +455 -0
- webscout/litagent/constants.py +60 -0
- webscout/litprinter/__init__.py +59 -0
- webscout/optimizers.py +419 -419
- webscout/scout/README.md +404 -0
- webscout/scout/__init__.py +8 -0
- webscout/scout/core/__init__.py +7 -0
- webscout/scout/core/crawler.py +210 -0
- webscout/scout/core/scout.py +607 -0
- webscout/scout/core/search_result.py +96 -0
- webscout/scout/core/text_analyzer.py +63 -0
- webscout/scout/core/text_utils.py +277 -0
- webscout/scout/core/web_analyzer.py +52 -0
- webscout/scout/element.py +478 -0
- webscout/scout/parsers/__init__.py +69 -0
- webscout/scout/parsers/html5lib_parser.py +172 -0
- webscout/scout/parsers/html_parser.py +236 -0
- webscout/scout/parsers/lxml_parser.py +178 -0
- webscout/scout/utils.py +37 -0
- webscout/swiftcli/Readme.md +323 -0
- webscout/swiftcli/__init__.py +95 -0
- webscout/swiftcli/core/__init__.py +7 -0
- webscout/swiftcli/core/cli.py +297 -0
- webscout/swiftcli/core/context.py +104 -0
- webscout/swiftcli/core/group.py +241 -0
- webscout/swiftcli/decorators/__init__.py +28 -0
- webscout/swiftcli/decorators/command.py +221 -0
- webscout/swiftcli/decorators/options.py +220 -0
- webscout/swiftcli/decorators/output.py +252 -0
- webscout/swiftcli/exceptions.py +21 -0
- webscout/swiftcli/plugins/__init__.py +9 -0
- webscout/swiftcli/plugins/base.py +135 -0
- webscout/swiftcli/plugins/manager.py +269 -0
- webscout/swiftcli/utils/__init__.py +59 -0
- webscout/swiftcli/utils/formatting.py +252 -0
- webscout/swiftcli/utils/parsing.py +267 -0
- webscout/version.py +1 -1
- webscout/webscout_search.py +2 -182
- webscout/webscout_search_async.py +1 -179
- webscout/zeroart/README.md +89 -0
- webscout/zeroart/__init__.py +135 -0
- webscout/zeroart/base.py +66 -0
- webscout/zeroart/effects.py +101 -0
- webscout/zeroart/fonts.py +1239 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/METADATA +262 -83
- webscout-8.2.9.dist-info/RECORD +289 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/WHEEL +1 -1
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/entry_points.txt +1 -0
- webscout-8.2.7.dist-info/RECORD +0 -26
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/licenses/LICENSE.md +0 -0
- {webscout-8.2.7.dist-info → webscout-8.2.9.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import base64
|
|
5
|
+
import tempfile
|
|
6
|
+
from io import BytesIO
|
|
7
|
+
from webscout import exceptions
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from webscout.litagent import LitAgent
|
|
10
|
+
from . import utils
|
|
11
|
+
from .base import BaseTTSProvider
|
|
12
|
+
|
|
13
|
+
class DeepgramTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the DeepgramTTS API.

    The input text is split into sentences, one request is sent per sentence
    (concurrently), and the base64-decoded audio chunks are concatenated in
    sentence order into a single ``.mp3`` file.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Maps the public voice name to the model identifier sent to the API.
    all_voices: dict[str, str] = {
        "Asteria": "aura-asteria-en", "Arcas": "aura-arcas-en", "Luna": "aura-luna-en",
        "Zeus": "aura-zeus-en", "Orpheus": "aura-orpheus-en", "Angus": "aura-angus-en",
        "Athena": "aura-athena-en", "Helios": "aura-helios-en", "Hera": "aura-hera-en",
        "Orion": "aura-orion-en", "Perseus": "aura-perseus-en", "Stella": "aura-stella-en"
    }

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the DeepgramTTS TTS client.

        Args:
            timeout (int): Per-request timeout in seconds (default: 20)
            proxies (dict): Optional proxy mapping applied to the session
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Asteria", verbose: bool = True) -> str:
        """
        Converts text to speech using the DeepgramTTS API and saves it to a file.

        Args:
            text (str): The text to convert to speech
            voice (str): The voice to use for TTS; must be a key of
                ``all_voices`` (default: "Asteria")
            verbose (bool): Whether to print progress messages (default: True)

        Returns:
            str: Path to the generated audio file

        Raises:
            AssertionError: If the specified voice is not available
            RuntimeError: If any chunk cannot be generated or the audio
                cannot be written
        """
        if voice not in self.all_voices:
            # Raised explicitly instead of via `assert` so the check still
            # runs under `python -O`; the exception type is kept for callers.
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        url = "https://deepgram.com/api/ttsAudioGeneration"

        # Split text into sentences using the utils module
        sentences = utils.split_sentences(text)
        if verbose:
            for index, sen in enumerate(sentences):
                print(f"[debug] Sentence {index}: {sen}")

        def generate_audio_for_chunk(part_text: str, part_number: int):
            """
            Generate audio for a single chunk of text.

            Args:
                part_text (str): The text chunk to convert
                part_number (int): The chunk number for ordering

            Returns:
                tuple: (part_number, audio_data)

            Raises:
                requests.RequestException: If the last attempt hits an API error
                ValueError: If the last attempt returns an undecodable payload
                RuntimeError: If no attempt returned any audio data
            """
            max_retries = 3
            payload = {"text": part_text, "model": self.all_voices[voice]}

            for attempt in range(1, max_retries + 1):
                try:
                    response = self.session.post(
                        url=url,
                        headers=self.headers,
                        json=payload,
                        timeout=self.timeout
                    )
                    response.raise_for_status()

                    response_data = response.json().get('data')
                    if response_data:
                        audio_data = base64.b64decode(response_data)
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, audio_data

                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Attempt {attempt}/{max_retries}")

                # ValueError covers a non-JSON body or invalid base64 data.
                except (requests.RequestException, ValueError) as e:
                    if verbose:
                        print(f"[debug] Error processing chunk {part_number}: {str(e)}. Attempt {attempt}/{max_retries}")
                    if attempt == max_retries:
                        raise

                # Back off between attempts, but not after the final one.
                if attempt < max_retries:
                    time.sleep(1)

            raise RuntimeError(f"Failed to generate audio for chunk {part_number} after {max_retries} attempts")

        try:
            # Using ThreadPoolExecutor to handle requests concurrently
            with ThreadPoolExecutor() as executor:
                futures = {
                    executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                    for chunk_num, sentence in enumerate(sentences, start=1)
                }

                # Results keyed by chunk number so they can be re-ordered later
                audio_chunks = {}

                for future in as_completed(futures):
                    chunk_num = futures[future]
                    try:
                        part_number, audio_data = future.result()
                    except Exception as e:
                        raise RuntimeError(f"Failed to generate audio for chunk {chunk_num}: {str(e)}") from e
                    audio_chunks[part_number] = audio_data

            # Combine all audio chunks in order. NamedTemporaryFile creates
            # the file atomically, avoiding the race inherent in the
            # deprecated tempfile.mktemp(); delete=False keeps it for the caller.
            # NOTE(review): self.temp_dir is presumably set by BaseTTSProvider — confirm.
            with tempfile.NamedTemporaryFile(
                mode="wb", suffix=".mp3", dir=self.temp_dir, delete=False
            ) as f:
                for chunk_num in sorted(audio_chunks):
                    f.write(audio_chunks[chunk_num])
                filename = pathlib.Path(f.name)

            if verbose:
                print(f"[debug] Audio saved to {filename}")
            return str(filename)

        except Exception as e:
            if verbose:
                print(f"[debug] Failed to generate audio: {str(e)}")
            raise RuntimeError(f"Failed to generate audio: {str(e)}") from e
|
|
148
|
+
|
|
149
|
+
# Manual smoke test: synthesise a short sample when run as a script.
if __name__ == "__main__":
    sample_text = "This is a test of the DeepgramTTS text-to-speech API. It supports multiple sentences. Let's see how it works!"
    tts_client = DeepgramTTS()

    print("[debug] Generating audio...")
    output_path = tts_client.tts(sample_text, voice="Asteria")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import tempfile
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from webscout import exceptions
|
|
7
|
+
from webscout.litagent import LitAgent
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from . import utils
|
|
10
|
+
from .base import BaseTTSProvider
|
|
11
|
+
|
|
12
|
+
class ElevenlabsTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the ElevenlabsTTS API.

    The input text is split into sentences, one request is sent per sentence
    (concurrently), and the returned audio chunks are concatenated in
    sentence order into a single ``.mp3`` file.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Maps the public voice name to the voice id used in the request URL.
    all_voices: dict[str, str] = {
        "Brian": "nPczCjzI2devNBz1zQrb",
        "Alice": "Xb7hH8MSUJpSbSDYk0k2",
        "Bill": "pqHfZKP75CvOlQylNhV4",
        "Callum": "N2lVS1w4EtoT3dr4eOWO",
        "Charlie": "IKne3meq5aSn9XLyUdCD",
        "Charlotte": "XB0fDUnXU5powFXDhCwa",
        "Chris": "iP95p4xoKVk53GoZ742B",
        "Daniel": "onwK4e9ZLuTAKqWW03F9",
        "Eric": "cjVigY5qzO86Huf0OWal",
        "George": "JBFqnCBsd6RMkjVDRZzb",
        "Jessica": "cgSgspJ2msm6clMCkdW9",
        "Laura": "FGY2WhTYpPnrIDTdsKH5",
        "Liam": "TX3LPaxmHKxFdv7VOQHJ",
        "Lily": "pFZP5JQG7iQjIQuC4Bku",
        "Matilda": "XrExE9yKIg1WjnnlVkGX",
        "Sarah": "EXAVITQu4vr4xnSDxMaL",
        "Will": "bIHbv24MWmeRgasZH58o",
    }

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the ElevenlabsTTS TTS client.

        Args:
            timeout (int): Per-request timeout in seconds (default: 20)
            proxies (dict): Optional proxy mapping applied to the session
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout
        # Query parameters sent with every synthesis request.
        self.params = {'allow_unauthenticated': '1'}

    def tts(self, text: str, voice: str = "Brian", verbose:bool = True) -> str:
        """
        Converts text to speech using the ElevenlabsTTS API and saves it to a file.

        Args:
            text (str): The text to convert to speech
            voice (str): The voice to use; must be a key of ``all_voices``
                (default: "Brian")
            verbose (bool): Whether to print progress messages (default: True)

        Returns:
            str: POSIX-style path to the generated audio file

        Raises:
            AssertionError: If the specified voice is not available
            exceptions.FailedToGenerateResponseError: If any chunk could not
                be generated after all retry attempts
        """
        if voice not in self.all_voices:
            # Raised explicitly instead of via `assert` so the check still
            # runs under `python -O`; the exception type is kept for callers.
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        endpoint = f'https://api.elevenlabs.io/v1/text-to-speech/{self.all_voices[voice]}'
        # Bounded so a persistent failure (bad status, network down) cannot
        # keep a worker thread retrying forever.
        max_retries = 3

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            """Request audio for one chunk; return ``(part_number, audio_bytes)``."""
            json_data = {'text': part_text, 'model_id': 'eleven_multilingual_v2'}
            last_error = None

            for attempt in range(1, max_retries + 1):
                try:
                    response = self.session.post(
                        endpoint,
                        params=self.params,
                        headers=self.headers,
                        json=json_data,
                        timeout=self.timeout,
                    )
                    response.raise_for_status()

                    # Only a plain 200 is treated as carrying audio.
                    if response.status_code == 200:
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, response.content

                    last_error = f"unexpected status {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                except requests.RequestException as e:
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")

                # Back off between attempts, but not after the final one.
                if attempt < max_retries:
                    time.sleep(1)

            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate audio for chunk {part_number} after {max_retries} attempts: {last_error}"
            )

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            # Results keyed by chunk number so they can be re-ordered later
            audio_chunks = {}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except Exception as e:
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                    # A missing chunk would silently truncate the audio, so
                    # fail the whole call instead of writing a partial file.
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to perform the operation: {e}"
                    ) from e
                audio_chunks[part_number] = audio_data  # Store the audio data in correct sequence

        # Save the combined audio data to a single file. NamedTemporaryFile
        # creates the file atomically, avoiding the race inherent in the
        # deprecated tempfile.mktemp(); delete=False keeps it for the caller.
        # NOTE(review): self.temp_dir is presumably set by BaseTTSProvider — confirm.
        with tempfile.NamedTemporaryFile(
            mode="wb", suffix=".mp3", dir=self.temp_dir, delete=False
        ) as f:
            # Combine audio chunks in the correct sequence
            for part_number in sorted(audio_chunks):
                f.write(audio_chunks[part_number])
                if verbose:
                    print(f"[debug] Added chunk {part_number} to the combined file.")
            filename = pathlib.Path(f.name)

        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
103
|
+
|
|
104
|
+
# Manual smoke test: synthesise a short sample when run as a script.
if __name__ == "__main__":
    sample_text = "This is a test of the ElevenlabsTTS text-to-speech API. It supports multiple sentences and advanced logging."
    tts_client = ElevenlabsTTS()

    print("[debug] Generating audio...")
    output_path = tts_client.tts(sample_text, voice="Brian")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import base64
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from webscout import exceptions
|
|
7
|
+
from webscout.litagent import LitAgent
|
|
8
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
9
|
+
from . import utils
|
|
10
|
+
from .base import BaseTTSProvider
|
|
11
|
+
|
|
12
|
+
class GesseritTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the GesseritTTS API.

    The input text is split into sentences, one request is sent per sentence
    (concurrently), and the base64-decoded audio chunks are concatenated in
    sentence order into a single ``.mp3`` file under ``cache_dir``.
    """
    # Request headers
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Output directory, relative to the current working directory.
    cache_dir = pathlib.Path("./audio_cache")
    # Maps the public voice name to the voice id sent to the API.
    all_voices: dict[str, str] = {
        "Emma": "en_us_001",  # Female Voice
        "Liam": "en_us_006",  # Male Voice
        "Noah": "en_us_007",  # Male Voice
        "Oliver": "en_us_009",  # Male Voice
        "Elijah": "en_us_010",  # Male Voice
        "James": "en_male_narration",  # Male Voice
        "Charlie": "en_male_funny",  # Male Voice
        "Sophia": "en_female_emotional",  # Female Voice
        "Cody": "en_male_cody",  # Male Voice
    }

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """
        Initializes the GesseritTTS TTS client.

        Args:
            timeout (int): Per-request timeout in seconds (default: 20)
            proxies (dict): Optional proxy mapping applied to the session
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Oliver", verbose:bool = True) -> str:
        """
        Converts text to speech using the GesseritTTS API and saves it to a file.

        Args:
            text (str): The text to convert to speech
            voice (str): The voice to use; must be a key of ``all_voices``
                (default: "Oliver")
            verbose (bool): Whether to print progress messages (default: True)

        Returns:
            str: POSIX-style path to the generated audio file

        Raises:
            AssertionError: If the specified voice is not available
            exceptions.FailedToGenerateResponseError: If any chunk could not
                be generated after all retry attempts
        """
        if voice not in self.all_voices:
            # Raised explicitly instead of via `assert` so the check still
            # runs under `python -O`; the exception type is kept for callers.
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        # Nanosecond resolution so two calls within the same second do not
        # overwrite each other's output file.
        filename = self.cache_dir / f"{time.time_ns()}.mp3"

        voice_id = self.all_voices[voice]
        # Bounded so a persistent failure (bad status, network down) cannot
        # keep a worker thread retrying forever.
        max_retries = 3

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            """Request audio for one chunk; return ``(part_number, audio_bytes)``."""
            payload = {
                "text": part_text,
                "voice": voice_id
            }
            last_error = None

            for attempt in range(1, max_retries + 1):
                try:
                    response = self.session.post(
                        'https://gesserit.co/api/tiktok-tts',
                        headers=self.headers,
                        json=payload,
                        timeout=self.timeout,
                    )
                    response.raise_for_status()

                    # Only a plain 200 is treated as carrying audio.
                    if response.status_code == 200:
                        data = response.json()
                        # "audioUrl" is split on the first comma and the part
                        # after it is base64-decoded into the audio bytes.
                        audio_base64 = data["audioUrl"].split(",")[1]
                        audio_data = base64.b64decode(audio_base64)
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, audio_data

                    last_error = f"unexpected status {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                # KeyError/IndexError/ValueError cover a malformed payload
                # (missing key, no comma, invalid JSON or base64).
                except (requests.RequestException, KeyError, IndexError, ValueError) as e:
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")

                # Back off between attempts, but not after the final one.
                if attempt < max_retries:
                    time.sleep(1)

            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate audio for chunk {part_number} after {max_retries} attempts: {last_error}"
            )

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            # Results keyed by chunk number so they can be re-ordered later
            audio_chunks = {}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except Exception as e:
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                    # A missing chunk would silently truncate the audio, so
                    # fail the whole call instead of writing a partial file.
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to perform the operation: {e}"
                    ) from e
                audio_chunks[part_number] = audio_data  # Store the audio data in correct sequence

        # Create the audio_cache directory if it doesn't exist (once, not per request)
        self.cache_dir.mkdir(parents=True, exist_ok=True)

        # Save the combined audio data to a single file
        with open(filename, 'wb') as f:
            # Combine audio chunks in the correct sequence
            for part_number in sorted(audio_chunks):
                f.write(audio_chunks[part_number])
                if verbose:
                    print(f"[debug] Added chunk {part_number} to the combined file.")

        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
120
|
+
|
|
121
|
+
# Manual smoke test: synthesise a short sample when run as a script.
if __name__ == "__main__":
    sample_text = "This is a test of the GesseritTTS text-to-speech API. It supports multiple sentences and advanced logging."
    tts_client = GesseritTTS()

    print("[debug] Generating audio...")
    output_path = tts_client.tts(sample_text, voice="Oliver")
    print(f"Audio saved to: {output_path}")
|
|
@@ -0,0 +1,113 @@
|
|
|
1
|
+
import time
|
|
2
|
+
import requests
|
|
3
|
+
import pathlib
|
|
4
|
+
import tempfile
|
|
5
|
+
from io import BytesIO
|
|
6
|
+
from urllib.parse import urlencode
|
|
7
|
+
from webscout import exceptions
|
|
8
|
+
from webscout.litagent import LitAgent
|
|
9
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
10
|
+
from . import utils
|
|
11
|
+
from .base import BaseTTSProvider
|
|
12
|
+
|
|
13
|
+
class MurfAITTS(BaseTTSProvider):
    """Text-to-speech provider using the MurfAITTS API.

    The input text is split into sentences, every sentence is requested from
    the anonymous Murf.ai audio endpoint on a thread pool, and the returned
    audio bytes are concatenated in sentence order into a single ``.mp3`` file.
    """

    # Request headers. The user agent is chosen once, when the class body is
    # executed (presumably a random browser UA string - see LitAgent).
    headers: dict[str, str] = {
        "User-Agent": LitAgent().random()
    }
    # Public voice name -> identifier sent as the ``name`` query parameter.
    all_voices: dict[str, str] = {"Hazel": "en-UK-hazel"}

    def __init__(self, timeout: int = 20, proxies: dict = None, max_retries: int = 5):
        """Initializes the MurfAITTS TTS client.

        Args:
            timeout: Per-request timeout passed to ``requests``.
            proxies: Optional proxy mapping merged into the session.
            max_retries: Maximum number of attempts per sentence before the
                whole conversion is reported as failed (values below 1 are
                treated as 1).
        """
        super().__init__()
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout
        self.max_retries = max(1, max_retries)

    def tts(self, text: str, voice: str = "Hazel", verbose: bool = True) -> str:
        """Converts text to speech using the MurfAITTS API and saves it to a file.

        Args:
            text: The text to convert; it is split with ``utils.split_sentences``.
            voice: Key of ``all_voices`` selecting the voice.
            verbose: Whether to print ``[debug]`` progress messages.

        Returns:
            POSIX-style path of the generated ``.mp3`` file, created inside
            ``self.temp_dir`` (presumably set up by ``BaseTTSProvider``).

        Raises:
            AssertionError: If ``voice`` is not a known voice name.
            exceptions.FailedToGenerateResponseError: If any sentence could
                not be converted within ``max_retries`` attempts.
        """
        # Raised explicitly (instead of ``assert``) so the check also runs
        # under ``python -O`` while callers still see an AssertionError.
        if voice not in self.all_voices:
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        voice_id = self.all_voices[voice]

        # Split text into sentences
        sentences = utils.split_sentences(text)

        # Function to request audio for each chunk
        def generate_audio_for_chunk(part_text: str, part_number: int):
            last_error = None
            for attempt in range(1, self.max_retries + 1):
                try:
                    params: dict[str, str] = {
                        "name": voice_id,
                        "text": part_text
                    }
                    encode_param: str = urlencode(params)
                    response = self.session.get(f"https://murf.ai/Prod/anonymous-tts/audio?{encode_param}", headers=self.headers, timeout=self.timeout)
                    response.raise_for_status()

                    # Only a plain 200 carries the audio payload
                    if response.ok and response.status_code == 200:
                        if verbose:
                            print(f"[debug] Chunk {part_number} processed successfully")
                        return part_number, response.content
                    last_error = f"unexpected status code {response.status_code}"
                    if verbose:
                        print(f"[debug] No data received for chunk {part_number}. Retrying...")
                except requests.RequestException as e:
                    last_error = e
                    if verbose:
                        print(f"[debug] Error for chunk {part_number}: {e}. Retrying...")
                # Back off briefly, but not after the final attempt
                if attempt < self.max_retries:
                    time.sleep(1)
            # Bounded retries: a permanent failure must surface, not hang forever
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to generate audio for chunk {part_number} "
                f"after {self.max_retries} attempts: {last_error}"
            )

        # Dictionary to store results so they can be re-ordered afterwards
        audio_chunks = {}

        # Using ThreadPoolExecutor to handle requests concurrently
        with ThreadPoolExecutor() as executor:
            futures = {executor.submit(generate_audio_for_chunk, sentence.strip(), chunk_num): chunk_num
                       for chunk_num, sentence in enumerate(sentences, start=1)}

            for future in as_completed(futures):
                chunk_num = futures[future]
                try:
                    part_number, audio_data = future.result()
                except Exception as e:
                    if verbose:
                        print(f"[debug] Failed to generate audio for chunk {chunk_num}: {e}")
                    # A missing sentence would silently corrupt the output, so
                    # stop queued work and report the failure to the caller.
                    for pending in futures:
                        pending.cancel()
                    if isinstance(e, exceptions.FailedToGenerateResponseError):
                        raise
                    raise exceptions.FailedToGenerateResponseError(
                        f"Failed to perform the operation: {e}"
                    ) from e
                audio_chunks[part_number] = audio_data  # Keyed by position for ordered output

        # Create the output file atomically (mktemp only reserves a name and is
        # race-prone) and write the chunks in the correct sequence.
        with tempfile.NamedTemporaryFile(suffix=".mp3", dir=self.temp_dir, delete=False) as temp_file:
            filename = pathlib.Path(temp_file.name)
            for part_number in sorted(audio_chunks):
                temp_file.write(audio_chunks[part_number])
                if verbose:
                    print(f"[debug] Added chunk {part_number} to the combined file.")

        if verbose:
            print(f"[debug] Final Audio Saved as {filename}")
        return filename.as_posix()
|
|
105
|
+
|
|
106
|
+
# Example usage
|
|
107
|
+
if __name__ == "__main__":
    # Manual smoke test: synthesize a two-sentence sample with the default voice.
    sample_text = "This is a test of the MurfAITTS text-to-speech API. It supports multiple sentences and advanced logging."
    provider = MurfAITTS()

    print("[debug] Generating audio...")
    audio_file = provider.tts(sample_text, voice="Hazel")
    print(f"Audio saved to: {audio_file}")
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
##################################################################################
|
|
2
|
+
## OpenAI.fm TTS Provider ##
|
|
3
|
+
##################################################################################
|
|
4
|
+
import time
|
|
5
|
+
import requests
|
|
6
|
+
import pathlib
|
|
7
|
+
import tempfile
|
|
8
|
+
from io import BytesIO
|
|
9
|
+
from webscout import exceptions
|
|
10
|
+
from webscout.litagent import LitAgent
|
|
11
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
12
|
+
from webscout.Provider.TTS import utils
|
|
13
|
+
from webscout.Provider.TTS.base import BaseTTSProvider
|
|
14
|
+
|
|
15
|
+
class OpenAIFMTTS(BaseTTSProvider):
    """
    Text-to-speech provider using the OpenAI.fm API.

    The whole text is sent in a single GET request to the ``/api/generate``
    endpoint and the response body is stored as an ``.mp3`` file.
    """
    # Request headers
    headers = {
        "accept": "*/*",
        "accept-language": "en-US,en;q=0.9",
        "cache-control": "no-cache",
        "pragma": "no-cache",
        "sec-fetch-dest": "audio",
        "sec-fetch-mode": "no-cors",
        "sec-fetch-site": "same-origin",
        "user-agent": LitAgent().random(),
        "referer": "https://www.openai.fm"
    }

    # Available voices with their IDs
    all_voices = {
        # OpenAI.fm voices
        "Alloy": "alloy",     # Neutral voice with balanced tone
        "Ash": "ash",         # Calm and thoughtful male voice
        "Ballad": "ballad",   # Soft and melodic voice
        "Coral": "coral",     # Warm and inviting female voice
        "Echo": "echo",       # Clear and precise voice
        "Fable": "fable",     # Authoritative and narrative voice
        "Onyx": "onyx",       # Deep and resonant male voice
        "Nova": "nova",       # Energetic and bright female voice
        "Sage": "sage",       # Measured and contemplative voice
        "Shimmer": "shimmer", # Bright and optimistic voice
        "Verse": "verse"      # Melodic and rhythmic voice
    }

    def __init__(self, timeout: int = 20, proxies: dict = None):
        """Initializes the OpenAI.fm TTS client.

        Args:
            timeout: Per-request timeout passed to ``requests``.
            proxies: Optional proxy mapping merged into the session.
        """
        super().__init__()
        self.api_url = "https://www.openai.fm/api/generate"
        self.session = requests.Session()
        self.session.headers.update(self.headers)
        if proxies:
            self.session.proxies.update(proxies)
        self.timeout = timeout

    def tts(self, text: str, voice: str = "Coral", instructions: str = None, verbose: bool = True) -> str:
        """
        Converts text to speech using the OpenAI.fm API and saves it to a file.

        Args:
            text (str): The text to convert to speech
            voice (str): The voice to use for TTS (default: "Coral")
            instructions (str): Voice instructions/prompt (default: "A cheerful guide. Friendly, clear, and reassuring.")
            verbose (bool): Whether to print debug information (default: True)

        Returns:
            str: Path to the generated audio file

        Raises:
            ValueError: If ``text`` is empty, not a string, or longer than 10000 characters.
            AssertionError: If ``voice`` is not a key of ``all_voices``.
            exceptions.FailedToGenerateResponseError: If there is an error generating or saving the audio.
        """
        # Validate input parameters
        if not text or not isinstance(text, str):
            raise ValueError("Text input must be a non-empty string")
        if len(text) > 10000:  # Add reasonable length limit
            raise ValueError("Text input exceeds maximum allowed length")

        # Raised explicitly (instead of ``assert``) so the check also runs
        # under ``python -O`` while callers still see an AssertionError.
        if voice not in self.all_voices:
            raise AssertionError(
                f"Voice '{voice}' not one of [{', '.join(self.all_voices.keys())}]"
            )

        voice_id = self.all_voices[voice]

        if instructions is None:
            instructions = "A cheerful guide. Friendly, clear, and reassuring."

        # Prepare parameters for the API request
        params = {
            "input": text,
            "prompt": instructions,
            "voice": voice_id
        }

        filename = None
        try:
            # Make the API request
            response = self.session.get(
                self.api_url,
                params=params,
                timeout=self.timeout
            )
            response.raise_for_status()

            # Create the output file only once audio is available, so a failed
            # request does not leave an empty temp file behind.
            with tempfile.NamedTemporaryFile(suffix=".mp3", dir=self.temp_dir, delete=False) as temp_file:
                filename = pathlib.Path(temp_file.name)
                temp_file.write(response.content)

        except (requests.exceptions.RequestException, OSError) as e:
            # Remove a partially written file before reporting the failure
            if filename is not None:
                filename.unlink(missing_ok=True)
            if verbose:
                print(f"[debug] Failed to perform the operation: {e}")
            raise exceptions.FailedToGenerateResponseError(
                f"Failed to perform the operation: {e}"
            ) from e

        if verbose:
            print(f"[debug] Audio saved to {filename}")

        return filename.as_posix()
|
|
122
|
+
if __name__ == "__main__":
    # Manual smoke test: generate one short clip and report where it was saved.
    client = OpenAIFMTTS()
    try:
        audio_file = client.tts(
            "Hello, this is a test.",
            instructions="A cheerful guide. Friendly, clear, and reassuring.",
            voice="Coral",
        )
    except exceptions.FailedToGenerateResponseError as e:
        print(f"Error: {e}")
    else:
        print(f"Audio file generated: {audio_file}")
|