typecast-python 0.3.3__tar.gz → 0.3.4__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {typecast_python-0.3.3 → typecast_python-0.3.4}/PKG-INFO +1 -1
- {typecast_python-0.3.3 → typecast_python-0.3.4}/pyproject.toml +1 -1
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/async_client.py +38 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/client.py +64 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/models/tts.py +15 -3
- {typecast_python-0.3.3 → typecast_python-0.3.4}/.gitignore +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/LICENSE +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/README.md +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/__init__.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/_voice_clone.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/conf.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/exceptions.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/models/__init__.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/models/error.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/models/subscription.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/models/voices.py +0 -0
- {typecast_python-0.3.3 → typecast_python-0.3.4}/src/typecast/utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: typecast-python
|
|
3
|
-
Version: 0.3.
|
|
3
|
+
Version: 0.3.4
|
|
4
4
|
Summary: Official Typecast Python SDK - Convert text to lifelike speech using AI-powered voices
|
|
5
5
|
Project-URL: Homepage, https://typecast.ai
|
|
6
6
|
Project-URL: Documentation, https://typecast.ai/docs/overview
|
|
@@ -4,7 +4,7 @@ build-backend = "hatchling.build"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "typecast-python"
|
|
7
|
-
version = "0.3.
|
|
7
|
+
version = "0.3.4"
|
|
8
8
|
description = "Official Typecast Python SDK - Convert text to lifelike speech using AI-powered voices"
|
|
9
9
|
authors = [
|
|
10
10
|
{name = "Neosapience", email = "help@typecast.ai"}
|
|
@@ -1,3 +1,4 @@
|
|
|
1
|
+
import asyncio
|
|
1
2
|
from pathlib import Path
|
|
2
3
|
from typing import AsyncIterator, BinaryIO, Optional, Union
|
|
3
4
|
from urllib.parse import quote
|
|
@@ -11,6 +12,8 @@ from ._voice_clone import (
|
|
|
11
12
|
validate_custom_voice_id,
|
|
12
13
|
)
|
|
13
14
|
from .client import _guess_audio_mime
|
|
15
|
+
from .client import _output_with_inferred_format
|
|
16
|
+
from .client import _validate_output_path
|
|
14
17
|
from .exceptions import (
|
|
15
18
|
BadRequestError,
|
|
16
19
|
InternalServerError,
|
|
@@ -23,8 +26,11 @@ from .exceptions import (
|
|
|
23
26
|
)
|
|
24
27
|
from .models import (
|
|
25
28
|
CustomVoice,
|
|
29
|
+
LanguageCode,
|
|
30
|
+
Output,
|
|
26
31
|
SubscriptionResponse,
|
|
27
32
|
TTSModel,
|
|
33
|
+
TTSPrompt,
|
|
28
34
|
TTSRequest,
|
|
29
35
|
TTSRequestStream,
|
|
30
36
|
TTSRequestWithTimestamps,
|
|
@@ -141,6 +147,38 @@ class AsyncTypecast:
|
|
|
141
147
|
format=response.headers.get("Content-Type", "audio/wav").split("/")[-1],
|
|
142
148
|
)
|
|
143
149
|
|
|
150
|
+
async def generate_to_file(
|
|
151
|
+
self,
|
|
152
|
+
path: Union[str, Path],
|
|
153
|
+
*,
|
|
154
|
+
text: str,
|
|
155
|
+
voice_id: str,
|
|
156
|
+
model: TTSModel = TTSModel.SSFM_V30,
|
|
157
|
+
language: Optional[Union[LanguageCode, str]] = None,
|
|
158
|
+
prompt: Optional[TTSPrompt] = None,
|
|
159
|
+
output: Optional[Output] = None,
|
|
160
|
+
seed: Optional[int] = None,
|
|
161
|
+
) -> TTSResponse:
|
|
162
|
+
"""Convert text to speech and write the audio bytes to a file.
|
|
163
|
+
|
|
164
|
+
Browse available API voices at
|
|
165
|
+
``https://typecast.ai/developers/api/voices``.
|
|
166
|
+
"""
|
|
167
|
+
output_path = _validate_output_path(path)
|
|
168
|
+
response = await self.text_to_speech(
|
|
169
|
+
TTSRequest(
|
|
170
|
+
text=text,
|
|
171
|
+
voice_id=voice_id,
|
|
172
|
+
model=model,
|
|
173
|
+
language=language,
|
|
174
|
+
prompt=prompt,
|
|
175
|
+
output=_output_with_inferred_format(output, path),
|
|
176
|
+
seed=seed,
|
|
177
|
+
)
|
|
178
|
+
)
|
|
179
|
+
await asyncio.to_thread(output_path.write_bytes, response.audio_data)
|
|
180
|
+
return response
|
|
181
|
+
|
|
144
182
|
async def text_to_speech_stream(
|
|
145
183
|
self, request: TTSRequestStream, chunk_size: int = 8192
|
|
146
184
|
) -> AsyncIterator[bytes]:
|
|
@@ -22,8 +22,11 @@ from .exceptions import (
|
|
|
22
22
|
)
|
|
23
23
|
from .models import (
|
|
24
24
|
CustomVoice,
|
|
25
|
+
LanguageCode,
|
|
26
|
+
Output,
|
|
25
27
|
SubscriptionResponse,
|
|
26
28
|
TTSModel,
|
|
29
|
+
TTSPrompt,
|
|
27
30
|
TTSRequest,
|
|
28
31
|
TTSRequestStream,
|
|
29
32
|
TTSRequestWithTimestamps,
|
|
@@ -35,6 +38,33 @@ from .models import (
|
|
|
35
38
|
)
|
|
36
39
|
|
|
37
40
|
|
|
41
|
+
def _infer_audio_format_from_path(path: Union[str, Path]) -> Optional[str]:
|
|
42
|
+
suffix = Path(path).suffix.lower()
|
|
43
|
+
if suffix == ".mp3":
|
|
44
|
+
return "mp3"
|
|
45
|
+
if suffix == ".wav":
|
|
46
|
+
return "wav"
|
|
47
|
+
return None
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
def _output_with_inferred_format(
|
|
51
|
+
output: Optional[Output],
|
|
52
|
+
path: Union[str, Path],
|
|
53
|
+
) -> Optional[Output]:
|
|
54
|
+
audio_format = _infer_audio_format_from_path(path)
|
|
55
|
+
if audio_format is None or (output is not None and output.audio_format is not None):
|
|
56
|
+
return output
|
|
57
|
+
if output is None:
|
|
58
|
+
return Output(audio_format=audio_format)
|
|
59
|
+
return output.model_copy(update={"audio_format": audio_format})
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
def _validate_output_path(path: Union[str, Path]) -> Path:
|
|
63
|
+
if isinstance(path, str) and not path.strip():
|
|
64
|
+
raise ValueError("path cannot be empty")
|
|
65
|
+
return Path(path)
|
|
66
|
+
|
|
67
|
+
|
|
38
68
|
def _guess_audio_mime(filename: str) -> str:
|
|
39
69
|
"""Guess audio MIME type from filename extension; fall back to octet-stream."""
|
|
40
70
|
lower = filename.lower()
|
|
@@ -136,6 +166,40 @@ class Typecast:
|
|
|
136
166
|
format=response.headers.get("Content-Type", "audio/wav").split("/")[-1],
|
|
137
167
|
)
|
|
138
168
|
|
|
169
|
+
def generate_to_file(
|
|
170
|
+
self,
|
|
171
|
+
path: Union[str, Path],
|
|
172
|
+
*,
|
|
173
|
+
text: str,
|
|
174
|
+
voice_id: str,
|
|
175
|
+
model: TTSModel = TTSModel.SSFM_V30,
|
|
176
|
+
language: Optional[Union[LanguageCode, str]] = None,
|
|
177
|
+
prompt: Optional[TTSPrompt] = None,
|
|
178
|
+
output: Optional[Output] = None,
|
|
179
|
+
seed: Optional[int] = None,
|
|
180
|
+
) -> TTSResponse:
|
|
181
|
+
"""Convert text to speech and write the audio bytes to a file.
|
|
182
|
+
|
|
183
|
+
``model`` defaults to ``ssfm-v30``. If ``output.audio_format`` is not
|
|
184
|
+
set, the format is inferred from a ``.mp3`` or ``.wav`` extension.
|
|
185
|
+
Browse available API voices at
|
|
186
|
+
``https://typecast.ai/developers/api/voices``.
|
|
187
|
+
"""
|
|
188
|
+
output_path = _validate_output_path(path)
|
|
189
|
+
response = self.text_to_speech(
|
|
190
|
+
TTSRequest(
|
|
191
|
+
text=text,
|
|
192
|
+
voice_id=voice_id,
|
|
193
|
+
model=model,
|
|
194
|
+
language=language,
|
|
195
|
+
prompt=prompt,
|
|
196
|
+
output=_output_with_inferred_format(output, path),
|
|
197
|
+
seed=seed,
|
|
198
|
+
)
|
|
199
|
+
)
|
|
200
|
+
output_path.write_bytes(response.audio_data)
|
|
201
|
+
return response
|
|
202
|
+
|
|
139
203
|
def text_to_speech_stream(
|
|
140
204
|
self, request: TTSRequestStream, chunk_size: int = 8192
|
|
141
205
|
) -> Iterator[bytes]:
|
|
@@ -158,7 +158,11 @@ class TTSRequest(BaseModel):
|
|
|
158
158
|
model_config = ConfigDict(json_schema_extra={"exclude_none": True})
|
|
159
159
|
|
|
160
160
|
voice_id: str = Field(
|
|
161
|
-
description=
|
|
161
|
+
description=(
|
|
162
|
+
"Voice ID. Browse available API voices at "
|
|
163
|
+
"https://typecast.ai/developers/api/voices."
|
|
164
|
+
),
|
|
165
|
+
examples=["tc_62a8975e695ad26f7fb514d1"],
|
|
162
166
|
)
|
|
163
167
|
text: str = Field(description="Text", examples=["Hello. How are you?"])
|
|
164
168
|
model: TTSModel = Field(description="Voice model name", examples=["ssfm-v21"])
|
|
@@ -202,7 +206,11 @@ class TTSRequestStream(BaseModel):
|
|
|
202
206
|
model_config = ConfigDict(json_schema_extra={"exclude_none": True})
|
|
203
207
|
|
|
204
208
|
voice_id: str = Field(
|
|
205
|
-
description=
|
|
209
|
+
description=(
|
|
210
|
+
"Voice ID. Browse available API voices at "
|
|
211
|
+
"https://typecast.ai/developers/api/voices."
|
|
212
|
+
),
|
|
213
|
+
examples=["tc_62a8975e695ad26f7fb514d1"],
|
|
206
214
|
)
|
|
207
215
|
text: str = Field(description="Text", examples=["Hello. How are you?"])
|
|
208
216
|
model: TTSModel = Field(description="Voice model name", examples=["ssfm-v21"])
|
|
@@ -253,7 +261,11 @@ class TTSRequestWithTimestamps(BaseModel):
|
|
|
253
261
|
model_config = ConfigDict(json_schema_extra={"exclude_none": True})
|
|
254
262
|
|
|
255
263
|
voice_id: str = Field(
|
|
256
|
-
description=
|
|
264
|
+
description=(
|
|
265
|
+
"Voice ID. Browse available API voices at "
|
|
266
|
+
"https://typecast.ai/developers/api/voices."
|
|
267
|
+
),
|
|
268
|
+
examples=["tc_62a8975e695ad26f7fb514d1"],
|
|
257
269
|
)
|
|
258
270
|
text: str = Field(description="Text", examples=["Hello. How are you?"])
|
|
259
271
|
model: TTSModel = Field(description="Voice model name", examples=["ssfm-v30"])
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|