PyPI - cartesia - Versions diffs - 2.0.2__py3-none-any.whl → 2.0.3__py3-none-any.whl - Mend

cartesia 2.0.2__py3-none-any.whl → 2.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

cartesia/__init__.py +2 -0
cartesia/core/client_wrapper.py +1 -1
cartesia/tts/__init__.py +2 -0
cartesia/tts/client.py +13 -32
cartesia/tts/requests/generation_request.py +2 -9
cartesia/tts/requests/tts_request.py +2 -8
cartesia/tts/requests/web_socket_tts_request.py +2 -1
cartesia/tts/types/__init__.py +2 -0
cartesia/tts/types/generation_request.py +2 -9
cartesia/tts/types/model_speed.py +5 -0
cartesia/tts/types/tts_request.py +2 -8
cartesia/tts/types/web_socket_tts_request.py +2 -1
cartesia/voices/client.py +11 -13
{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/METADATA +1 -1
{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/RECORD +16 -15
{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/WHEEL +0 -0

cartesia/__init__.py CHANGED Viewed

@@ -29,6 +29,7 @@ from .tts import (
     FlushId,
     GenerationRequest,
     GenerationRequestParams,
+    ModelSpeed,
     Mp3OutputFormat,
     Mp3OutputFormatParams,
     NaturalSpecifier,
@@ -201,6 +202,7 @@ __all__ = [
     "MixVoiceSpecifierParams",
     "MixVoicesRequest",
     "MixVoicesRequestParams",
+    "ModelSpeed",
     "Mp3OutputFormat",
     "Mp3OutputFormatParams",
     "NaturalSpecifier",

cartesia/core/client_wrapper.py CHANGED Viewed

@@ -16,7 +16,7 @@ class BaseClientWrapper:
         headers: typing.Dict[str, str] = {
             "X-Fern-Language": "Python",
             "X-Fern-SDK-Name": "cartesia",
-            "X-Fern-SDK-Version": "2.0.2",
+            "X-Fern-SDK-Version": "2.0.3",
         }
         headers["X-API-Key"] = self.api_key
         headers["Cartesia-Version"] = "2024-11-13"

cartesia/tts/__init__.py CHANGED Viewed

@@ -7,6 +7,7 @@ from .types import (
     Emotion,
     FlushId,
     GenerationRequest,
+    ModelSpeed,
     Mp3OutputFormat,
     NaturalSpecifier,
     NumericalSpecifier,
@@ -94,6 +95,7 @@ __all__ = [
     "FlushId",
     "GenerationRequest",
     "GenerationRequestParams",
+    "ModelSpeed",
     "Mp3OutputFormat",
     "Mp3OutputFormatParams",
     "NaturalSpecifier",

cartesia/tts/client.py CHANGED Viewed

@@ -5,6 +5,7 @@ from ..core.client_wrapper import SyncClientWrapper
 from .requests.tts_request_voice_specifier import TtsRequestVoiceSpecifierParams
 from .requests.output_format import OutputFormatParams
 from .types.supported_language import SupportedLanguage
+from .types.model_speed import ModelSpeed
 from ..core.request_options import RequestOptions
 from ..core.serialization import convert_and_respect_annotation_metadata
 from json.decoder import JSONDecodeError
@@ -32,7 +33,7 @@ class TtsClient:
         output_format: OutputFormatParams,
         language: typing.Optional[SupportedLanguage] = OMIT,
         duration: typing.Optional[float] = OMIT,
-        text_cfg: typing.Optional[float] = OMIT,
+        speed: typing.Optional[ModelSpeed] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.Iterator[bytes]:
         """
@@ -53,12 +54,7 @@ class TtsClient:
             The maximum duration of the audio in seconds. You do not usually need to specify this.
             If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
-        text_cfg : typing.Optional[float]
-            The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-            Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-            This parameter is only supported for `sonic-2` models.
+        speed : typing.Optional[ModelSpeed]
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration. You can pass in configuration such as `chunk_size`, and more to customize the request and response.
@@ -100,7 +96,7 @@ class TtsClient:
                     object_=output_format, annotation=OutputFormatParams, direction="write"
                 ),
                 "duration": duration,
-                "text_cfg": text_cfg,
+                "speed": speed,
             },
             request_options=request_options,
             omit=OMIT,
@@ -126,7 +122,7 @@ class TtsClient:
         output_format: OutputFormatParams,
         language: typing.Optional[SupportedLanguage] = OMIT,
         duration: typing.Optional[float] = OMIT,
-        text_cfg: typing.Optional[float] = OMIT,
+        speed: typing.Optional[ModelSpeed] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.Iterator[WebSocketResponse]:
         """
@@ -147,12 +143,7 @@ class TtsClient:
             The maximum duration of the audio in seconds. You do not usually need to specify this.
             If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
-        text_cfg : typing.Optional[float]
-            The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-            Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-            This parameter is only supported for `sonic-2` models.
+        speed : typing.Optional[ModelSpeed]
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -196,7 +187,7 @@ class TtsClient:
                     object_=output_format, annotation=OutputFormatParams, direction="write"
                 ),
                 "duration": duration,
-                "text_cfg": text_cfg,
+                "speed": speed,
             },
             request_options=request_options,
             omit=OMIT,
@@ -236,7 +227,7 @@ class AsyncTtsClient:
         output_format: OutputFormatParams,
         language: typing.Optional[SupportedLanguage] = OMIT,
         duration: typing.Optional[float] = OMIT,
-        text_cfg: typing.Optional[float] = OMIT,
+        speed: typing.Optional[ModelSpeed] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.AsyncIterator[bytes]:
         """
@@ -257,12 +248,7 @@ class AsyncTtsClient:
             The maximum duration of the audio in seconds. You do not usually need to specify this.
             If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
-        text_cfg : typing.Optional[float]
-            The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-            Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-            This parameter is only supported for `sonic-2` models.
+        speed : typing.Optional[ModelSpeed]
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration. You can pass in configuration such as `chunk_size`, and more to customize the request and response.
@@ -312,7 +298,7 @@ class AsyncTtsClient:
                     object_=output_format, annotation=OutputFormatParams, direction="write"
                 ),
                 "duration": duration,
-                "text_cfg": text_cfg,
+                "speed": speed,
             },
             request_options=request_options,
             omit=OMIT,
@@ -338,7 +324,7 @@ class AsyncTtsClient:
         output_format: OutputFormatParams,
         language: typing.Optional[SupportedLanguage] = OMIT,
         duration: typing.Optional[float] = OMIT,
-        text_cfg: typing.Optional[float] = OMIT,
+        speed: typing.Optional[ModelSpeed] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> typing.AsyncIterator[WebSocketResponse]:
         """
@@ -359,12 +345,7 @@ class AsyncTtsClient:
             The maximum duration of the audio in seconds. You do not usually need to specify this.
             If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
-        text_cfg : typing.Optional[float]
-            The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-            Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-            This parameter is only supported for `sonic-2` models.
+        speed : typing.Optional[ModelSpeed]
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
@@ -416,7 +397,7 @@ class AsyncTtsClient:
                     object_=output_format, annotation=OutputFormatParams, direction="write"
                 ),
                 "duration": duration,
-                "text_cfg": text_cfg,
+                "speed": speed,
             },
             request_options=request_options,
             omit=OMIT,

cartesia/tts/requests/generation_request.py CHANGED Viewed

@@ -6,6 +6,7 @@ from .tts_request_voice_specifier import TtsRequestVoiceSpecifierParams
 import typing_extensions
 from ..types.supported_language import SupportedLanguage
 from .web_socket_raw_output_format import WebSocketRawOutputFormatParams
+from ..types.model_speed import ModelSpeed
 from ..types.context_id import ContextId
 from ...core.serialization import FieldMetadata
@@ -30,15 +31,7 @@ class GenerationRequestParams(typing_extensions.TypedDict):
     If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
     """
-    text_cfg: typing_extensions.NotRequired[float]
-    """
-    The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-    Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-    This parameter is only supported for `sonic-2` models.
-    """
+    speed: typing_extensions.NotRequired[ModelSpeed]
     context_id: typing_extensions.NotRequired[ContextId]
     continue_: typing_extensions.NotRequired[typing_extensions.Annotated[bool, FieldMetadata(alias="continue")]]
     """

cartesia/tts/requests/tts_request.py CHANGED Viewed

@@ -5,6 +5,7 @@ from .tts_request_voice_specifier import TtsRequestVoiceSpecifierParams
 import typing_extensions
 from ..types.supported_language import SupportedLanguage
 from .output_format import OutputFormatParams
+from ..types.model_speed import ModelSpeed
 class TtsRequestParams(typing_extensions.TypedDict):
@@ -23,11 +24,4 @@ class TtsRequestParams(typing_extensions.TypedDict):
     If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
     """
-    text_cfg: typing_extensions.NotRequired[float]
-    """
-    The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-    Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-    This parameter is only supported for `sonic-2` models.
-    """
+    speed: typing_extensions.NotRequired[ModelSpeed]

cartesia/tts/requests/web_socket_tts_request.py CHANGED Viewed

@@ -5,6 +5,7 @@ import typing_extensions
 from .output_format import OutputFormatParams
 from .tts_request_voice_specifier import TtsRequestVoiceSpecifierParams
 from ...core.serialization import FieldMetadata
+from ..types.model_speed import ModelSpeed
 class WebSocketTtsRequestParams(typing_extensions.TypedDict):
@@ -24,4 +25,4 @@ class WebSocketTtsRequestParams(typing_extensions.TypedDict):
     continue_: typing_extensions.NotRequired[typing_extensions.Annotated[bool, FieldMetadata(alias="continue")]]
     context_id: typing_extensions.NotRequired[str]
     max_buffer_delay_ms: typing_extensions.NotRequired[int]
-    text_cfg: typing_extensions.NotRequired[float]
+    speed: typing_extensions.NotRequired[ModelSpeed]

cartesia/tts/types/__init__.py CHANGED Viewed

@@ -6,6 +6,7 @@ from .controls import Controls
 from .emotion import Emotion
 from .flush_id import FlushId
 from .generation_request import GenerationRequest
+from .model_speed import ModelSpeed
 from .mp_3_output_format import Mp3OutputFormat
 from .natural_specifier import NaturalSpecifier
 from .numerical_specifier import NumericalSpecifier
@@ -50,6 +51,7 @@ __all__ = [
     "Emotion",
     "FlushId",
     "GenerationRequest",
+    "ModelSpeed",
     "Mp3OutputFormat",
     "NaturalSpecifier",
     "NumericalSpecifier",

cartesia/tts/types/generation_request.py CHANGED Viewed

@@ -6,6 +6,7 @@ import typing
 from .tts_request_voice_specifier import TtsRequestVoiceSpecifier
 from .supported_language import SupportedLanguage
 from .web_socket_raw_output_format import WebSocketRawOutputFormat
+from .model_speed import ModelSpeed
 from .context_id import ContextId
 import typing_extensions
 from ...core.serialization import FieldMetadata
@@ -32,15 +33,7 @@ class GenerationRequest(UniversalBaseModel):
     If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
     """
-    text_cfg: typing.Optional[float] = pydantic.Field(default=None)
-    """
-    The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-    Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-    This parameter is only supported for `sonic-2` models.
-    """
+    speed: typing.Optional[ModelSpeed] = None
     context_id: typing.Optional[ContextId] = None
     continue_: typing_extensions.Annotated[typing.Optional[bool], FieldMetadata(alias="continue")] = pydantic.Field(
         default=None

cartesia/tts/types/model_speed.py ADDED Viewed

@@ -0,0 +1,5 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+ModelSpeed = typing.Union[typing.Literal["slow", "normal", "fast"], typing.Any]

cartesia/tts/types/tts_request.py CHANGED Viewed

@@ -6,6 +6,7 @@ from .tts_request_voice_specifier import TtsRequestVoiceSpecifier
 import typing
 from .supported_language import SupportedLanguage
 from .output_format import OutputFormat
+from .model_speed import ModelSpeed
 from ...core.pydantic_utilities import IS_PYDANTIC_V2
@@ -25,14 +26,7 @@ class TtsRequest(UniversalBaseModel):
     If the duration is not appropriate for the length of the transcript, the output audio may be truncated.
     """
-    text_cfg: typing.Optional[float] = pydantic.Field(default=None)
-    """
-    The text [classifier-free guidance](https://arxiv.org/abs/2207.12598) value for the request.
-    Higher values causes the model to attend more to the text but speed up the generation. Lower values reduce the speaking rate but can increase the risk of hallucinations. The default value is `3.0`. For a slower speaking rate, we recommend values between `2.0` and `3.0`. Values are supported between `1.5` and `3.0`.
-    This parameter is only supported for `sonic-2` models.
-    """
+    speed: typing.Optional[ModelSpeed] = None
     if IS_PYDANTIC_V2:
         model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2

cartesia/tts/types/web_socket_tts_request.py CHANGED Viewed

@@ -7,6 +7,7 @@ from .output_format import OutputFormat
 from .tts_request_voice_specifier import TtsRequestVoiceSpecifier
 import typing_extensions
 from ...core.serialization import FieldMetadata
+from .model_speed import ModelSpeed
 from ...core.pydantic_utilities import IS_PYDANTIC_V2
@@ -27,7 +28,7 @@ class WebSocketTtsRequest(UniversalBaseModel):
     continue_: typing_extensions.Annotated[typing.Optional[bool], FieldMetadata(alias="continue")] = None
     context_id: typing.Optional[str] = None
     max_buffer_delay_ms: typing.Optional[int] = None
-    text_cfg: typing.Optional[float] = None
+    speed: typing.Optional[ModelSpeed] = None
     if IS_PYDANTIC_V2:
         model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2

cartesia/voices/client.py CHANGED Viewed

@@ -14,8 +14,8 @@ from ..core.api_error import ApiError
 from .. import core
 from ..tts.types.supported_language import SupportedLanguage
 from .types.clone_mode import CloneMode
-from .types.voice_metadata import VoiceMetadata
 from .types.voice_id import VoiceId
+from .types.voice_metadata import VoiceMetadata
 from ..core.jsonable_encoder import jsonable_encoder
 from .types.localize_target_language import LocalizeTargetLanguage
 from .types.gender import Gender
@@ -150,7 +150,7 @@ class VoicesClient:
         mode: CloneMode,
         description: typing.Optional[str] = OMIT,
         enhance: typing.Optional[bool] = OMIT,
-        transcript: typing.Optional[str] = OMIT,
+        base_voice_id: typing.Optional[VoiceId] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> VoiceMetadata:
         """
@@ -182,11 +182,11 @@ class VoicesClient:
         enhance : typing.Optional[bool]
-            Whether to enhance the clip to improve its quality before cloning. Useful if the clip has background noise.
+            Whether to apply AI enhancements to the clip to reduce background noise. This leads to cleaner generated speech at the cost of reduced similarity to the source clip.
-        transcript : typing.Optional[str]
-            Optional transcript of the words spoken in the audio clip. Only used for similarity mode.
+        base_voice_id : typing.Optional[VoiceId]
+            Optional base voice ID that the cloned voice is derived from.
         request_options : typing.Optional[RequestOptions]
@@ -208,7 +208,6 @@ class VoicesClient:
             description="Copied from Cartesia docs",
             mode="stability",
             language="en",
-            enhance=True,
         )
         """
         _response = self._client_wrapper.httpx_client.request(
@@ -220,7 +219,7 @@ class VoicesClient:
                 "language": language,
                 "mode": mode,
                 "enhance": enhance,
-                "transcript": transcript,
+                "base_voice_id": base_voice_id,
             },
             files={
                 "clip": clip,
@@ -719,7 +718,7 @@ class AsyncVoicesClient:
         mode: CloneMode,
         description: typing.Optional[str] = OMIT,
         enhance: typing.Optional[bool] = OMIT,
-        transcript: typing.Optional[str] = OMIT,
+        base_voice_id: typing.Optional[VoiceId] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> VoiceMetadata:
         """
@@ -751,11 +750,11 @@ class AsyncVoicesClient:
         enhance : typing.Optional[bool]
-            Whether to enhance the clip to improve its quality before cloning. Useful if the clip has background noise.
+            Whether to apply AI enhancements to the clip to reduce background noise. This leads to cleaner generated speech at the cost of reduced similarity to the source clip.
-        transcript : typing.Optional[str]
-            Optional transcript of the words spoken in the audio clip. Only used for similarity mode.
+        base_voice_id : typing.Optional[VoiceId]
+            Optional base voice ID that the cloned voice is derived from.
         request_options : typing.Optional[RequestOptions]
@@ -782,7 +781,6 @@ class AsyncVoicesClient:
                 description="Copied from Cartesia docs",
                 mode="stability",
                 language="en",
-                enhance=True,
             )
@@ -797,7 +795,7 @@ class AsyncVoicesClient:
                 "language": language,
                 "mode": mode,
                 "enhance": enhance,
-                "transcript": transcript,
+                "base_voice_id": base_voice_id,
             },
             files={
                 "clip": clip,

{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cartesia
-Version: 2.0.2
+Version: 2.0.3
 Summary:
 Requires-Python: >=3.8,<4.0
 Classifier: Intended Audience :: Developers

{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/RECORD RENAMED Viewed

@@ -1,4 +1,4 @@
-cartesia/__init__.py,sha256=wqKLSdaX3HebPUATK1p8tTcd5TMcLzvhJR2dNcEBKgo,8414
+cartesia/__init__.py,sha256=p9ilqR-oE6N6pPQbiKUbnfEdDy00ihjNTtg7ES7EHg0,8448
 cartesia/api_status/__init__.py,sha256=_dHNLdknrBjxHtU2PvLumttJM-JTQhJQqhhAQkLqt_U,168
 cartesia/api_status/client.py,sha256=GJ9Dq8iCn3hn8vCIqc6k1fCGEhSz0T0kaPGcdFnbMDY,3146
 cartesia/api_status/requests/__init__.py,sha256=ilEMzEy1JEw484CuL92bX5lHGOznc62pjiDMgiZ0tKM,130
@@ -19,7 +19,7 @@ cartesia/base_client.py,sha256=YH0l0UUzanAa9mDdJU6BFQ9XKELiaPTm9NsJpVQ4evA,6539
 cartesia/client.py,sha256=sPAYQLt9W2E_2F17ooocvvJImuNyLrL8xUypgf6dZeI,6238
 cartesia/core/__init__.py,sha256=-t9txgeQZL_1FDw_08GEoj4ft1Cn9Dti6X0Drsadlr0,1519
 cartesia/core/api_error.py,sha256=RE8LELok2QCjABadECTvtDp7qejA1VmINCh6TbqPwSE,426
-cartesia/core/client_wrapper.py,sha256=RLjY6z-CDfSO5WPCxechq__-Xhikk8_gn3-HAdFFXiE,1854
+cartesia/core/client_wrapper.py,sha256=xKyHqaGJ7V2OuMGkVOEjxofnt8QaFjgiEIom7EWhBBI,1854
 cartesia/core/datetime_utils.py,sha256=nBys2IsYrhPdszxGKCNRPSOCwa-5DWOHG95FB8G9PKo,1047
 cartesia/core/file.py,sha256=d4NNbX8XvXP32z8KpK2Xovv33nFfruIrpz0QWxlgpZk,2663
 cartesia/core/http_client.py,sha256=KL5RGa0y4n8nX0-07WRg4ZQUTq30sc-XJbWcP5vjBDg,19552
@@ -51,20 +51,20 @@ cartesia/environment.py,sha256=Qnp91BGLic7hXmKsiYub2m3nPfvDWm59aB1wWta1J6A,160
 cartesia/infill/__init__.py,sha256=FTtvy8EDg9nNNg9WCatVgKTRYV8-_v1roeGPAKoa_pw,65
 cartesia/infill/client.py,sha256=PWE5Ak-wsaBM_8g52oDl9PYx76PkW6f900mnxvZf4Bk,12571
 cartesia/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-cartesia/tts/__init__.py,sha256=G0wcYlPrr7hmu5DQgCG7bDTQq36fpP3iBM5164Z0-Js,4701
+cartesia/tts/__init__.py,sha256=YrVxJT7i-0wygFgN2hOVftYLEM7JoFgCo3SvLoN7pkA,4735
 cartesia/tts/_async_websocket.py,sha256=tJ-6rdJrviKvGhSW8J8t-rCinXM5gXXQJgDO8OgW3EE,18805
 cartesia/tts/_websocket.py,sha256=Uk6B-TP-0nzeyFE9w-_PzNIiVYP14rKqSDZlm6bU24Q,19271
-cartesia/tts/client.py,sha256=oZZDSb9XVVvON4ng5tdL3NeVIMhfUdLs1qSHQ_HBtQw,17376
+cartesia/tts/client.py,sha256=0jWpiNKPp4QbyibfB2tsFb7wqQ9vb4m_QlLB-qxzKP8,15398
 cartesia/tts/requests/__init__.py,sha256=0rcfMLHNbUhkRI1xS09UE4p-WT1BCqrcblFtPxcATOI,3261
 cartesia/tts/requests/cancel_context_request.py,sha256=Wl8g-o5vwl9ENm-H1wsLx441FkIR_4Wt5UYtuWce2Yw,431
 cartesia/tts/requests/controls.py,sha256=xzUJlfgqhaJ1A-JD0LTpoHYk4iEpCuGpSD7qE4YYsRg,285
-cartesia/tts/requests/generation_request.py,sha256=oGCBfIVXc6SvKV5IDdadHvqBT5qLAZLhz_CBVtKfV2Y,3202
+cartesia/tts/requests/generation_request.py,sha256=cUy--5WFsC7E-KEPVay3QpU_-a3GVGnatTKsBw6hIV4,2743
 cartesia/tts/requests/mp_3_output_format.py,sha256=PGDVzC1d7-Jce12rFxtF8G1pTHmlUdiGAhykFTABg0w,316
 cartesia/tts/requests/output_format.py,sha256=8TKu9AAeHCR5L4edzYch8FIYIldn4bM7ySrsCl8W_g8,842
 cartesia/tts/requests/phoneme_timestamps.py,sha256=ft81nmqElZAnvTBT27lY6YWfF18ZGsCx3Y1XHv9J7cM,267
 cartesia/tts/requests/raw_output_format.py,sha256=S60Vp7DeAATCMLF3bXgxhw0zILJBWJ9GhI9irAg_UkI,316
 cartesia/tts/requests/speed.py,sha256=-YGBWwh7_VtCBnYlT5EVsnrmcHFMEBTxy9LathZhkMA,259
-cartesia/tts/requests/tts_request.py,sha256=VqBtdNF6JFcBh392e6tyONCexvJZMUyKpamv03hjTjA,1479
+cartesia/tts/requests/tts_request.py,sha256=KBoahYfPbDENlEWsqnR4z1ZIhGIJwhLrzQIzkbtqtzE,1021
 cartesia/tts/requests/tts_request_embedding_specifier.py,sha256=-M54ZjV0H5LPwcKtz0bOVqlkvO1pPiMbqMbVBMko3Ns,565
 cartesia/tts/requests/tts_request_id_specifier.py,sha256=-0ClfyJnnaH0uAcF5r84s3cM_cw2wT39dp6T4JYzOQ8,536
 cartesia/tts/requests/tts_request_voice_specifier.py,sha256=eGzL4aVGq4gKPxeglsV7-wuhxg8x33Qth3uFTTytgeI,337
@@ -81,16 +81,17 @@ cartesia/tts/requests/web_socket_response.py,sha256=WqZ6RgO4suG78wiVSIsOWwyXBioV
 cartesia/tts/requests/web_socket_stream_options.py,sha256=VIvblFw9hGZvDzFpOnC11G0NvrFSVt-1-0sY5rpcZPI,232
 cartesia/tts/requests/web_socket_timestamps_response.py,sha256=MK3zN2Q_PVWJtX5DidNB0uXoF2o33rv6qCYPVaourxY,351
 cartesia/tts/requests/web_socket_tts_output.py,sha256=pX2uf0XVdziFhXCydwLlVOWb-LvBiuq-cBI6R1INiMg,760
-cartesia/tts/requests/web_socket_tts_request.py,sha256=i6gwa4bvPPCnS2ZnSnu5FY1bjwjp76Kfi0eTb_atBlI,1215
+cartesia/tts/requests/web_socket_tts_request.py,sha256=RBFrdmYe0SRlzhEUwhTFCL8ZC1tbIwD2aFnUgF-my80,1260
 cartesia/tts/requests/word_timestamps.py,sha256=WMfBJtETi6wTpES0pYZCFfFRfEbzWE-RtosDJ5seUWg,261
 cartesia/tts/socket_client.py,sha256=zTPayHbgy-yQQ50AE1HXN4GMyanisZcLXf7Ds1paYks,11621
-cartesia/tts/types/__init__.py,sha256=yV_-DY9EPNAFEfuIk3wgRLcc4Ta5igv0T5g-IIQ53v0,3251
+cartesia/tts/types/__init__.py,sha256=44KWnBiqkNHZZpy8M5uze8cdEFE79sbMRVJStxQSEhM,3305
 cartesia/tts/types/cancel_context_request.py,sha256=zInhk3qRZsSc0F1aYJ-Q5BHJsosTrb22IJWhzue-eKE,856
 cartesia/tts/types/context_id.py,sha256=UCEtq5xFGOeBCECcY6Y-gYVe_Peg1hFhH9YYOkpApQg,81
 cartesia/tts/types/controls.py,sha256=H4CSu79mM1Ld4NZx_5uXw3EwRzTEMQRxKBRvFpcFb8Y,644
 cartesia/tts/types/emotion.py,sha256=zocyDcHTiFFnNRgo2YLMi70iGyffa080B4mkg9lcqVc,764
 cartesia/tts/types/flush_id.py,sha256=HCIKo9o8d7YWKtaSNU3TEvfUVBju93ckGQy01Z9wLcE,79
-cartesia/tts/types/generation_request.py,sha256=HfMLj_HOCeKy5p_yLcltvrJly9WNkzoNCxarwlLE7Nw,3732
+cartesia/tts/types/generation_request.py,sha256=H5ZaNGH2ngTZY-NQ7wqLUiIAArH8KFo3rt690bxWCUw,3242
+cartesia/tts/types/model_speed.py,sha256=iiTj8V0piFCX2FZh5B8EkgRhZDlj4z3VFcQhp66e7y8,160
 cartesia/tts/types/mp_3_output_format.py,sha256=0WGblkuDUL7pZO1aRuQ_mU2Z5gN9xIabRfRKkjtzms8,731
 cartesia/tts/types/natural_specifier.py,sha256=K526P1RRuBGy80hyd_tX8tohPrE8DR9EgTCxS5wce0o,188
 cartesia/tts/types/numerical_specifier.py,sha256=tJpIskWO545luCKMFM9JlVc7VVhBhSvqL1qurhzL9cI,92
@@ -100,7 +101,7 @@ cartesia/tts/types/raw_encoding.py,sha256=eyc2goiYOTxWcuKHAgYZ2SrnfePW22Fbmc-5fG
 cartesia/tts/types/raw_output_format.py,sha256=jZGVaS0KIi9mU6trfskgA3HbMKJolhrwICnuDhF01ic,673
 cartesia/tts/types/speed.py,sha256=4c5WdxocBw6WSMnundSaNnceUeooU0vikhy00FW6M-w,239
 cartesia/tts/types/supported_language.py,sha256=riDRduThMbMWAq9i2uCfxhwVTpgaFwNDZ9LhEIl4zHY,237
-cartesia/tts/types/tts_request.py,sha256=kUTOjNOZsZivSLbVvLA85EzPNsKCEOnY51NPfUmlDwM,1865
+cartesia/tts/types/tts_request.py,sha256=FGcxW-siiQpEzJZSHMET3nDSYHSzRt3WSTO-cCEz9u4,1376
 cartesia/tts/types/tts_request_embedding_specifier.py,sha256=eL_qCEr4pvWfy4qp9hZBuVdCincX5DBVqfv1vLt2_Vk,942
 cartesia/tts/types/tts_request_id_specifier.py,sha256=ktGdkkTRQ9scA-lt8qJ2jn_E5WzoOK8AXMrVqi71gf0,906
 cartesia/tts/types/tts_request_voice_specifier.py,sha256=p-3UQ62uFL1SgbX73Ex1D_V73Ef0wmT1ApOt1iLZmwE,307
@@ -117,7 +118,7 @@ cartesia/tts/types/web_socket_response.py,sha256=mHDECZ4K84QmN2s0IWuBsXBt83Yq7Qx
 cartesia/tts/types/web_socket_stream_options.py,sha256=MhDSxBFqMuQeWjoyPqXVnTEzLjF8g6aojeigb5dQUgU,596
 cartesia/tts/types/web_socket_timestamps_response.py,sha256=kuWXI82ncF1QapnaHEjwrL84qWob7ByQU-yh1e0IEmk,667
 cartesia/tts/types/web_socket_tts_output.py,sha256=uvkv0smTBhdm18Rl17C0Ml4Inh79YBHNzAcKnZBs14Y,979
-cartesia/tts/types/web_socket_tts_request.py,sha256=PzdIyFcj6V9MLwr4rpuh_H3NfEnzq0dHlEv-bKKeTR0,1529
+cartesia/tts/types/web_socket_tts_request.py,sha256=TlqUQPhqZcDZ6jgpzLqzJnYVGBIc9_TQYSu_SVYkVVk,1567
 cartesia/tts/types/word_timestamps.py,sha256=XZ2Q0prdb3F9c3AiOKXu4s3A3jBxE-qIt1npHOf16R0,631
 cartesia/tts/utils/constants.py,sha256=1CHa5flJf8--L_eYyOyOiWJNZ-Q81ufHZxDbJs8xYSk,418
 cartesia/tts/utils/tts.py,sha256=u7PgPxlJs6fcQTfr-jqAvBCAaK3JWLhF5QF4s-PwoMo,2093
@@ -131,7 +132,7 @@ cartesia/voice_changer/types/__init__.py,sha256=qAiHsdRpnFeS0lBkYp_NRrhSJiRXCg5-
 cartesia/voice_changer/types/output_format_container.py,sha256=RqLDELdgeOjYqNTJX1Le62qjiFiJGxf0cYnol88-LLM,166
 cartesia/voice_changer/types/streaming_response.py,sha256=rQ4ZehtOHsCBKijyULz_ahGQYNj1yus6AM6u2wgcBsI,1963
 cartesia/voices/__init__.py,sha256=2D58Bir45LvcvP08QMnPlFE8DD8BONTjPLkIDdKs7vg,1891
-cartesia/voices/client.py,sha256=B0T1YRjrAX7fssBw1hyq5qpQ2CCf-dC-E9F1-AvwvSs,38949
+cartesia/voices/client.py,sha256=A_PEoCLko1znexKKicp-gZVMUcSpDoKqz3p1r4Aa04k,38993
 cartesia/voices/requests/__init__.py,sha256=XiBJbSYeQCgFMtwywKvQ0Nmp7Zf_0WskzRhgr9c8h38,1072
 cartesia/voices/requests/create_voice_request.py,sha256=r6dKb9ga0ZsAi_6PXuE43u2lLgfQg2DIYjk2Neng7pI,617
 cartesia/voices/requests/embedding_response.py,sha256=PGZkBD8UBcv2MYQbBXyD4T6lzaE9oSGGwXx-MoXCp0M,228
@@ -170,6 +171,6 @@ cartesia/voices/types/voice_expand_options.py,sha256=e4FroWdlxEE-LXQfT1RWlGHtswl
 cartesia/voices/types/voice_id.py,sha256=GDoXcRVeIm-V21R4suxG2zqLD3DLYkXE9kgizadzFKo,79
 cartesia/voices/types/voice_metadata.py,sha256=4KNGjXMUKm3niv-NvKIFVGtiilpH13heuzKcZYNQxk4,1181
 cartesia/voices/types/weight.py,sha256=XqDU7_JItNUb5QykIDqTbELlRYQdbt2SviRgW0w2LKo,80
-cartesia-2.0.2.dist-info/METADATA,sha256=EB_DtN2AaHi0snXgpbisp2T1nsTQ7CQlR3S1rowO8L0,11206
-cartesia-2.0.2.dist-info/WHEEL,sha256=Zb28QaM1gQi8f4VCBhsUklF61CTlNYfs9YAZn-TOGFk,88
-cartesia-2.0.2.dist-info/RECORD,,
+cartesia-2.0.3.dist-info/METADATA,sha256=cW9xivCIN1lB-8xc8V_-DMwh0pwJa3gwmsYO3XwJl0M,11206
+cartesia-2.0.3.dist-info/WHEEL,sha256=Zb28QaM1gQi8f4VCBhsUklF61CTlNYfs9YAZn-TOGFk,88
+cartesia-2.0.3.dist-info/RECORD,,

{cartesia-2.0.2.dist-info → cartesia-2.0.3.dist-info}/WHEEL RENAMED Viewed

File without changes

cartesia 2.0.2__py3-none-any.whl → 2.0.3__py3-none-any.whl

cartesia 2.0.2__py3-none-any.whl → 2.0.3__py3-none-any.whl