PyPI - cartesia - Versions diffs - 1.0.7__tar.gz → 1.0.8__tar.gz - Mend

cartesia 1.0.7.tar.gz → 1.0.8.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

{cartesia-1.0.7 → cartesia-1.0.8}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cartesia
-Version: 1.0.7
+Version: 1.0.8
 Summary: The official Python library for the Cartesia API.
 Home-page:
 Author: Cartesia, Inc.
@@ -25,6 +25,22 @@ The official Cartesia Python library which provides convenient access to the Car
 > [!IMPORTANT]
 > The client library introduces breaking changes in v1.0.0, which was released on June 24th 2024. See the [release notes](https://github.com/cartesia-ai/cartesia-python/releases/tag/v1.0.0) and [migration guide](https://github.com/cartesia-ai/cartesia-python/discussions/44). Reach out to us on [Discord](https://discord.gg/ZVxavqHB9X) for any support requests!
+- [Cartesia Python API Library](#cartesia-python-api-library)
+  - [Documentation](#documentation)
+  - [Installation](#installation)
+  - [Voices](#voices)
+  - [Text-to-Speech](#text-to-speech)
+    - [Server-Sent Events (SSE)](#server-sent-events-sse)
+    - [WebSocket](#websocket)
+      - [Conditioning speech on previous generations using WebSocket](#conditioning-speech-on-previous-generations-using-websocket)
+    - [Generating timestamps using WebSocket](#generating-timestamps-using-websocket)
+    - [Multilingual Text-to-Speech \[Alpha\]](#multilingual-text-to-speech-alpha)
+    - [Speed and Emotion Control \[Experimental\]](#speed-and-emotion-control-experimental)
+    - [Jupyter Notebook Usage](#jupyter-notebook-usage)
+    - [Utility methods](#utility-methods)
+      - [Output Formats](#output-formats)
 ## Documentation
 Our complete API documentation can be found [on docs.cartesia.ai](https://docs.cartesia.ai).
@@ -250,7 +266,7 @@ async def send_transcripts(ctx):
     # You can check out our models at https://docs.cartesia.ai/getting-started/available-models
     model_id = "sonic-english"
     # You can find the supported `output_format`s at https://docs.cartesia.ai/api-reference/endpoints/stream-speech-server-sent-events
     output_format = {
         "container": "raw",
@@ -266,7 +282,7 @@ async def send_transcripts(ctx):
         "As they near Eggman's lair, our heroes charge their abilities for an epic boss battle. ",
         "Get ready to spin, jump, and sound-blast your way to victory in this high-octane crossover!"
     ]
     for transcript in transcripts:
         # Send text inputs as they become available
         await ctx.send(
@@ -278,7 +294,7 @@ async def send_transcripts(ctx):
         )
     # Indicate that no more inputs will be sent. Otherwise, the context will close after 5 seconds of inactivity.
-    await ctx.no_more_inputs()
+    await ctx.no_more_inputs()
 async def receive_and_play_audio(ctx):
     p = pyaudio.PyAudio()
@@ -384,7 +400,7 @@ output_stream = ctx.send(
     voice_id=voice_id,
     output_format=output_format,
 )
 for output in output_stream:
     buffer = output["audio"]

{cartesia-1.0.7 → cartesia-1.0.8}/README.md RENAMED Viewed

@@ -8,6 +8,22 @@ The official Cartesia Python library which provides convenient access to the Car
 > [!IMPORTANT]
 > The client library introduces breaking changes in v1.0.0, which was released on June 24th 2024. See the [release notes](https://github.com/cartesia-ai/cartesia-python/releases/tag/v1.0.0) and [migration guide](https://github.com/cartesia-ai/cartesia-python/discussions/44). Reach out to us on [Discord](https://discord.gg/ZVxavqHB9X) for any support requests!
+- [Cartesia Python API Library](#cartesia-python-api-library)
+  - [Documentation](#documentation)
+  - [Installation](#installation)
+  - [Voices](#voices)
+  - [Text-to-Speech](#text-to-speech)
+    - [Server-Sent Events (SSE)](#server-sent-events-sse)
+    - [WebSocket](#websocket)
+      - [Conditioning speech on previous generations using WebSocket](#conditioning-speech-on-previous-generations-using-websocket)
+    - [Generating timestamps using WebSocket](#generating-timestamps-using-websocket)
+    - [Multilingual Text-to-Speech \[Alpha\]](#multilingual-text-to-speech-alpha)
+    - [Speed and Emotion Control \[Experimental\]](#speed-and-emotion-control-experimental)
+    - [Jupyter Notebook Usage](#jupyter-notebook-usage)
+    - [Utility methods](#utility-methods)
+      - [Output Formats](#output-formats)
 ## Documentation
 Our complete API documentation can be found [on docs.cartesia.ai](https://docs.cartesia.ai).
@@ -233,7 +249,7 @@ async def send_transcripts(ctx):
     # You can check out our models at https://docs.cartesia.ai/getting-started/available-models
     model_id = "sonic-english"
     # You can find the supported `output_format`s at https://docs.cartesia.ai/api-reference/endpoints/stream-speech-server-sent-events
     output_format = {
         "container": "raw",
@@ -249,7 +265,7 @@ async def send_transcripts(ctx):
         "As they near Eggman's lair, our heroes charge their abilities for an epic boss battle. ",
         "Get ready to spin, jump, and sound-blast your way to victory in this high-octane crossover!"
     ]
     for transcript in transcripts:
         # Send text inputs as they become available
         await ctx.send(
@@ -261,7 +277,7 @@ async def send_transcripts(ctx):
         )
     # Indicate that no more inputs will be sent. Otherwise, the context will close after 5 seconds of inactivity.
-    await ctx.no_more_inputs()
+    await ctx.no_more_inputs()
 async def receive_and_play_audio(ctx):
     p = pyaudio.PyAudio()
@@ -367,7 +383,7 @@ output_stream = ctx.send(
     voice_id=voice_id,
     output_format=output_format,
 )
 for output in output_stream:
     buffer = output["audio"]

{cartesia-1.0.7 → cartesia-1.0.8}/cartesia/client.py RENAMED Viewed

@@ -23,7 +23,12 @@ import aiohttp
 import httpx
 import logging
 import requests
-from websockets.sync.client import connect
+try:
+    from websockets.sync.client import connect
+    IS_WEBSOCKET_SYNC_AVAILABLE = True
+except ImportError:
+    IS_WEBSOCKET_SYNC_AVAILABLE = False
 from iterators import TimeoutIterator
 from cartesia.utils.retry import retry_on_connection_error, retry_on_connection_error_async
@@ -208,37 +213,25 @@ class Voices(Resource):
         return response.json()
     def clone(self, filepath: Optional[str] = None, link: Optional[str] = None) -> List[float]:
-        """Clone a voice from a clip or a URL.
+        """Clone a voice from a clip.
         Args:
             filepath: The path to the clip file.
-            link: The URL to the clip
         Returns:
             The embedding of the cloned voice as a list of floats.
         """
         # TODO: Python has a bytes object, use that instead of a filepath
-        if not filepath and not link:
-            raise ValueError("At least one of 'filepath' or 'link' must be specified.")
-        if filepath and link:
-            raise ValueError("Only one of 'filepath' or 'link' should be specified.")
-        if filepath:
-            url = f"{self._http_url()}/voices/clone/clip"
-            with open(filepath, "rb") as file:
-                files = {"clip": file}
-                headers = self.headers.copy()
-                headers.pop("Content-Type", None)
-                response = httpx.post(url, headers=headers, files=files, timeout=self.timeout)
-                if not response.is_success:
-                    raise ValueError(f"Failed to clone voice from clip. Error: {response.text}")
-        elif link:
-            url = f"{self._http_url()}/voices/clone/url"
-            params = {"link": link}
+        if not filepath:
+            raise ValueError("Filepath must be specified.")
+        url = f"{self._http_url()}/voices/clone/clip"
+        with open(filepath, "rb") as file:
+            files = {"clip": file}
             headers = self.headers.copy()
-            headers.pop("Content-Type")  # The content type header is not required for URLs
-            response = httpx.post(url, headers=self.headers, params=params, timeout=self.timeout)
+            headers.pop("Content-Type", None)
+            response = httpx.post(url, headers=headers, files=files, timeout=self.timeout)
             if not response.is_success:
-                raise ValueError(f"Failed to clone voice from URL. Error: {response.text}")
+                raise ValueError(f"Failed to clone voice from clip. Error: {response.text}")
         return response.json()["embedding"]
@@ -469,6 +462,10 @@ class _WebSocket:
         Raises:
             RuntimeError: If the connection to the WebSocket fails.
         """
+        if not IS_WEBSOCKET_SYNC_AVAILABLE:
+            raise ImportError(
+                "The synchronous WebSocket client is not available. Please ensure that you have 'websockets>=12.0' or compatible version installed."
+            )
         if self.websocket is None or self._is_websocket_closed():
             route = "tts/websocket"
             try:

cartesia-1.0.8/cartesia/version.py ADDED Viewed

@@ -0,0 +1 @@
+__version__ = "1.0.8"

{cartesia-1.0.7 → cartesia-1.0.8}/cartesia.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cartesia
-Version: 1.0.7
+Version: 1.0.8
 Summary: The official Python library for the Cartesia API.
 Home-page:
 Author: Cartesia, Inc.
@@ -25,6 +25,22 @@ The official Cartesia Python library which provides convenient access to the Car
 > [!IMPORTANT]
 > The client library introduces breaking changes in v1.0.0, which was released on June 24th 2024. See the [release notes](https://github.com/cartesia-ai/cartesia-python/releases/tag/v1.0.0) and [migration guide](https://github.com/cartesia-ai/cartesia-python/discussions/44). Reach out to us on [Discord](https://discord.gg/ZVxavqHB9X) for any support requests!
+- [Cartesia Python API Library](#cartesia-python-api-library)
+  - [Documentation](#documentation)
+  - [Installation](#installation)
+  - [Voices](#voices)
+  - [Text-to-Speech](#text-to-speech)
+    - [Server-Sent Events (SSE)](#server-sent-events-sse)
+    - [WebSocket](#websocket)
+      - [Conditioning speech on previous generations using WebSocket](#conditioning-speech-on-previous-generations-using-websocket)
+    - [Generating timestamps using WebSocket](#generating-timestamps-using-websocket)
+    - [Multilingual Text-to-Speech \[Alpha\]](#multilingual-text-to-speech-alpha)
+    - [Speed and Emotion Control \[Experimental\]](#speed-and-emotion-control-experimental)
+    - [Jupyter Notebook Usage](#jupyter-notebook-usage)
+    - [Utility methods](#utility-methods)
+      - [Output Formats](#output-formats)
 ## Documentation
 Our complete API documentation can be found [on docs.cartesia.ai](https://docs.cartesia.ai).
@@ -250,7 +266,7 @@ async def send_transcripts(ctx):
     # You can check out our models at https://docs.cartesia.ai/getting-started/available-models
     model_id = "sonic-english"
     # You can find the supported `output_format`s at https://docs.cartesia.ai/api-reference/endpoints/stream-speech-server-sent-events
     output_format = {
         "container": "raw",
@@ -266,7 +282,7 @@ async def send_transcripts(ctx):
         "As they near Eggman's lair, our heroes charge their abilities for an epic boss battle. ",
         "Get ready to spin, jump, and sound-blast your way to victory in this high-octane crossover!"
     ]
     for transcript in transcripts:
         # Send text inputs as they become available
         await ctx.send(
@@ -278,7 +294,7 @@ async def send_transcripts(ctx):
         )
     # Indicate that no more inputs will be sent. Otherwise, the context will close after 5 seconds of inactivity.
-    await ctx.no_more_inputs()
+    await ctx.no_more_inputs()
 async def receive_and_play_audio(ctx):
     p = pyaudio.PyAudio()
@@ -384,7 +400,7 @@ output_stream = ctx.send(
     voice_id=voice_id,
     output_format=output_format,
 )
 for output in output_stream:
     buffer = output["audio"]

{cartesia-1.0.7 → cartesia-1.0.8}/tests/test_tts.py RENAMED Viewed

@@ -79,14 +79,6 @@ def test_get_voice_from_id(client: Cartesia):
     voices = client.voices.list()
     assert voice in voices
-# Does not work currently, LB issue
-# def test_clone_voice_with_link(client: Cartesia):
-#     url = "https://youtu.be/g2Z7Ddd573M?si=P8BM_hBqt5P8Ft6I&t=69"
-#     logger.info("Testing voices.clone with link")
-#     cloned_voice_embedding = client.voices.clone(link=url)
-#     assert isinstance(cloned_voice_embedding, list)
-#     assert len(cloned_voice_embedding) == 192
 def test_clone_voice_with_file(client: Cartesia):
     logger.info("Testing voices.clone with file")
     output = client.voices.clone(filepath=os.path.join(RESOURCES_DIR, "sample-speech-4s.wav"))