PyPI - cartesia - Versions diffs - 1.0.10__py2.py3-none-any.whl → 1.0.12__py2.py3-none-any.whl - Mend

cartesia 1.0.10-py2.py3-none-any.whl → 1.0.12-py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

cartesia/client.py CHANGED Viewed

@@ -32,7 +32,6 @@ except ImportError:
     IS_WEBSOCKET_SYNC_AVAILABLE = False
 from iterators import TimeoutIterator
-from websockets.sync.client import connect
 from cartesia._types import (
     DeprecatedOutputFormatMapping,
@@ -261,6 +260,40 @@ class Voices(Resource):
         return response.json()
+    def mix(self, voices: List[Dict[str, Union[str, float]]]) -> List[float]:
+        """Mix multiple voices together.
+        Args:
+            voices: A list of dictionaries, each containing either:
+                        - 'id': The ID of an existing voice
+                        - 'embedding': A voice embedding
+                    AND
+                        - 'weight': The weight of the voice in the mix (0.0 to 1.0)
+        Returns:
+            The embedding of the mixed voice as a list of floats.
+        Raises:
+            ValueError: If the request fails or if the input is invalid.
+        """
+        url = f"{self._http_url()}/voices/mix"
+        if not voices or not isinstance(voices, list):
+            raise ValueError("voices must be a non-empty list")
+        response = httpx.post(
+            url,
+            headers=self.headers,
+            json={"voices": voices},
+            timeout=self.timeout,
+        )
+        if not response.is_success:
+            raise ValueError(f"Failed to mix voices. Error: {response.text}")
+        result = response.json()
+        return result["embedding"]
 class _TTSContext:
     """Manage a single context over a WebSocket.
@@ -294,6 +327,7 @@ class _TTSContext:
         context_id: Optional[str] = None,
         duration: Optional[int] = None,
         language: Optional[str] = None,
+        add_timestamps: bool = False,
         _experimental_voice_controls: Optional[VoiceControls] = None,
     ) -> Generator[bytes, None, None]:
         """Send audio generation requests to the WebSocket and yield responses.
@@ -307,6 +341,7 @@ class _TTSContext:
             context_id: The context ID to use for the request. If not specified, a random context ID will be generated.
             duration: The duration of the audio in seconds.
             language: The language code for the audio request. This can only be used with `model_id = sonic-multilingual`
+            add_timestamps: Whether to return word-level timestamps.
             _experimental_voice_controls: Experimental voice controls for controlling speed and emotion.
                 Note: This is an experimental feature and may change rapidly in future releases.
@@ -341,6 +376,7 @@ class _TTSContext:
             },
             "context_id": self._context_id,
             "language": language,
+            "add_timestamps": add_timestamps,
         }
         if duration is not None:
@@ -858,9 +894,9 @@ class TTS(Resource):
             raise ValueError("Only one of voice_id or voice_embedding should be specified.")
         if voice_id:
-            voice = {"mode": "id", "id": voice_id}
+            voice = {"id": voice_id}
         else:
-            voice = {"mode": "embedding", "embedding": voice_embedding}
+            voice = {"embedding": voice_embedding}
         if experimental_voice_controls is not None:
             voice["__experimental_controls"] = experimental_voice_controls
         return voice

cartesia/version.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "1.0.10"
1	+ __version__ = "1.0.12"

{cartesia-1.0.10.dist-info → cartesia-1.0.12.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cartesia
-Version: 1.0.10
+Version: 1.0.12
 Summary: The official Python library for the Cartesia API.
 Home-page:
 Author: Cartesia, Inc.
@@ -91,6 +91,11 @@ print("The embedding for", voice["name"], "is", voice["embedding"])
 # Clone a voice using filepath
 cloned_voice_embedding = client.voices.clone(filepath="path/to/voice")
+# Mix voices together
+mixed_voice_embedding = client.voices.mix(
+    [{ "id": "voice_id_1", "weight": 0.5 }, { "id": "voice_id_2", "weight": 0.25 }, { "id": "voice_id_3", "weight": 0.25 }]
+)
 # Create a new voice
 new_voice = client.voices.create(
     name="New Voice",
@@ -522,6 +527,7 @@ You can enhance the voice output by adjusting the `speed` and `emotion` paramete
 Speed Options:
 - `slowest`, `slow`, `normal`, `fast`, `fastest`
+- Float values between -1.0 and 1.0, where -1.0 is the slowest speed and 1.0 is the fastest speed.
 Emotion Options:
 Use a list of tags in the format `emotion_name:level` where:

{cartesia-1.0.10.dist-info → cartesia-1.0.12.dist-info}/RECORD RENAMED Viewed

@@ -1,12 +1,12 @@
 cartesia/__init__.py,sha256=E4w7psbAwx8X6Iri3W8jGeo11gIlhr3mSU33zChipmI,93
 cartesia/_types.py,sha256=pkFJmsO-OWAJNtqxV80-YcR8KWWLhIwLFejzDjBewbw,4428
-cartesia/client.py,sha256=AfSLYDJw_3eTCxiEyWhLdGVxOhPooW5omA99DeLTw5A,51614
-cartesia/version.py,sha256=5vGk-8GWz6jojEu9w36UP5aNA0LuiwgbNSJ8Umn2rLA,23
+cartesia/client.py,sha256=bYUk-P7QlPNNDhQaI5fldkDZAC8vVVUuHrgRHOq_V78,52818
+cartesia/version.py,sha256=bQ8TKIXU3qSGr-K-gVtWDgjDfBlCgBju76OGKtY9tS8,23
 cartesia/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 cartesia/utils/deprecated.py,sha256=2cXvGtrxhPeUZA5LWy2n_U5OFLDv7SHeFtzqhjSJGyk,1674
 cartesia/utils/retry.py,sha256=O6fyVWpH9Su8c0Fwupl57xMt6JrwJ52txBwP3faUL7k,3339
-cartesia-1.0.10.dist-info/LICENSE.md,sha256=PT2YG5wEtEX1TNDn5sXkUXqbn-neyr7cZenTxd40ql4,1074
-cartesia-1.0.10.dist-info/METADATA,sha256=0eG3fbxXsqofNbwIdGvziDqTpFar2ZetcGLc7Bsut3s,21122
-cartesia-1.0.10.dist-info/WHEEL,sha256=fS9sRbCBHs7VFcwJLnLXN1MZRR0_TVTxvXKzOnaSFs8,110
-cartesia-1.0.10.dist-info/top_level.txt,sha256=rTX4HnnCegMxl1FK9czpVC7GAvf3SwDzPG65qP-BS4w,9
-cartesia-1.0.10.dist-info/RECORD,,
+cartesia-1.0.12.dist-info/LICENSE.md,sha256=PT2YG5wEtEX1TNDn5sXkUXqbn-neyr7cZenTxd40ql4,1074
+cartesia-1.0.12.dist-info/METADATA,sha256=3jeDZosoKAHVx9hcLjE9iZsggAvpR_L2iX3hnP_UFd4,21413
+cartesia-1.0.12.dist-info/WHEEL,sha256=fS9sRbCBHs7VFcwJLnLXN1MZRR0_TVTxvXKzOnaSFs8,110
+cartesia-1.0.12.dist-info/top_level.txt,sha256=rTX4HnnCegMxl1FK9czpVC7GAvf3SwDzPG65qP-BS4w,9
+cartesia-1.0.12.dist-info/RECORD,,

{cartesia-1.0.10.dist-info → cartesia-1.0.12.dist-info}/LICENSE.md RENAMED Viewed

File without changes

{cartesia-1.0.10.dist-info → cartesia-1.0.12.dist-info}/WHEEL RENAMED Viewed

File without changes

{cartesia-1.0.10.dist-info → cartesia-1.0.12.dist-info}/top_level.txt RENAMED Viewed

File without changes

cartesia 1.0.10__py2.py3-none-any.whl → 1.0.12__py2.py3-none-any.whl

cartesia 1.0.10-py2.py3-none-any.whl → 1.0.12-py2.py3-none-any.whl