PyPI - cartesia - Versions diffs - 1.1.0.dev0__py3-none-any.whl → 1.2.0__py3-none-any.whl - Mend

cartesia 1.1.0.dev0__py3-none-any.whl → 1.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

cartesia/_types.py CHANGED Viewed

@@ -27,39 +27,6 @@ class OutputFormatMapping:
             raise ValueError(f"Unsupported format: {format_name}")
-class DeprecatedOutputFormatMapping:
-    """Deprecated formats as of v1.0.1. These will be removed in v1.2.0. Use :class:`OutputFormatMapping` instead."""
-    _format_mapping = {
-        "fp32": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 44100},
-        "pcm": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 44100},
-        "fp32_8000": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 8000},
-        "fp32_16000": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 16000},
-        "fp32_22050": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 22050},
-        "fp32_24000": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 24000},
-        "fp32_44100": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 44100},
-        "pcm_8000": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 8000},
-        "pcm_16000": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 16000},
-        "pcm_22050": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 22050},
-        "pcm_24000": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 24000},
-        "pcm_44100": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 44100},
-        "mulaw_8000": {"container": "raw", "encoding": "pcm_mulaw", "sample_rate": 8000},
-        "alaw_8000": {"container": "raw", "encoding": "pcm_alaw", "sample_rate": 8000},
-    }
-    @classmethod
-    @deprecated(
-        vdeprecated="1.0.1",
-        vremove="1.2.0",
-        reason="Old output format names are being deprecated in favor of names aligned with the Cartesia API. Use names from `OutputFormatMapping` instead.",
-    )
-    def get_format_deprecated(cls, format_name):
-        if format_name in cls._format_mapping:
-            return cls._format_mapping[format_name]
-        else:
-            raise ValueError(f"Unsupported format: {format_name}")
 class VoiceMetadata(TypedDict):
     id: str
     name: str

cartesia/tts.py CHANGED Viewed

@@ -4,7 +4,6 @@ import httpx
 from cartesia._sse import _SSE
 from cartesia._types import (
-    DeprecatedOutputFormatMapping,
     OutputFormat,
     OutputFormatMapping,
     VoiceControls,
@@ -86,10 +85,6 @@ class TTS(Resource):
         """
         if output_format_name in OutputFormatMapping._format_mapping:
             output_format_obj = OutputFormatMapping.get_format(output_format_name)
-        elif output_format_name in DeprecatedOutputFormatMapping._format_mapping:
-            output_format_obj = DeprecatedOutputFormatMapping.get_format_deprecated(
-                output_format_name
-            )
         else:
             raise ValueError(f"Unsupported format: {output_format_name}")
@@ -114,10 +109,6 @@ class TTS(Resource):
         """
         if output_format_name in OutputFormatMapping._format_mapping:
             output_format_obj = OutputFormatMapping.get_format(output_format_name)
-        elif output_format_name in DeprecatedOutputFormatMapping._format_mapping:
-            output_format_obj = DeprecatedOutputFormatMapping.get_format_deprecated(
-                output_format_name
-            )
         else:
             raise ValueError(f"Unsupported format: {output_format_name}")

cartesia/version.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "1.1.0-dev0"
1	+ __version__ = "1.2.0"

cartesia/voices.py CHANGED Viewed

@@ -58,29 +58,65 @@ class Voices(Resource):
         return response.json()
-    def clone(self, filepath: Optional[str] = None, enhance: str = True) -> List[float]:
+    def clone(
+        self,
+        filepath: Optional[str] = None,
+        enhance: str = True,
+        mode: str = "clip",
+        language: str = "en",
+        name: Optional[str] = None,
+        description: Optional[str] = None,
+        transcript: Optional[str] = None,
+    ) -> Union[List[float], VoiceMetadata]:
         """Clone a voice from a clip.
         Args:
             filepath: The path to the clip file.
             enhance: Whether to enhance the clip before cloning the voice (highly recommended). Defaults to True.
+            mode: The mode to use for cloning. Either "similarity" or "stability".
+            language: The language code of the language spoken in the clip. Defaults to "en".
+            name: The name of the cloned voice.
+            description: The description of the cloned voice.
+            transcript: The transcript of the clip. Only used if mode is "similarity".
         Returns:
             The embedding of the cloned voice as a list of floats.
         """
         if not filepath:
             raise ValueError("Filepath must be specified.")
-        url = f"{self._http_url()}/voices/clone/clip"
+        headers = self.headers.copy()
+        headers.pop("Content-Type", None)
         with open(filepath, "rb") as file:
             files = {"clip": file}
-            files["enhance"] = str(enhance).lower()
-            headers = self.headers.copy()
-            headers.pop("Content-Type", None)
-            response = httpx.post(url, headers=headers, files=files, timeout=self.timeout)
-            if not response.is_success:
-                raise ValueError(f"Failed to clone voice from clip. Error: {response.text}")
-        return response.json()["embedding"]
+            data = {
+                "enhance": str(enhance).lower(),
+                "mode": mode,
+            }
+            if mode == "clip":
+                url = f"{self._http_url()}/voices/clone/clip"
+                response = httpx.post(
+                    url, headers=headers, files=files, data=data, timeout=self.timeout
+                )
+                if not response.is_success:
+                    raise ValueError(f"Failed to clone voice from clip. Error: {response.text}")
+                return response.json()["embedding"]
+            else:
+                data["name"] = name
+                data["description"] = description
+                data["language"] = language
+                if mode == "similarity" and transcript:
+                    data["transcript"] = transcript
+                url = f"{self._http_url()}/voices/clone"
+                response = httpx.post(
+                    url, headers=headers, files=files, data=data, timeout=self.timeout
+                )
+                if not response.is_success:
+                    raise ValueError(
+                        f"Failed to clone voice. Status Code: {response.status_code}\n"
+                        f"Error: {response.text}"
+                    )
+                return response.json()
     def create(
         self,
@@ -88,6 +124,7 @@ class Voices(Resource):
         description: str,
         embedding: List[float],
         base_voice_id: Optional[str] = None,
+        language: str = "en",
     ) -> VoiceMetadata:
         """Create a new voice.
@@ -108,6 +145,7 @@ class Voices(Resource):
                 "description": description,
                 "embedding": embedding,
                 "base_voice_id": base_voice_id,
+                "language": language,
             },
             timeout=self.timeout,
         )

{cartesia-1.1.0.dev0.dist-info → cartesia-1.2.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: cartesia
-Version: 1.1.0.dev0
+Version: 1.2.0
 Summary: The official Python library for the Cartesia API.
 Requires-Python: >=3.9
 Description-Content-Type: text/markdown
@@ -642,8 +642,6 @@ display(audio)
 You can use the `client.tts.get_output_format` method to convert string-based output format names into the `output_format` dictionary which is expected by the `output_format` parameter. You can see the `OutputFormatMapping` class in `cartesia._types` for the currently supported output format names. You can also view the currently supported `output_format`s in our [API Reference](https://docs.cartesia.ai/reference/api-reference/rest/stream-speech-server-sent-events).
-The previously used `output_format` strings are now deprecated and will be removed in v1.2.0. These are listed in the `DeprecatedOutputFormatMapping` class in `cartesia._types`.
 ```python
 # Get the output format dictionary from string name
 output_format = client.tts.get_output_format("raw_pcm_f32le_44100")

{cartesia-1.1.0.dev0.dist-info → cartesia-1.2.0.dist-info}/RECORD RENAMED Viewed

@@ -4,21 +4,21 @@ cartesia/_async_websocket.py,sha256=Gy0nK3g2HKIBwh-PP1AunEBj83kgFpTGCvrq6tnwg9c,
 cartesia/_constants.py,sha256=lquaYIg7IThdmC1fCklnWC8EM7stbSeVCDwRqCzPq-U,389
 cartesia/_logger.py,sha256=vU7QiGSy_AJuJFmClUocqIJ-Ltku_8C24ZU8L6fLJR0,53
 cartesia/_sse.py,sha256=CugabGUAUM-N2BruxNFxDB20HyxDlRdbN-J_yAzvBMY,5667
-cartesia/_types.py,sha256=2fTSCwjL9lJ3jsdbs0P9fHsjkhejyrrYt6oqIXGk1y4,4488
+cartesia/_types.py,sha256=gixQbKbX-H8xbD7jxHmc02KXLyjEaup19lh_57_YBl8,2570
 cartesia/_websocket.py,sha256=CpqkShdl4qBjCGMR8s6dEBHK0LJxkrG-FjbPLhjOP-U,14735
 cartesia/async_client.py,sha256=y_K_Yuv0weA4k9ZYD0M9bNM3x3frsq07tqkg7R9h0-o,2714
 cartesia/async_tts.py,sha256=IbWVRKklNClXASR6ylHaukcMRR304LUguqc4yMopbDU,2076
 cartesia/client.py,sha256=OS1ORUSlR8Jg-em1imeTAFfwkC85AQFnw8PYtTdUuC8,2364
 cartesia/resource.py,sha256=wpnB3IPcTdxYSp0vxSkpntp4NSvqvnwUWF-0ZpgWV9o,1585
-cartesia/tts.py,sha256=RiADE9wjukfq595DrtgBZY8OKoTaFBzef0wCG93yvFM,5345
-cartesia/version.py,sha256=7mgCxmrH_BGK1I131E6uUNAUW91B4b9YhDrULqohQi0,27
-cartesia/voices.py,sha256=DB4tEiSJp7jfnQM0HoiSFS09ZY2oAFbOwMlKe6pofTs,5606
+cartesia/tts.py,sha256=kWvqce9K3gZ4QrWD-ciYdK29n49SNkxhd2A7ueTOwMY,4878
+cartesia/version.py,sha256=MpAT5hgNoHnTtG1XRD_GV_A7QrHVU6vJjGSw_8qMGA4,22
+cartesia/voices.py,sha256=bDYbs0KoikAROJlmbnLdo4TrW0YwzjMvp70uKG6Alp0,7180
 cartesia/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 cartesia/utils/deprecated.py,sha256=2cXvGtrxhPeUZA5LWy2n_U5OFLDv7SHeFtzqhjSJGyk,1674
 cartesia/utils/retry.py,sha256=O6fyVWpH9Su8c0Fwupl57xMt6JrwJ52txBwP3faUL7k,3339
 cartesia/utils/tts.py,sha256=7tJmdyOYwe2QIav5d1UZxhpbcHaYqf7A77bBOlb4U_g,2100
-cartesia-1.1.0.dev0.dist-info/LICENSE.md,sha256=PT2YG5wEtEX1TNDn5sXkUXqbn-neyr7cZenTxd40ql4,1074
-cartesia-1.1.0.dev0.dist-info/METADATA,sha256=TORvxC_g0KM3OdvEpJaGSEwJ2ZawfMM_m4J58MI8ZYU,21190
-cartesia-1.1.0.dev0.dist-info/WHEEL,sha256=OVMc5UfuAQiSplgO0_WdW7vXVGAt9Hdd6qtN4HotdyA,91
-cartesia-1.1.0.dev0.dist-info/top_level.txt,sha256=rTX4HnnCegMxl1FK9czpVC7GAvf3SwDzPG65qP-BS4w,9
-cartesia-1.1.0.dev0.dist-info/RECORD,,
+cartesia-1.2.0.dist-info/LICENSE.md,sha256=PT2YG5wEtEX1TNDn5sXkUXqbn-neyr7cZenTxd40ql4,1074
+cartesia-1.2.0.dist-info/METADATA,sha256=XkVlNno4gSjSecAC0fBIqcvRP_YUAYs6D6dzIdk-c7w,21006
+cartesia-1.2.0.dist-info/WHEEL,sha256=R06PA3UVYHThwHvxuRWMqaGcr-PuniXahwjmQRFMEkY,91
+cartesia-1.2.0.dist-info/top_level.txt,sha256=rTX4HnnCegMxl1FK9czpVC7GAvf3SwDzPG65qP-BS4w,9
+cartesia-1.2.0.dist-info/RECORD,,

{cartesia-1.1.0.dev0.dist-info → cartesia-1.2.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (75.2.0)
+Generator: setuptools (75.5.0)
 Root-Is-Purelib: true
 Tag: py3-none-any

{cartesia-1.1.0.dev0.dist-info → cartesia-1.2.0.dist-info}/LICENSE.md RENAMED Viewed

File without changes

{cartesia-1.1.0.dev0.dist-info → cartesia-1.2.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

cartesia 1.1.0.dev0__py3-none-any.whl → 1.2.0__py3-none-any.whl

cartesia 1.1.0.dev0__py3-none-any.whl → 1.2.0__py3-none-any.whl