PyPI - cartesia - Versions diffs - 0.1.1__py2.py3-none-any.whl → 1.0.0__py2.py3-none-any.whl - Mend

cartesia 0.1.1__py2.py3-none-any.whl → 1.0.0__py2.py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (11) hide show

cartesia/__init__.py +2 -2
cartesia/_types.py +33 -39
cartesia/client.py +874 -0
cartesia/version.py +1 -1
cartesia-1.0.0.dist-info/METADATA +364 -0
cartesia-1.0.0.dist-info/RECORD +9 -0
cartesia/tts.py +0 -702
cartesia-0.1.1.dist-info/METADATA +0 -189
cartesia-0.1.1.dist-info/RECORD +0 -9
{cartesia-0.1.1.dist-info → cartesia-1.0.0.dist-info}/WHEEL +0 -0
{cartesia-0.1.1.dist-info → cartesia-1.0.0.dist-info}/top_level.txt +0 -0

cartesia/__init__.py CHANGED Viewed

@@ -1,3 +1,3 @@
-from cartesia.tts import AsyncCartesiaTTS, CartesiaTTS
+from cartesia.client import Cartesia, AsyncCartesia
-__all__ = ["CartesiaTTS", "AsyncCartesiaTTS"]
+__all__ = ["Cartesia", "AsyncCartesia"]

cartesia/_types.py CHANGED Viewed

@@ -1,43 +1,37 @@
-from enum import Enum
-from typing import List, Optional, TypedDict, Union
-try:
-    import numpy as np
-    _NUMPY_AVAILABLE = True
-except ImportError:
-    _NUMPY_AVAILABLE = False
-class AudioDataReturnType(Enum):
-    BYTES = "bytes"
-    ARRAY = "array"
-class AudioOutputFormat(Enum):
-    """Supported output formats for the audio."""
-    FP32 = "fp32"  # float32
-    PCM = "pcm"  # 16-bit signed integer PCM
-    FP32_16000 = "fp32_16000"  # float32, 16 kHz
-    FP32_22050 = "fp32_22050"  # float32, 22.05 kHz
-    FP32_44100 = "fp32_44100"  # float32, 44.1 kHz
-    PCM_16000 = "pcm_16000"  # 16-bit signed integer PCM, 16 kHz
-    PCM_22050 = "pcm_22050"  # 16-bit signed integer PCM, 22.05 kHz
-    PCM_44100 = "pcm_44100"  # 16-bit signed integer PCM, 44.1 kHz
-    MULAW_8000 = "mulaw_8000"  # 8-bit mu-law, 8 kHz
-class AudioOutput(TypedDict):
-    audio: Union[bytes, "np.ndarray"]
-    sampling_rate: int
-Embedding = List[float]
+from typing import List, TypedDict
+class OutputFormatMapping:
+    _format_mapping = {
+        "fp32": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 44100},
+        "pcm": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 44100},
+        "fp32_16000": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 16000},
+        "fp32_22050": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 22050},
+        "fp32_44100": {"container": "raw", "encoding": "pcm_f32le", "sample_rate": 44100},
+        "pcm_16000": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 16000},
+        "pcm_22050": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 22050},
+        "pcm_44100": {"container": "raw", "encoding": "pcm_s16le", "sample_rate": 44100},
+        "mulaw_8000": {"container": "raw", "encoding": "pcm_mulaw", "sample_rate": 8000},
+        "alaw_8000": {"container": "raw", "encoding": "pcm_alaw", "sample_rate": 8000},
+    }
+    @classmethod
+    def get_format(cls, format_name):
+        if format_name in cls._format_mapping:
+            return cls._format_mapping[format_name]
+        else:
+            raise ValueError(f"Unsupported format: {format_name}")
 class VoiceMetadata(TypedDict):
     id: str
     name: str
     description: str
-    embedding: Optional[Embedding]
+    embedding: List[float]
+    is_public: bool
+    user_id: str
+    created_at: str
+    language: str
+class OutputFormat(TypedDict):
+    container: str
+    encoding: str
+    sample_rate: int

cartesia 0.1.1__py2.py3-none-any.whl → 1.0.0__py2.py3-none-any.whl

cartesia 0.1.1py2.py3-none-any.whl → 1.0.0py2.py3-none-any.whl