PyPI - smallestai - Versions diffs - 4.0.1__py3-none-any.whl → 4.1.0__py3-none-any.whl - Mend

smallestai 4.0.1__py3-none-any.whl → 4.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of smallestai might be problematic. Click here for more details.

Files changed (10)

smallestai/waves/async_waves_client.py CHANGED Viewed

@@ -6,8 +6,8 @@ import aiofiles
 import requests
 from typing import Optional, Union, List
-from smallestai.waves.exceptions import TTSError, APIError
-from smallestai.waves.utils import (TTSOptions, validate_input,
+from smallestai.waves.exceptions import InvalidError, APIError
+from smallestai.waves.utils import (TTSOptions, validate_input, validate_asr_input,
                      get_smallest_languages, get_smallest_models, ALLOWED_AUDIO_EXTENSIONS, API_BASE_URL)
@@ -52,7 +52,7 @@ class AsyncWavesClient:
         """
         self.api_key = api_key or os.environ.get("SMALLEST_API_KEY")
         if not self.api_key:
-            raise TTSError()
+            raise InvalidError()
         if model == "lightning-large" and voice_id is None:
             voice_id = "lakshya"
@@ -150,7 +150,7 @@ class AsyncWavesClient:
             - Otherwise, returns the synthesized audio content as bytes.
         Raises:
-        - TTSError: If the provided file name does not have a .wav or .mp3 extension when `save_as` is specified.
+        - InvalidError: If the provided file name does not have a .wav or .mp3 extension when `save_as` is specified.
         - APIError: If the API request fails or returns an error.
         - ValueError: If an unexpected parameter is passed in `kwargs`.
         """
@@ -223,17 +223,17 @@ class AsyncWavesClient:
         - str: The response from the API as a formatted JSON string.
         Raises:
-        - TTSError: If the file does not exist or is not a valid audio file.
+        - InvalidError: If the file does not exist or is not a valid audio file.
         - APIError: If the API request fails or returns an error.
         """
         url = f"{API_BASE_URL}/lightning-large/add_voice"
         if not os.path.exists(file_path):
-            raise TTSError("Invalid file path. File does not exist.")
+            raise InvalidError("Invalid file path. File does not exist.")
         file_extension = os.path.splitext(file_path)[1].lower()
         if file_extension not in ALLOWED_AUDIO_EXTENSIONS:
-            raise TTSError(f"Invalid file type. Supported formats are: {ALLOWED_AUDIO_EXTENSIONS}")
+            raise InvalidError(f"Invalid file type. Supported formats are: {ALLOWED_AUDIO_EXTENSIONS}")
         headers = {
             'Authorization': f"Bearer {self.api_key}",
@@ -255,7 +255,7 @@ class AsyncWavesClient:
                 if res.status != 200:
                     raise APIError(f"Failed to add voice: {await res.text()}. For more information, visit https://waves.smallest.ai/")
-                return json.dumps(await res.json(), indent=4, ensure_ascii=False)
+                return await res.json()
         finally:
             if should_cleanup and self.session:
@@ -290,8 +290,61 @@ class AsyncWavesClient:
                 if res.status != 200:
                     raise APIError(f"Failed to delete voice: {await res.text()}. For more information, visit https://waves.smallest.ai/")
-                return json.dumps(await res.json(), indent=4, ensure_ascii=False)
+                return await res.json()
         finally:
             if should_cleanup and self.session:
                 await self.session.close()
-                self.session = None
+                self.session = None
+    async def transcribe(
+        self,
+        file_path: str,
+        language: Optional[str] = "en",
+        word_timestamps: Optional[bool] = False,
+        age_detection: Optional[bool] = False,
+        gender_detection: Optional[bool] = False,
+        emotion_detection: Optional[bool] = False,
+        model: Optional[str] = "lightning"
+    ) -> dict:
+        validate_asr_input(file_path, model, language)
+        url = f"{API_BASE_URL}/speech-to-text"
+        headers = {
+            'Authorization': f"Bearer {self.api_key}",
+        }
+        should_cleanup = await self._ensure_session()
+        try:
+            file_extension = os.path.splitext(file_path)[1].lower()
+            content_type = f"audio/{file_extension[1:]}" if file_extension else "application/octet-stream"
+            async with aiofiles.open(file_path, 'rb') as f:
+                file_data = await f.read()
+            form = aiohttp.FormData()
+            form.add_field(
+                'file',
+                file_data,
+                filename=os.path.basename(file_path),
+                content_type=content_type
+            )
+            # Send options as multipart form fields (not query params)
+            form.add_field('model', model)
+            form.add_field('language', language)
+            form.add_field('word_timestamps', str(bool(word_timestamps)).lower())
+            form.add_field('age_detection', str(bool(age_detection)).lower())
+            form.add_field('gender_detection', str(bool(gender_detection)).lower())
+            form.add_field('emotion_detection', str(bool(emotion_detection)).lower())
+            async with self.session.post(url, headers=headers, data=form) as res:
+                if res.status != 200:
+                    raise APIError(
+                        f"Failed to transcribe audio: {await res.text()}. "
+                        "For more information, visit https://waves-docs.smallest.ai/v4.0.0/content/api-references/asr-post-api"
+                    )
+                return await res.json()
+        finally:
+            if should_cleanup and self.session:
+                await self.session.close()
+                self.session = None

smallestai/waves/exceptions.py CHANGED Viewed

@@ -1,18 +1,18 @@
-class TTSError(Exception):
+class InvalidError(Exception):
     """Base exception for TTS SDK"""
     default_message = "API key is required. Please set the `SMALLEST_API_KEY` environment variable or visit https://waves.smallest.ai/ to obtain your API key."
     def __init__(self, message=None):
         super().__init__(message or self.default_message)
-class APIError(TTSError):
+class APIError(InvalidError):
     """Raised when the API returns an error"""
     pass
-class ValidationError(TTSError):
+class ValidationError(InvalidError):
     """Raised when input validation fails"""
     pass
-class AuthenticationError(TTSError):
+class AuthenticationError(InvalidError):
     """Raised when authentication fails"""
     pass

smallestai/waves/models.py CHANGED Viewed

@@ -6,3 +6,11 @@ TTSModels = [
     "lightning-large",
     "lightning-v2"
 ]
+ASRLanguages_lightning = [
+    "it", "es", "en", "pt", "hi", "de", "fr", "uk", "ru", "kn", "ml", "pl",
+    "mr", "gu", "cs", "sk", "te", "or", "nl", "bn", "lv", "et", "ro", "pa",
+    "fi", "sv", "bg", "ta", "hu", "da", "lt", "mt", "multi"
+]
+ASRModels = [
+    "lightning"
+]

smallestai/waves/utils.py CHANGED Viewed

@@ -1,9 +1,10 @@
+import os
 from typing import List
 from typing import Optional
 from dataclasses import dataclass
 from smallestai.waves.exceptions import ValidationError
-from smallestai.waves.models import TTSModels, TTSLanguages_lightning, TTSLanguages_lightning_large, TTSLanguages_lightning_v2
+from smallestai.waves.models import TTSModels, TTSLanguages_lightning, TTSLanguages_lightning_large, TTSLanguages_lightning_v2, ASRModels, ASRLanguages_lightning
 API_BASE_URL = "https://waves-api.smallest.ai/api/v1"
@@ -25,7 +26,24 @@ class TTSOptions:
     enhancement: int
     language: str
     output_format: str
+@dataclass
+class ASROptions:
+    model: str
+    api_key: str
+    language: str
+    word_timestamps: bool
+    age_detection: bool
+    gender_detection: bool
+    emotion_detection: bool
+def validate_asr_input(file_path: str, model: str, language: str):
+    if not os.path.isfile(file_path):
+        raise ValidationError("Invalid file path. File does not exist.")
+    if model not in ASRModels:
+        raise ValidationError(f"Invalid model: {model}. Must be one of {ASRModels}")
+    if language not in ASRLanguages_lightning:
+        raise ValidationError(f"Invalid language: {language}. Must be one of {ASRLanguages_lightning}")
 def validate_input(text: str, model: str, sample_rate: int, speed: float, consistency: Optional[float] = None, similarity: Optional[float] = None, enhancement: Optional[int] = None):
     if not text:

smallestai/waves/waves_client.py CHANGED Viewed

@@ -4,8 +4,8 @@ import copy
 import requests
 from typing import Optional, Union, List
-from smallestai.waves.exceptions import TTSError, APIError
-from smallestai.waves.utils import (TTSOptions, validate_input,
+from smallestai.waves.exceptions import InvalidError, APIError
+from smallestai.waves.utils import (TTSOptions, validate_input, validate_asr_input,
                         get_smallest_languages, get_smallest_models, ALLOWED_AUDIO_EXTENSIONS, API_BASE_URL)
 class WavesClient:
@@ -48,7 +48,7 @@ class WavesClient:
         """
         self.api_key = api_key or os.environ.get("SMALLEST_API_KEY")
         if not self.api_key:
-            raise TTSError()
+            raise InvalidError()
         if model == "lightning-large" and voice_id is None:
             voice_id = "lakshya"
@@ -125,7 +125,7 @@ class WavesClient:
             - Otherwise, returns the synthesized audio content as bytes.
         Raises:
-        - TTSError: If the provided file name does not have a .wav or .mp3 extension when `save_as` is specified.
+        - InvalidError: If the provided file name does not have a .wav or .mp3 extension when `save_as` is specified.
         - APIError: If the API request fails or returns an error.
         """
         opts = copy.deepcopy(self.opts)
@@ -184,15 +184,15 @@ class WavesClient:
         - str: The response from the API as a formatted JSON string.
         Raises:
-        - TTSError: If the file does not exist or is not a valid audio file.
+        - InvalidError: If the file does not exist or is not a valid audio file.
         - APIError: If the API request fails or returns an error.
         """
         if not os.path.isfile(file_path):
-            raise TTSError("Invalid file path. File does not exist.")
+            raise InvalidError("Invalid file path. File does not exist.")
         file_extension = os.path.splitext(file_path)[1].lower()
         if file_extension not in ALLOWED_AUDIO_EXTENSIONS:
-            raise TTSError(f"Invalid file type. Supported formats are: {ALLOWED_AUDIO_EXTENSIONS}")
+            raise InvalidError(f"Invalid file type. Supported formats are: {ALLOWED_AUDIO_EXTENSIONS}")
         url = f"{API_BASE_URL}/lightning-large/add_voice"
         payload = {'displayName': display_name}
@@ -206,8 +206,8 @@ class WavesClient:
         response = requests.post(url, headers=headers, data=payload, files=files)
         if response.status_code != 200:
             raise APIError(f"Failed to add voice: {response.text}. For more information, visit https://waves.smallest.ai/")
-        return json.dumps(response.json(), indent=4, ensure_ascii=False)
+        return response.json()
     def delete_voice(self, voice_id: str) -> str:
@@ -234,4 +234,41 @@ class WavesClient:
         if response.status_code != 200:
             raise APIError(f"Failed to delete voice: {response.text}. For more information, visit https://waves.smallest.ai/")
-        return json.dumps(response.json(), indent=4, ensure_ascii=False)
+        return response.json()
+    def transcribe(
+        self,
+        file_path: str,
+        language: Optional[str] = "en",
+        word_timestamps: Optional[bool] = False,
+        age_detection: Optional[bool] = False,
+        gender_detection: Optional[bool] = False,
+        emotion_detection: Optional[bool] = False,
+        model: Optional[str] = "lightning"
+    ) -> dict:
+        validate_asr_input(file_path, model, language)
+        url = f"{API_BASE_URL}/speech-to-text"
+        headers = {
+            'Authorization': f"Bearer {self.api_key}",
+        }
+        payload = {
+            'model': model,
+            'language': language,
+            'word_timestamps': str(bool(word_timestamps)).lower(),
+            'age_detection': str(bool(age_detection)).lower(),
+            'gender_detection': str(bool(gender_detection)).lower(),
+            'emotion_detection': str(bool(emotion_detection)).lower()
+        }
+        file_extension = os.path.splitext(file_path)[1].lower()
+        content_type = f"audio/{file_extension[1:]}" if file_extension else "application/octet-stream"
+        with open(file_path, 'rb') as f:
+            files = {'file': (os.path.basename(file_path), f, content_type)}
+            response = requests.post(url, headers=headers, files=files, data=payload)
+        if response.status_code != 200:
+            raise APIError(f"Failed to transcribe audio: {response.text}. For more information, visit https://waves-docs.smallest.ai/v4.0.0/content/api-references/asr-post-api")
+        return response.json()

{smallestai-4.0.1.dist-info → smallestai-4.1.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: smallestai
-Version: 4.0.1
+Version: 4.1.0
 Summary: Official Python client for the Smallest AI API
 Author-email: Smallest <support@smallest.ai>
 License: MIT

{smallestai-4.0.1.dist-info → smallestai-4.1.0.dist-info}/RECORD RENAMED Viewed

@@ -134,14 +134,14 @@ smallestai/atoms/models/webhook_post_request_events_inner.py,sha256=xrJ41CgtZMEX
 smallestai/atoms/models/webhook_subscription.py,sha256=tU_IthL9wOlEqL0WlhUTaLjNheHV0SORiJxBNcqPsUs,3908
 smallestai/atoms/models/webhook_subscription_populated.py,sha256=3mfU3cvtpOnWWsSqUv7m2NFP7lAjNUrXRmeLKrelAlc,4207
 smallestai/waves/__init__.py,sha256=hxyqisgFiKiroxupuZeNXpXFIbnivmdgPrid3CnLhh0,268
-smallestai/waves/async_waves_client.py,sha256=BgiSqd2UjwECCPwuh2dyhLSBP0inIsbPUEbduWTJrmI,11704
-smallestai/waves/exceptions.py,sha256=nY6I8fCXe2By54CytQ0-i3hFiYtt8TYAKj0g6OYsCjc,585
-smallestai/waves/models.py,sha256=FaMVkOFyNCVpWvyMCmqkv3t1wmnfCs1HIULxLr1L8XE,283
+smallestai/waves/async_waves_client.py,sha256=1eRgJV5ZuyqH0gTMYpijjKoqI3epSgyvTRLP3-Fex5s,13865
+smallestai/waves/exceptions.py,sha256=zJ_erDTHcVVW7UKCfMCnyAZfvTypHBek28LJqxsbH50,601
+smallestai/waves/models.py,sha256=RaCy9Wfg_HiVF0FBh_WE4C8C5t_06zLoXTDciIjI8GI,556
 smallestai/waves/stream_tts.py,sha256=c9r8mZuuFjbyWsUrlZ1jb0WNX7-lR39EXDUqyF-5g14,6792
-smallestai/waves/utils.py,sha256=sqDpfa5SC60C_kJZo4MKxlDfkX7RRzO6aJ2hKpNMemE,2273
-smallestai/waves/waves_client.py,sha256=U6aqClYL49cTtYisvpUVhas2miGZiCfqwTU0eDUY548,9770
-smallestai-4.0.1.dist-info/licenses/LICENSE,sha256=kK3HNKhN7luQhkjkNWIvy9_gizbEDUM4mSv_HWq9uuM,1068
-smallestai-4.0.1.dist-info/METADATA,sha256=c9DX-VrtU8V0Lh4CWp7FfSY-pQT6CbQLFg9O3dmSAYY,20421
-smallestai-4.0.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-smallestai-4.0.1.dist-info/top_level.txt,sha256=pdJzm1VC2J6RxoobATz45L9U3cki4AFLigsfvETz7Io,11
-smallestai-4.0.1.dist-info/RECORD,,
+smallestai/waves/utils.py,sha256=f88r6uqDELWPos1Kmee3W53Ec0lrcT8CWnkyLPHl17E,2952
+smallestai/waves/waves_client.py,sha256=7kHgLyHpduYoQr_zQ6edyF2a_FGKcrEvICnz6_OFoBo,11252
+smallestai-4.1.0.dist-info/licenses/LICENSE,sha256=kK3HNKhN7luQhkjkNWIvy9_gizbEDUM4mSv_HWq9uuM,1068
+smallestai-4.1.0.dist-info/METADATA,sha256=Dg58pZfqEBnles1XTwBruWfeuYodezYXw-xqR3r5GxE,20421
+smallestai-4.1.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+smallestai-4.1.0.dist-info/top_level.txt,sha256=pdJzm1VC2J6RxoobATz45L9U3cki4AFLigsfvETz7Io,11
+smallestai-4.1.0.dist-info/RECORD,,

{smallestai-4.0.1.dist-info → smallestai-4.1.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{smallestai-4.0.1.dist-info → smallestai-4.1.0.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{smallestai-4.0.1.dist-info → smallestai-4.1.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

smallestai 4.0.1__py3-none-any.whl → 4.1.0__py3-none-any.whl

Potentially problematic release.

smallestai 4.0.1__py3-none-any.whl → 4.1.0__py3-none-any.whl