PyPI - audiopod - Versions diffs - 1.2.0__py3-none-any.whl → 1.5.0__py3-none-any.whl - Mend

audiopod 1.2.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28) hide show

audiopod/__init__.py +13 -63
audiopod/client.py +149 -172
audiopod/config.py +4 -50
audiopod/exceptions.py +16 -71
audiopod/services/__init__.py +10 -6
audiopod/services/base.py +51 -195
audiopod/services/credits.py +26 -30
audiopod/services/denoiser.py +125 -40
audiopod/services/music.py +180 -485
audiopod/services/speaker.py +117 -36
audiopod/services/stem_extraction.py +249 -142
audiopod/services/transcription.py +182 -184
audiopod/services/translation.py +109 -170
audiopod/services/video.py +329 -0
audiopod/services/voice.py +141 -424
audiopod/services/wallet.py +235 -0
audiopod-1.5.0.dist-info/METADATA +206 -0
audiopod-1.5.0.dist-info/RECORD +21 -0
{audiopod-1.2.0.dist-info → audiopod-1.5.0.dist-info}/WHEEL +1 -1
audiopod/cli.py +0 -285
audiopod/models.py +0 -250
audiopod/py.typed +0 -2
audiopod/services/karaoke.py +0 -61
audiopod-1.2.0.dist-info/METADATA +0 -454
audiopod-1.2.0.dist-info/RECORD +0 -24
audiopod-1.2.0.dist-info/entry_points.txt +0 -2
{audiopod-1.2.0.dist-info → audiopod-1.5.0.dist-info}/licenses/LICENSE +0 -0
{audiopod-1.2.0.dist-info → audiopod-1.5.0.dist-info}/top_level.txt +0 -0

audiopod/services/speaker.py CHANGED Viewed

@@ -1,53 +1,134 @@
 """
-Speaker Service - Speaker analysis and diarization
+Speaker Service - Speaker diarization and extraction
 """
-from typing import Optional, Union
+from typing import Optional, Dict, Any, List
 from .base import BaseService
-from ..models import Job, SpeakerAnalysisResult
 class SpeakerService(BaseService):
-    """Service for speaker diarization and analysis"""
-    def diarize_speakers(
+    """Service for speaker diarization and extraction."""
+    def diarize(
         self,
-        audio_file: str,
+        audio_file: Optional[str] = None,
+        url: Optional[str] = None,
         num_speakers: Optional[int] = None,
         wait_for_completion: bool = False,
-        timeout: int = 600
-    ) -> Union[Job, SpeakerAnalysisResult]:
-        """Identify and separate speakers in audio"""
-        files = self._prepare_file_upload(audio_file, "file")
+        timeout: int = 600,
+    ) -> Dict[str, Any]:
+        """
+        Identify and separate speakers in audio.
+        Args:
+            audio_file: Path to local audio file
+            url: URL of audio file
+            num_speakers: Expected number of speakers (auto-detected if not provided)
+            wait_for_completion: Wait for completion
+            timeout: Max wait time in seconds
+        Returns:
+            Job dict with speaker segments when completed
+        """
         data = {}
         if num_speakers:
             data["num_speakers"] = num_speakers
+        if url:
+            data["url"] = url
+        files = self._prepare_file_upload(audio_file, "file") if audio_file else None
         if self.async_mode:
-            return self._async_diarize(files, data, wait_for_completion, timeout)
-        else:
-            response = self.client.request(
-                "POST", "/api/v1/speaker/diarize",
-                data=data, files=files
-            )
-            job = Job.from_dict(response)
-            if wait_for_completion:
-                completed_job = self._wait_for_completion(job.id, timeout)
-                return SpeakerAnalysisResult.from_dict(completed_job.result or completed_job.__dict__)
-            return job
-    async def _async_diarize(self, files, data, wait_for_completion, timeout):
-        """Async version of diarize_speakers"""
+            return self._async_diarize(data, files, wait_for_completion, timeout)
+        response = self.client.request("POST", "/api/v1/speaker/diarize", data=data, files=files)
+        if wait_for_completion:
+            return self._wait_for_completion(response["id"], timeout)
+        return response
+    async def _async_diarize(
+        self, data: Dict, files: Optional[Dict], wait_for_completion: bool, timeout: int
+    ) -> Dict[str, Any]:
         response = await self.client.request(
-            "POST", "/api/v1/speaker/diarize",
-            data=data, files=files
+            "POST", "/api/v1/speaker/diarize", data=data, files=files
         )
-        job = Job.from_dict(response)
         if wait_for_completion:
-            completed_job = await self._async_wait_for_completion(job.id, timeout)
-            return SpeakerAnalysisResult.from_dict(completed_job.result or completed_job.__dict__)
-        return job
+            return await self._async_wait_for_completion(response["id"], timeout)
+        return response
+    def extract(
+        self,
+        audio_file: Optional[str] = None,
+        url: Optional[str] = None,
+        wait_for_completion: bool = False,
+        timeout: int = 600,
+    ) -> Dict[str, Any]:
+        """
+        Extract individual speaker audio tracks.
+        Args:
+            audio_file: Path to local audio file
+            url: URL of audio file
+            wait_for_completion: Wait for completion
+            timeout: Max wait time in seconds
+        Returns:
+            Job dict with speaker audio URLs when completed
+        """
+        data = {}
+        if url:
+            data["url"] = url
+        files = self._prepare_file_upload(audio_file, "file") if audio_file else None
+        if self.async_mode:
+            return self._async_extract(data, files, wait_for_completion, timeout)
+        response = self.client.request("POST", "/api/v1/speaker/extract", data=data, files=files)
+        if wait_for_completion:
+            return self._wait_for_completion(response["id"], timeout)
+        return response
+    async def _async_extract(
+        self, data: Dict, files: Optional[Dict], wait_for_completion: bool, timeout: int
+    ) -> Dict[str, Any]:
+        response = await self.client.request(
+            "POST", "/api/v1/speaker/extract", data=data, files=files
+        )
+        if wait_for_completion:
+            return await self._async_wait_for_completion(response["id"], timeout)
+        return response
+    def get_job(self, job_id: int) -> Dict[str, Any]:
+        """Get speaker job details and status."""
+        if self.async_mode:
+            return self._async_get_job(job_id)
+        return self.client.request("GET", f"/api/v1/speaker/jobs/{job_id}")
+    async def _async_get_job(self, job_id: int) -> Dict[str, Any]:
+        return await self.client.request("GET", f"/api/v1/speaker/jobs/{job_id}")
+    def list_jobs(self, skip: int = 0, limit: int = 50) -> List[Dict[str, Any]]:
+        """List speaker jobs."""
+        if self.async_mode:
+            return self._async_list_jobs(skip, limit)
+        return self.client.request(
+            "GET", "/api/v1/speaker/jobs", params={"skip": skip, "limit": limit}
+        )
+    async def _async_list_jobs(self, skip: int, limit: int) -> List[Dict[str, Any]]:
+        return await self.client.request(
+            "GET", "/api/v1/speaker/jobs", params={"skip": skip, "limit": limit}
+        )
+    def delete_job(self, job_id: int) -> Dict[str, str]:
+        """Delete a speaker job."""
+        if self.async_mode:
+            return self._async_delete_job(job_id)
+        return self.client.request("DELETE", f"/api/v1/speaker/jobs/{job_id}")
+    async def _async_delete_job(self, job_id: int) -> Dict[str, str]:
+        return await self.client.request("DELETE", f"/api/v1/speaker/jobs/{job_id}")

audiopod/services/stem_extraction.py CHANGED Viewed

@@ -1,180 +1,287 @@
 """
-Stem Extraction Service - Audio stem separation operations
+Stem Extraction Service - Audio stem separation
 """
-from typing import List, Optional, Dict, Any, Union
+from typing import List, Optional, Dict, Any, Literal
 from .base import BaseService
-from ..models import Job
 from ..exceptions import ValidationError
+# Valid separation modes for the new API
+StemMode = Literal["single", "two", "four", "six", "producer", "studio", "mastering"]
+SingleStem = Literal["vocals", "drums", "bass", "guitar", "piano", "other", "instrumental"]
 class StemExtractionService(BaseService):
-    """Service for audio stem extraction operations"""
+    """
+    Service for audio stem separation.
+    Example:
+        ```python
+        from audiopod import Client
+        client = Client()
+        # Simple mode-based extraction (recommended)
+        result = client.stem_extraction.separate(
+            url="https://youtube.com/watch?v=VIDEO_ID",
+            mode="six"
+        )
+        for stem, url in result["download_urls"].items():
+            print(f"{stem}: {url}")
+        # Or extract only vocals
+        result = client.stem_extraction.separate(
+            file="song.mp3",
+            mode="single",
+            stem="vocals"
+        )
+        ```
+    """
+    def separate(
+        self,
+        file: Optional[str] = None,
+        url: Optional[str] = None,
+        mode: StemMode = "four",
+        stem: Optional[SingleStem] = None,
+        wait_for_completion: bool = True,
+        timeout: int = 900,
+    ) -> Dict[str, Any]:
+        """
+        Separate audio into stems using simple mode selection.
+        Args:
+            file: Path to local audio file
+            url: URL of audio/video (YouTube, SoundCloud, direct link)
+            mode: Separation mode:
+                - "single": Extract one stem (specify stem param)
+                - "two": Vocals + Instrumental
+                - "four": Vocals, Drums, Bass, Other (default)
+                - "six": Vocals, Drums, Bass, Guitar, Piano, Other
+                - "producer": 8 stems with kick, snare, hihat
+                - "studio": 12 stems for professional mixing
+                - "mastering": 16 stems maximum detail
+            stem: For mode="single", which stem to extract
+            wait_for_completion: Wait for job to complete (default: True)
+            timeout: Max wait time in seconds
+        Returns:
+            Job dict with id, status, download_urls (when completed)
+        """
+        if not file and not url:
+            raise ValidationError("Provide file or url")
+        if file and url:
+            raise ValidationError("Provide file or url, not both")
+        if mode == "single" and not stem:
+            raise ValidationError(
+                "stem parameter required for mode='single'. "
+                "Options: vocals, drums, bass, guitar, piano, other, instrumental"
+            )
+        data = {"mode": mode}
+        if stem:
+            data["stem"] = stem
+        if url:
+            data["url"] = url
+        files = self._prepare_file_upload(file, "file") if file else None
+        if self.async_mode:
+            return self._async_separate(data, files, wait_for_completion, timeout)
+        response = self.client.request(
+            "POST", "/api/v1/stem-extraction/api/extract", data=data, files=files
+        )
+        if wait_for_completion:
+            return self._wait_for_stem_job(response["id"], timeout)
+        return response
+    async def _async_separate(
+        self,
+        data: Dict[str, Any],
+        files: Optional[Dict[str, Any]],
+        wait_for_completion: bool,
+        timeout: int,
+    ) -> Dict[str, Any]:
+        response = await self.client.request(
+            "POST", "/api/v1/stem-extraction/api/extract", data=data, files=files
+        )
+        if wait_for_completion:
+            return await self._async_wait_for_stem_job(response["id"], timeout)
+        return response
+    def extract(
+        self,
+        file: Optional[str] = None,
+        url: Optional[str] = None,
+        mode: StemMode = "four",
+        stem: Optional[SingleStem] = None,
+    ) -> Dict[str, Any]:
+        """
+        Submit stem extraction job (returns immediately without waiting).
+        Use wait_for_completion() to poll for results.
+        """
+        return self.separate(file=file, url=url, mode=mode, stem=stem, wait_for_completion=False)
+    def wait_for_completion(self, job_id: int, timeout: int = 900) -> Dict[str, Any]:
+        """Wait for stem extraction job to complete."""
+        return self._wait_for_stem_job(job_id, timeout)
+    def status(self, job_id: int) -> Dict[str, Any]:
+        """Get stem extraction job status (alias for get_job)."""
+        return self.get_job(job_id)
+    def modes(self) -> Dict[str, Any]:
+        """Get available separation modes."""
+        if self.async_mode:
+            return self._async_modes()
+        return self.client.request("GET", "/api/v1/stem-extraction/modes")
+    async def _async_modes(self) -> Dict[str, Any]:
+        return await self.client.request("GET", "/api/v1/stem-extraction/modes")
+    # Legacy method - kept for backward compatibility
     def extract_stems(
         self,
         audio_file: Optional[str] = None,
         url: Optional[str] = None,
-        stem_types: List[str] = None,
+        stem_types: Optional[List[str]] = None,
         model_name: str = "htdemucs",
         two_stems_mode: Optional[str] = None,
         wait_for_completion: bool = False,
-        timeout: int = 900
-    ) -> Job:
+        timeout: int = 900,
+    ) -> Dict[str, Any]:
         """
-        Extract stems from audio file
+        Extract stems from audio (legacy method).
+        For new code, use separate() instead which uses the simpler mode-based API.
         Args:
-            audio_file: Path to audio file to process
-            url: URL of audio file to process (alternative to audio_file)
-            stem_types: List of stems to extract (e.g., ['vocals', 'drums', 'bass', 'other'])
-            model_name: Model to use for separation ('htdemucs' or 'htdemucs_6s')
-            two_stems_mode: Two-stem mode for vocals/instrumental separation
-            wait_for_completion: Whether to wait for completion
-            timeout: Maximum time to wait
+            audio_file: Path to local audio file
+            url: URL of audio file (alternative to audio_file)
+            stem_types: Stems to extract (e.g., ["vocals", "drums", "bass", "other"])
+            model_name: Model to use ("htdemucs" or "htdemucs_6s")
+            two_stems_mode: Two-stem mode ("vocals", "drums", or "bass")
+            wait_for_completion: Wait for job to complete
+            timeout: Max wait time in seconds
         Returns:
-            Job object with stem extraction details
+            Job dict with id, status, download_urls (when completed)
         """
         if not audio_file and not url:
-            raise ValidationError("Either audio_file or url must be provided")
+            raise ValidationError("Provide audio_file or url")
         if audio_file and url:
-            raise ValidationError("Provide either audio_file or url, not both")
-        # Set default stem types based on model
+            raise ValidationError("Provide audio_file or url, not both")
         if stem_types is None:
-            if model_name == "htdemucs_6s":
-                stem_types = ["vocals", "drums", "bass", "other", "piano", "guitar"]
-            else:
-                stem_types = ["vocals", "drums", "bass", "other"]
-        # Validate model name
-        if model_name not in ["htdemucs", "htdemucs_6s"]:
-            raise ValidationError("Model name must be 'htdemucs' or 'htdemucs_6s'")
-        # Prepare request
-        files = {}
-        data = {
-            "stem_types": str(stem_types),  # API expects string representation
-            "model_name": model_name
-        }
-        if audio_file:
-            files = self._prepare_file_upload(audio_file, "file")
+            stem_types = (
+                ["vocals", "drums", "bass", "other", "piano", "guitar"]
+                if model_name == "htdemucs_6s"
+                else ["vocals", "drums", "bass", "other"]
+            )
+        data = {"stem_types": str(stem_types), "model_name": model_name}
         if url:
             data["url"] = url
         if two_stems_mode:
             data["two_stems_mode"] = two_stems_mode
+        files = self._prepare_file_upload(audio_file, "file") if audio_file else None
         if self.async_mode:
-            return self._async_extract_stems(files, data, wait_for_completion, timeout)
-        else:
-            response = self.client.request(
-                "POST",
-                "/api/v1/stem-extraction/extract",
-                data=data,
-                files=files if files else None
-            )
-            job = Job.from_dict(response)
-            if wait_for_completion:
-                return self._wait_for_completion(job.id, timeout)
-            return job
+            return self._async_extract_stems(data, files, wait_for_completion, timeout)
+        response = self.client.request(
+            "POST", "/api/v1/stem-extraction/extract", data=data, files=files
+        )
+        if wait_for_completion:
+            return self._wait_for_stem_job(response["id"], timeout)
+        return response
     async def _async_extract_stems(
         self,
-        files: Dict[str, Any],
         data: Dict[str, Any],
+        files: Optional[Dict[str, Any]],
         wait_for_completion: bool,
-        timeout: int
-    ) -> Job:
-        """Async version of extract_stems"""
+        timeout: int,
+    ) -> Dict[str, Any]:
         response = await self.client.request(
-            "POST",
-            "/api/v1/stem-extraction/extract",
-            data=data,
-            files=files if files else None
+            "POST", "/api/v1/stem-extraction/extract", data=data, files=files
         )
-        job = Job.from_dict(response)
         if wait_for_completion:
-            return await self._async_wait_for_completion(job.id, timeout)
-        return job
-    def get_stem_job(self, job_id: int) -> Job:
-        """
-        Get stem extraction job status
-        Args:
-            job_id: ID of the stem extraction job
-        Returns:
-            Job object with current status
-        """
+            return await self._async_wait_for_stem_job(response["id"], timeout)
+        return response
+    def get_job(self, job_id: int) -> Dict[str, Any]:
+        """Get stem extraction job status."""
         if self.async_mode:
-            return self._async_get_stem_job(job_id)
-        else:
-            response = self.client.request("GET", f"/api/v1/stem-extraction/status/{job_id}")
-            return Job.from_dict(response)
-    async def _async_get_stem_job(self, job_id: int) -> Job:
-        """Async version of get_stem_job"""
-        response = await self.client.request("GET", f"/api/v1/stem-extraction/status/{job_id}")
-        return Job.from_dict(response)
-    def list_stem_jobs(
-        self,
-        skip: int = 0,
-        limit: int = 50
-    ) -> List[Job]:
-        """
-        List stem extraction jobs
-        Args:
-            skip: Number of jobs to skip
-            limit: Maximum number of jobs to return
-        Returns:
-            List of stem extraction jobs
-        """
-        params = {
-            "skip": skip,
-            "limit": limit
-        }
+            return self._async_get_job(job_id)
+        return self.client.request("GET", f"/api/v1/stem-extraction/status/{job_id}")
+    async def _async_get_job(self, job_id: int) -> Dict[str, Any]:
+        return await self.client.request("GET", f"/api/v1/stem-extraction/status/{job_id}")
+    def list_jobs(self, skip: int = 0, limit: int = 50) -> List[Dict[str, Any]]:
+        """List stem extraction jobs."""
         if self.async_mode:
-            return self._async_list_stem_jobs(params)
-        else:
-            response = self.client.request("GET", "/api/v1/stem-extraction/jobs", params=params)
-            return [Job.from_dict(job_data) for job_data in response]
-    async def _async_list_stem_jobs(self, params: Dict[str, Any]) -> List[Job]:
-        """Async version of list_stem_jobs"""
-        response = await self.client.request("GET", "/api/v1/stem-extraction/jobs", params=params)
-        return [Job.from_dict(job_data) for job_data in response]
-    def delete_stem_job(self, job_id: int) -> Dict[str, str]:
-        """
-        Delete a stem extraction job
-        Args:
-            job_id: ID of the job to delete
-        Returns:
-            Deletion confirmation
-        """
+            return self._async_list_jobs(skip, limit)
+        return self.client.request(
+            "GET", "/api/v1/stem-extraction/jobs", params={"skip": skip, "limit": limit}
+        )
+    async def _async_list_jobs(self, skip: int, limit: int) -> List[Dict[str, Any]]:
+        return await self.client.request(
+            "GET", "/api/v1/stem-extraction/jobs", params={"skip": skip, "limit": limit}
+        )
+    def delete_job(self, job_id: int) -> Dict[str, str]:
+        """Delete a stem extraction job."""
         if self.async_mode:
-            return self._async_delete_stem_job(job_id)
-        else:
-            return self.client.request("DELETE", f"/api/v1/stem-extraction/jobs/{job_id}")
-    async def _async_delete_stem_job(self, job_id: int) -> Dict[str, str]:
-        """Async version of delete_stem_job"""
+            return self._async_delete_job(job_id)
+        return self.client.request("DELETE", f"/api/v1/stem-extraction/jobs/{job_id}")
+    async def _async_delete_job(self, job_id: int) -> Dict[str, str]:
         return await self.client.request("DELETE", f"/api/v1/stem-extraction/jobs/{job_id}")
+    def _wait_for_stem_job(self, job_id: int, timeout: int = 900) -> Dict[str, Any]:
+        """Wait for stem job completion."""
+        import time
+        start = time.time()
+        while time.time() - start < timeout:
+            job = self.get_job(job_id)
+            status = job.get("status", "").upper()
+            if status == "COMPLETED":
+                return job
+            elif status in ["FAILED", "ERROR"]:
+                raise Exception(f"Job failed: {job.get('error_message', 'Unknown')}")
+            time.sleep(5)
+        raise TimeoutError(f"Job {job_id} timed out after {timeout}s")
+    async def _async_wait_for_stem_job(self, job_id: int, timeout: int = 900) -> Dict[str, Any]:
+        """Async wait for stem job completion."""
+        import asyncio
+        import time
+        start = time.time()
+        while time.time() - start < timeout:
+            job = await self.get_job(job_id)
+            status = job.get("status", "").upper()
+            if status == "COMPLETED":
+                return job
+            elif status in ["FAILED", "ERROR"]:
+                raise Exception(f"Job failed: {job.get('error_message', 'Unknown')}")
+            await asyncio.sleep(5)
+        raise TimeoutError(f"Job {job_id} timed out after {timeout}s")

audiopod 1.2.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

audiopod 1.2.0__py3-none-any.whl → 1.5.0__py3-none-any.whl