PyPI - openspeechapi - Versions diffs - 0.1.0__py3-none-any.whl - Mend

openspeechapi 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (118) hide show

openspeech/__init__.py +75 -0
openspeech/__main__.py +5 -0
openspeech/cli.py +413 -0
openspeech/client/__init__.py +4 -0
openspeech/client/client.py +145 -0
openspeech/config.py +212 -0
openspeech/core/__init__.py +0 -0
openspeech/core/base.py +75 -0
openspeech/core/enums.py +39 -0
openspeech/core/models.py +61 -0
openspeech/core/registry.py +37 -0
openspeech/core/settings.py +8 -0
openspeech/demo.py +675 -0
openspeech/dispatch/__init__.py +0 -0
openspeech/dispatch/context.py +34 -0
openspeech/dispatch/dispatcher.py +661 -0
openspeech/dispatch/executors/__init__.py +0 -0
openspeech/dispatch/executors/base.py +34 -0
openspeech/dispatch/executors/in_process.py +66 -0
openspeech/dispatch/executors/remote.py +64 -0
openspeech/dispatch/executors/subprocess_exec.py +446 -0
openspeech/dispatch/fanout.py +95 -0
openspeech/dispatch/filters.py +73 -0
openspeech/dispatch/lifecycle.py +178 -0
openspeech/dispatch/watcher.py +82 -0
openspeech/engine_catalog.py +236 -0
openspeech/engine_registry.yaml +347 -0
openspeech/exceptions.py +51 -0
openspeech/factory.py +325 -0
openspeech/local_engines/__init__.py +12 -0
openspeech/local_engines/aim_resolver.py +91 -0
openspeech/local_engines/backends/__init__.py +1 -0
openspeech/local_engines/backends/docker_backend.py +490 -0
openspeech/local_engines/backends/native_backend.py +902 -0
openspeech/local_engines/base.py +30 -0
openspeech/local_engines/engines/__init__.py +1 -0
openspeech/local_engines/engines/faster_whisper.py +36 -0
openspeech/local_engines/engines/fish_speech.py +33 -0
openspeech/local_engines/engines/sherpa_onnx.py +56 -0
openspeech/local_engines/engines/whisper.py +41 -0
openspeech/local_engines/engines/whisperlivekit.py +60 -0
openspeech/local_engines/manager.py +208 -0
openspeech/local_engines/models.py +50 -0
openspeech/local_engines/progress.py +69 -0
openspeech/local_engines/registry.py +19 -0
openspeech/local_engines/task_store.py +52 -0
openspeech/local_engines/tasks.py +71 -0
openspeech/logging_config.py +607 -0
openspeech/observe/__init__.py +0 -0
openspeech/observe/base.py +79 -0
openspeech/observe/debug.py +44 -0
openspeech/observe/latency.py +19 -0
openspeech/observe/metrics.py +47 -0
openspeech/observe/tracing.py +44 -0
openspeech/observe/usage.py +27 -0
openspeech/providers/__init__.py +0 -0
openspeech/providers/_template.py +101 -0
openspeech/providers/stt/__init__.py +0 -0
openspeech/providers/stt/alibaba.py +86 -0
openspeech/providers/stt/assemblyai.py +135 -0
openspeech/providers/stt/azure_speech.py +99 -0
openspeech/providers/stt/baidu.py +135 -0
openspeech/providers/stt/deepgram.py +311 -0
openspeech/providers/stt/elevenlabs.py +385 -0
openspeech/providers/stt/faster_whisper.py +211 -0
openspeech/providers/stt/google_cloud.py +106 -0
openspeech/providers/stt/iflytek.py +427 -0
openspeech/providers/stt/macos_speech.py +226 -0
openspeech/providers/stt/openai.py +84 -0
openspeech/providers/stt/sherpa_onnx.py +353 -0
openspeech/providers/stt/tencent.py +212 -0
openspeech/providers/stt/volcengine.py +107 -0
openspeech/providers/stt/whisper.py +153 -0
openspeech/providers/stt/whisperlivekit.py +530 -0
openspeech/providers/stt/windows_speech.py +249 -0
openspeech/providers/tts/__init__.py +0 -0
openspeech/providers/tts/alibaba.py +95 -0
openspeech/providers/tts/azure_speech.py +123 -0
openspeech/providers/tts/baidu.py +143 -0
openspeech/providers/tts/coqui.py +64 -0
openspeech/providers/tts/cosyvoice.py +90 -0
openspeech/providers/tts/deepgram.py +174 -0
openspeech/providers/tts/elevenlabs.py +311 -0
openspeech/providers/tts/fish_speech.py +158 -0
openspeech/providers/tts/google_cloud.py +107 -0
openspeech/providers/tts/iflytek.py +209 -0
openspeech/providers/tts/macos_say.py +251 -0
openspeech/providers/tts/minimax.py +122 -0
openspeech/providers/tts/openai.py +104 -0
openspeech/providers/tts/piper.py +104 -0
openspeech/providers/tts/tencent.py +189 -0
openspeech/providers/tts/volcengine.py +117 -0
openspeech/providers/tts/windows_sapi.py +234 -0
openspeech/server/__init__.py +1 -0
openspeech/server/app.py +72 -0
openspeech/server/auth.py +42 -0
openspeech/server/middleware.py +75 -0
openspeech/server/routes/__init__.py +1 -0
openspeech/server/routes/management.py +848 -0
openspeech/server/routes/stt.py +121 -0
openspeech/server/routes/tts.py +159 -0
openspeech/server/routes/webui.py +29 -0
openspeech/server/webui/app.js +2649 -0
openspeech/server/webui/index.html +216 -0
openspeech/server/webui/styles.css +617 -0
openspeech/server/ws/__init__.py +1 -0
openspeech/server/ws/stt_stream.py +263 -0
openspeech/server/ws/tts_stream.py +207 -0
openspeech/telemetry/__init__.py +21 -0
openspeech/telemetry/perf.py +307 -0
openspeech/utils/__init__.py +5 -0
openspeech/utils/audio_converter.py +406 -0
openspeech/utils/audio_playback.py +156 -0
openspeech/vendor_registry.yaml +74 -0
openspeechapi-0.1.0.dist-info/METADATA +101 -0
openspeechapi-0.1.0.dist-info/RECORD +118 -0
openspeechapi-0.1.0.dist-info/WHEEL +4 -0
openspeechapi-0.1.0.dist-info/entry_points.txt +3 -0

openspeech/engine_registry.yaml ADDED Viewed

@@ -0,0 +1,347 @@
+# Engine Registry — lists all available engines with basic metadata.
+# Provider code supplies default_settings and field_options at runtime.
+# This file can be updated from a remote URL in the future.
+version: 1
+engines:
+  # ---- Cloud STT ----
+  - name: openai-stt
+    vendor: openai
+    provider: openai-stt
+    type: stt
+    category: cloud
+    display_name: "OpenAI STT"
+    description: "OpenAI Whisper API (also compatible with Groq, SiliconFlow)"
+    default_alias: openai_stt
+    default_exec_mode: remote
+    pip_extras: [openai]
+  - name: deepgram-stt
+    vendor: deepgram
+    provider: deepgram
+    type: stt
+    category: cloud
+    display_name: "Deepgram STT"
+    description: "Deepgram Nova STT — fast, accurate, word-level timestamps"
+    default_alias: deepgram_stt
+    default_exec_mode: remote
+    pip_extras: [deepgram]
+  - name: elevenlabs-stt
+    vendor: elevenlabs
+    provider: elevenlabs-stt
+    type: stt
+    category: cloud
+    display_name: "ElevenLabs STT"
+    description: "ElevenLabs Scribe Speech-to-Text"
+    default_alias: elevenlabs_stt
+    default_exec_mode: remote
+    pip_extras: [elevenlabs-stt]
+  - name: deepgram-tts
+    vendor: deepgram
+    provider: deepgram-tts
+    type: tts
+    category: cloud
+    display_name: "Deepgram TTS"
+    description: "Deepgram Aura TTS — fast, natural text-to-speech"
+    default_alias: deepgram_tts
+    default_exec_mode: remote
+  - name: google-stt
+    vendor: google
+    provider: google-stt
+    type: stt
+    category: cloud
+    display_name: "Google STT"
+    description: "Google Cloud Speech-to-Text v1"
+    default_alias: google_stt
+    default_exec_mode: remote
+  - name: azure-stt
+    vendor: azure
+    provider: azure-stt
+    type: stt
+    category: cloud
+    display_name: "Azure STT"
+    description: "Azure Cognitive Services Speech-to-Text"
+    default_alias: azure_stt
+    default_exec_mode: remote
+  - name: assemblyai-stt
+    vendor: assemblyai
+    provider: assemblyai-stt
+    type: stt
+    category: cloud
+    display_name: "AssemblyAI STT"
+    description: "AssemblyAI STT — async upload + poll"
+    default_alias: assemblyai_stt
+    default_exec_mode: remote
+  - name: volcengine-stt
+    vendor: volcengine
+    provider: volcengine-stt
+    type: stt
+    category: cloud
+    display_name: "Volcengine STT"
+    description: "Volcengine (火山引擎) Speech-to-Text"
+    default_alias: volcengine_stt
+    default_exec_mode: remote
+  - name: alibaba-stt
+    vendor: alibaba
+    provider: alibaba-stt
+    type: stt
+    category: cloud
+    display_name: "Alibaba STT"
+    description: "Alibaba Cloud (阿里云百炼) STT — OpenAI-compatible"
+    default_alias: alibaba_stt
+    default_exec_mode: remote
+  - name: tencent-stt
+    vendor: tencent
+    provider: tencent-stt
+    type: stt
+    category: cloud
+    display_name: "Tencent STT"
+    description: "Tencent Cloud (腾讯云) Speech-to-Text"
+    default_alias: tencent_stt
+    default_exec_mode: remote
+  - name: baidu-stt
+    vendor: baidu
+    provider: baidu-stt
+    type: stt
+    category: cloud
+    display_name: "Baidu STT"
+    description: "Baidu (百度) Speech-to-Text"
+    default_alias: baidu_stt
+    default_exec_mode: remote
+  - name: iflytek-stt
+    vendor: iflytek
+    provider: iflytek-stt
+    type: stt
+    category: cloud
+    display_name: "iFlytek STT"
+    description: "iFlytek (科大讯飞) Speech-to-Text"
+    default_alias: iflytek_stt
+    default_exec_mode: remote
+    pip_extras: [iflytek-stt]
+  # ---- Cloud TTS ----
+  - name: openai-tts
+    vendor: openai
+    provider: openai-tts
+    type: tts
+    category: cloud
+    display_name: "OpenAI TTS"
+    description: "OpenAI TTS API (also compatible with Groq, SiliconFlow, Minimax)"
+    default_alias: openai_tts
+    default_exec_mode: remote
+    pip_extras: [openai]
+  - name: elevenlabs-tts
+    vendor: elevenlabs
+    provider: elevenlabs
+    type: tts
+    category: cloud
+    display_name: "ElevenLabs TTS"
+    description: "ElevenLabs TTS — high quality, voice cloning"
+    default_alias: elevenlabs
+    default_exec_mode: remote
+    pip_extras: [elevenlabs-tts]
+  - name: minimax-tts
+    vendor: minimax
+    provider: minimax
+    type: tts
+    category: cloud
+    display_name: "MiniMax TTS"
+    description: "MiniMax TTS — 300+ voices, OpenAI-compatible"
+    default_alias: minimax
+    default_exec_mode: remote
+  - name: google-tts
+    vendor: google
+    provider: google-tts
+    type: tts
+    category: cloud
+    display_name: "Google TTS"
+    description: "Google Cloud Text-to-Speech"
+    default_alias: google_tts
+    default_exec_mode: remote
+  - name: azure-tts
+    vendor: azure
+    provider: azure-tts
+    type: tts
+    category: cloud
+    display_name: "Azure TTS"
+    description: "Azure Cognitive Services Text-to-Speech"
+    default_alias: azure_tts
+    default_exec_mode: remote
+  - name: volcengine-tts
+    vendor: volcengine
+    provider: volcengine-tts
+    type: tts
+    category: cloud
+    display_name: "Volcengine TTS"
+    description: "Volcengine (火山引擎) Text-to-Speech"
+    default_alias: volcengine_tts
+    default_exec_mode: remote
+  - name: alibaba-tts
+    vendor: alibaba
+    provider: alibaba-tts
+    type: tts
+    category: cloud
+    display_name: "Alibaba TTS"
+    description: "Alibaba Cloud (阿里云百炼) TTS — OpenAI-compatible"
+    default_alias: alibaba_tts
+    default_exec_mode: remote
+  - name: tencent-tts
+    vendor: tencent
+    provider: tencent-tts
+    type: tts
+    category: cloud
+    display_name: "Tencent TTS"
+    description: "Tencent Cloud (腾讯云) Text-to-Speech"
+    default_alias: tencent_tts
+    default_exec_mode: remote
+  - name: baidu-tts
+    vendor: baidu
+    provider: baidu-tts
+    type: tts
+    category: cloud
+    display_name: "Baidu TTS"
+    description: "Baidu (百度) Text-to-Speech"
+    default_alias: baidu_tts
+    default_exec_mode: remote
+  - name: iflytek-tts
+    vendor: iflytek
+    provider: iflytek-tts
+    type: tts
+    category: cloud
+    display_name: "iFlytek TTS"
+    description: "iFlytek (科大讯飞) Text-to-Speech"
+    default_alias: iflytek_tts
+    default_exec_mode: remote
+    pip_extras: [iflytek-tts]
+  # ---- Local STT ----
+  - name: faster-whisper
+    provider: faster-whisper
+    type: stt
+    category: local
+    display_name: "Faster Whisper"
+    description: "Faster Whisper — CTranslate2-based, fast local STT"
+    default_alias: stt_fw
+    default_exec_mode: subprocess
+    pip_extras: [faster-whisper]
+  - name: whisper
+    provider: whisper
+    type: stt
+    category: local
+    display_name: "Whisper"
+    description: "OpenAI Whisper — original local STT model"
+    default_alias: stt_whisper
+    default_exec_mode: subprocess
+    pip_extras: [whisper]
+  - name: whisperlivekit
+    provider: whisperlivekit-stt
+    type: stt
+    category: local
+    display_name: "WhisperLiveKit"
+    description: "WhisperLiveKit — streaming STT with MLX backend"
+    default_alias: stt_wlk
+    default_exec_mode: local
+    pip_extras: [whisperlivekit]
+  - name: sherpa-onnx
+    provider: sherpa-onnx-stt
+    type: stt
+    category: local
+    display_name: "Sherpa ONNX"
+    description: "Sherpa-ONNX — lightweight streaming STT"
+    default_alias: stt_sherpa
+    default_exec_mode: local
+  # ---- Local TTS ----
+  - name: fish-speech
+    provider: fish-speech
+    type: tts
+    category: local
+    display_name: "Fish Speech"
+    description: "Fish Speech — high quality local TTS"
+    default_alias: fish_speech
+    default_exec_mode: local
+    pip_extras: [fish-speech]
+  # ---- macOS Native ----
+  - name: macos-stt
+    provider: macos-stt
+    type: stt
+    category: native
+    display_name: "macOS STT"
+    description: "macOS SFSpeechRecognizer — built-in speech recognition"
+    default_alias: macos_stt
+    default_exec_mode: in_process
+    platforms: [darwin]
+  - name: macos-tts
+    provider: macos-say
+    type: tts
+    category: native
+    display_name: "macOS TTS"
+    description: "macOS say command — built-in text-to-speech"
+    default_alias: macos_tts
+    default_exec_mode: in_process
+    platforms: [darwin]
+  # ---- Windows Native ----
+  - name: windows-stt
+    provider: windows-stt
+    type: stt
+    category: native
+    display_name: "Windows STT"
+    description: "Windows System.Speech — built-in speech recognition"
+    default_alias: windows_stt
+    default_exec_mode: in_process
+    platforms: [win32]
+  - name: windows-tts
+    provider: windows-tts
+    type: tts
+    category: native
+    display_name: "Windows TTS"
+    description: "Windows SAPI5 — built-in text-to-speech"
+    default_alias: windows_tts
+    default_exec_mode: in_process
+    platforms: [win32]
+    pip_extras: [windows-tts]
+  # ---- Cross-platform Native (auto-detect) ----
+  - name: native-stt
+    provider: native-stt
+    type: stt
+    category: native
+    display_name: "Native STT"
+    description: "Platform native STT (macOS SFSpeech / Windows System.Speech)"
+    default_alias: native_stt
+    default_exec_mode: in_process
+  - name: native-tts
+    provider: native-tts
+    type: tts
+    category: native
+    display_name: "Native TTS"
+    description: "Platform native TTS (macOS say / Windows SAPI5)"
+    default_alias: native_tts
+    default_exec_mode: in_process

openspeech/exceptions.py ADDED Viewed

@@ -0,0 +1,51 @@
+"""OpenSpeech exception hierarchy."""
+class OpenSpeechError(Exception):
+    """Base exception for all OpenSpeech errors.
+
+    Catching this type also catches every exception class derived from it.
+    """
+class ProviderError(OpenSpeechError):
+    """Error from a provider invocation."""
+    def __init__(self, provider_name: str, original_type: str, message: str) -> None:
+        self.provider_name = provider_name
+        self.original_type = original_type
+        super().__init__(f"[{provider_name}] {original_type}: {message}")
+class ProviderCrashedError(OpenSpeechError):
+    """Provider subprocess crashed during invocation."""
+    def __init__(self, provider_name: str) -> None:
+        self.provider_name = provider_name
+        super().__init__(f"Provider '{provider_name}' crashed during invocation")
+class ProviderUnavailableError(OpenSpeechError):
+    """Provider exhausted restart attempts and is unavailable."""
+    def __init__(self, provider_name: str) -> None:
+        self.provider_name = provider_name
+        super().__init__(f"Provider '{provider_name}' is unavailable (max restarts exhausted)")
+class ConfigError(OpenSpeechError):
+    """Configuration loading or validation error.
+
+    Defines no constructor of its own, so it takes the standard exception
+    arguments (typically a single message string).
+    """
+class FanOutAllFailedError(OpenSpeechError):
+    """All providers in a fanout invocation failed."""
+    def __init__(self, errors: dict[str, Exception]) -> None:
+        self.errors = errors
+        names = ", ".join(errors.keys())
+        super().__init__(f"All fanout providers failed: {names}")
+class ProviderNotFoundError(OpenSpeechError):
+    """Provider not found in registry or dispatcher."""
+    def __init__(self, name: str) -> None:
+        self.name = name
+        super().__init__(f"Provider '{name}' not found")