livekit-plugins-speechmatics 0.0.2__tar.gz → 1.0.0.dev5__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- livekit_plugins_speechmatics-1.0.0.dev5/.gitignore +168 -0
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/PKG-INFO +10 -20
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/stt.py +13 -23
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/types.py +5 -7
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/utils.py +3 -9
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/version.py +1 -1
- livekit_plugins_speechmatics-1.0.0.dev5/pyproject.toml +39 -0
- livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/PKG-INFO +0 -66
- livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/SOURCES.txt +0 -14
- livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/dependency_links.txt +0 -1
- livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/requires.txt +0 -1
- livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/top_level.txt +0 -1
- livekit_plugins_speechmatics-0.0.2/setup.cfg +0 -4
- livekit_plugins_speechmatics-0.0.2/setup.py +0 -58
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/README.md +0 -0
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/__init__.py +0 -0
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/log.py +0 -0
- {livekit_plugins_speechmatics-0.0.2 → livekit_plugins_speechmatics-1.0.0.dev5}/livekit/plugins/speechmatics/py.typed +0 -0
@@ -0,0 +1,168 @@
|
|
1
|
+
**/.vscode
|
2
|
+
**/.DS_Store
|
3
|
+
|
4
|
+
# Byte-compiled / optimized / DLL files
|
5
|
+
__pycache__/
|
6
|
+
*.py[cod]
|
7
|
+
*$py.class
|
8
|
+
|
9
|
+
# C extensions
|
10
|
+
*.so
|
11
|
+
|
12
|
+
# Distribution / packaging
|
13
|
+
.Python
|
14
|
+
build/
|
15
|
+
develop-eggs/
|
16
|
+
dist/
|
17
|
+
downloads/
|
18
|
+
eggs/
|
19
|
+
.eggs/
|
20
|
+
lib/
|
21
|
+
lib64/
|
22
|
+
parts/
|
23
|
+
sdist/
|
24
|
+
var/
|
25
|
+
wheels/
|
26
|
+
share/python-wheels/
|
27
|
+
*.egg-info/
|
28
|
+
.installed.cfg
|
29
|
+
*.egg
|
30
|
+
MANIFEST
|
31
|
+
|
32
|
+
# PyInstaller
|
33
|
+
# Usually these files are written by a python script from a template
|
34
|
+
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
35
|
+
*.manifest
|
36
|
+
*.spec
|
37
|
+
|
38
|
+
# Installer logs
|
39
|
+
pip-log.txt
|
40
|
+
pip-delete-this-directory.txt
|
41
|
+
|
42
|
+
# Unit test / coverage reports
|
43
|
+
htmlcov/
|
44
|
+
.tox/
|
45
|
+
.nox/
|
46
|
+
.coverage
|
47
|
+
.coverage.*
|
48
|
+
.cache
|
49
|
+
nosetests.xml
|
50
|
+
coverage.xml
|
51
|
+
*.cover
|
52
|
+
*.py,cover
|
53
|
+
.hypothesis/
|
54
|
+
.pytest_cache/
|
55
|
+
cover/
|
56
|
+
|
57
|
+
# Translations
|
58
|
+
*.mo
|
59
|
+
*.pot
|
60
|
+
|
61
|
+
# Django stuff:
|
62
|
+
*.log
|
63
|
+
local_settings.py
|
64
|
+
db.sqlite3
|
65
|
+
db.sqlite3-journal
|
66
|
+
|
67
|
+
# Flask stuff:
|
68
|
+
instance/
|
69
|
+
.webassets-cache
|
70
|
+
|
71
|
+
# Scrapy stuff:
|
72
|
+
.scrapy
|
73
|
+
|
74
|
+
# Sphinx documentation
|
75
|
+
docs/_build/
|
76
|
+
|
77
|
+
# PyBuilder
|
78
|
+
.pybuilder/
|
79
|
+
target/
|
80
|
+
|
81
|
+
# Jupyter Notebook
|
82
|
+
.ipynb_checkpoints
|
83
|
+
|
84
|
+
# IPython
|
85
|
+
profile_default/
|
86
|
+
ipython_config.py
|
87
|
+
|
88
|
+
# pyenv
|
89
|
+
# For a library or package, you might want to ignore these files since the code is
|
90
|
+
# intended to run in multiple environments; otherwise, check them in:
|
91
|
+
# .python-version
|
92
|
+
|
93
|
+
# pipenv
|
94
|
+
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
95
|
+
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
96
|
+
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
97
|
+
# install all needed dependencies.
|
98
|
+
#Pipfile.lock
|
99
|
+
|
100
|
+
# poetry
|
101
|
+
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
|
102
|
+
# This is especially recommended for binary packages to ensure reproducibility, and is more
|
103
|
+
# commonly ignored for libraries.
|
104
|
+
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
|
105
|
+
#poetry.lock
|
106
|
+
|
107
|
+
# pdm
|
108
|
+
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
|
109
|
+
#pdm.lock
|
110
|
+
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
|
111
|
+
# in version control.
|
112
|
+
# https://pdm.fming.dev/#use-with-ide
|
113
|
+
.pdm.toml
|
114
|
+
|
115
|
+
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
|
116
|
+
__pypackages__/
|
117
|
+
|
118
|
+
# Celery stuff
|
119
|
+
celerybeat-schedule
|
120
|
+
celerybeat.pid
|
121
|
+
|
122
|
+
# SageMath parsed files
|
123
|
+
*.sage.py
|
124
|
+
|
125
|
+
# Environments
|
126
|
+
.env
|
127
|
+
.venv
|
128
|
+
env/
|
129
|
+
venv/
|
130
|
+
ENV/
|
131
|
+
env.bak/
|
132
|
+
venv.bak/
|
133
|
+
|
134
|
+
# Spyder project settings
|
135
|
+
.spyderproject
|
136
|
+
.spyproject
|
137
|
+
|
138
|
+
# Rope project settings
|
139
|
+
.ropeproject
|
140
|
+
|
141
|
+
# mkdocs documentation
|
142
|
+
/site
|
143
|
+
|
144
|
+
# mypy
|
145
|
+
.mypy_cache/
|
146
|
+
.dmypy.json
|
147
|
+
dmypy.json
|
148
|
+
|
149
|
+
# Pyre type checker
|
150
|
+
.pyre/
|
151
|
+
|
152
|
+
# pytype static type analyzer
|
153
|
+
.pytype/
|
154
|
+
|
155
|
+
# Cython debug symbols
|
156
|
+
cython_debug/
|
157
|
+
|
158
|
+
# PyCharm
|
159
|
+
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
|
160
|
+
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
|
161
|
+
# and can be added to the global gitignore or merged into this file. For a more nuclear
|
162
|
+
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
|
163
|
+
.idea/
|
164
|
+
|
165
|
+
node_modules
|
166
|
+
|
167
|
+
credentials.json
|
168
|
+
pyrightconfig.json
|
@@ -1,35 +1,25 @@
|
|
1
|
-
Metadata-Version: 2.2
|
1
|
+
Metadata-Version: 2.4
|
2
2
|
Name: livekit-plugins-speechmatics
|
3
|
-
Version: 0.0.2
|
3
|
+
Version: 1.0.0.dev5
|
4
4
|
Summary: Agent Framework plugin for Speechmatics
|
5
|
-
Home-page: https://github.com/livekit/agents
|
6
|
-
License: Apache-2.0
|
7
5
|
Project-URL: Documentation, https://docs.livekit.io
|
8
6
|
Project-URL: Website, https://livekit.io/
|
9
7
|
Project-URL: Source, https://github.com/livekit/agents
|
10
|
-
|
8
|
+
Author-email: LiveKit <support@livekit.io>
|
9
|
+
License-Expression: Apache-2.0
|
10
|
+
Keywords: audio,livekit,realtime,video,webrtc
|
11
11
|
Classifier: Intended Audience :: Developers
|
12
12
|
Classifier: License :: OSI Approved :: Apache Software License
|
13
|
-
Classifier: Topic :: Multimedia :: Sound/Audio
|
14
|
-
Classifier: Topic :: Multimedia :: Video
|
15
|
-
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
16
13
|
Classifier: Programming Language :: Python :: 3
|
14
|
+
Classifier: Programming Language :: Python :: 3 :: Only
|
17
15
|
Classifier: Programming Language :: Python :: 3.9
|
18
16
|
Classifier: Programming Language :: Python :: 3.10
|
19
|
-
Classifier: Programming Language :: Python :: 3 :: Only
|
17
|
+
Classifier: Topic :: Multimedia :: Sound/Audio
|
18
|
+
Classifier: Topic :: Multimedia :: Video
|
19
|
+
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
20
20
|
Requires-Python: >=3.9.0
|
21
|
+
Requires-Dist: livekit-agents>=1.0.0.dev5
|
21
22
|
Description-Content-Type: text/markdown
|
22
|
-
Requires-Dist: livekit-agents<1.0.0,>=0.12.16
|
23
|
-
Dynamic: classifier
|
24
|
-
Dynamic: description
|
25
|
-
Dynamic: description-content-type
|
26
|
-
Dynamic: home-page
|
27
|
-
Dynamic: keywords
|
28
|
-
Dynamic: license
|
29
|
-
Dynamic: project-url
|
30
|
-
Dynamic: requires-dist
|
31
|
-
Dynamic: requires-python
|
32
|
-
Dynamic: summary
|
33
23
|
|
34
24
|
# LiveKit Plugins Speechmatics
|
35
25
|
|
@@ -20,9 +20,9 @@ import dataclasses
|
|
20
20
|
import json
|
21
21
|
import os
|
22
22
|
import weakref
|
23
|
-
from typing import Dict, List, Optional
|
24
23
|
|
25
24
|
import aiohttp
|
25
|
+
|
26
26
|
from livekit.agents import (
|
27
27
|
DEFAULT_API_CONNECT_OPTIONS,
|
28
28
|
APIConnectOptions,
|
@@ -57,8 +57,8 @@ class STT(stt.STT):
|
|
57
57
|
url="wss://eu2.rt.speechmatics.com/v2",
|
58
58
|
),
|
59
59
|
audio_settings: AudioSettings = AudioSettings(),
|
60
|
-
http_session:
|
61
|
-
extra_headers:
|
60
|
+
http_session: aiohttp.ClientSession | None = None,
|
61
|
+
extra_headers: dict | None = None,
|
62
62
|
):
|
63
63
|
super().__init__(
|
64
64
|
capabilities=stt.STTCapabilities(
|
@@ -91,9 +91,9 @@ class STT(stt.STT):
|
|
91
91
|
def stream(
|
92
92
|
self,
|
93
93
|
*,
|
94
|
-
language:
|
94
|
+
language: str | None = None,
|
95
95
|
conn_options: APIConnectOptions = DEFAULT_API_CONNECT_OPTIONS,
|
96
|
-
) ->
|
96
|
+
) -> SpeechStream:
|
97
97
|
config = dataclasses.replace(self._audio_settings)
|
98
98
|
stream = SpeechStream(
|
99
99
|
stt=self,
|
@@ -118,11 +118,9 @@ class SpeechStream(stt.SpeechStream):
|
|
118
118
|
connection_settings: ConnectionSettings,
|
119
119
|
conn_options: APIConnectOptions,
|
120
120
|
http_session: aiohttp.ClientSession,
|
121
|
-
extra_headers:
|
121
|
+
extra_headers: dict | None = None,
|
122
122
|
) -> None:
|
123
|
-
super().__init__(
|
124
|
-
stt=stt, conn_options=conn_options, sample_rate=audio_settings.sample_rate
|
125
|
-
)
|
123
|
+
super().__init__(stt=stt, conn_options=conn_options, sample_rate=audio_settings.sample_rate)
|
126
124
|
self._transcription_config = transcription_config
|
127
125
|
self._audio_settings = audio_settings
|
128
126
|
self._connection_settings = connection_settings
|
@@ -188,9 +186,7 @@ class SpeechStream(stt.SpeechStream):
|
|
188
186
|
return
|
189
187
|
|
190
188
|
# this will trigger a reconnection, see the _run loop
|
191
|
-
raise APIStatusError(
|
192
|
-
message="Speechmatics connection closed unexpectedly"
|
193
|
-
)
|
189
|
+
raise APIStatusError(message="Speechmatics connection closed unexpectedly")
|
194
190
|
|
195
191
|
try:
|
196
192
|
data = json.loads(msg.data)
|
@@ -229,9 +225,7 @@ class SpeechStream(stt.SpeechStream):
|
|
229
225
|
await ws.close()
|
230
226
|
|
231
227
|
async def _connect_ws(self) -> aiohttp.ClientWebSocketResponse:
|
232
|
-
api_key = self._connection_settings.api_key or os.environ.get(
|
233
|
-
"SPEECHMATICS_API_KEY"
|
234
|
-
)
|
228
|
+
api_key = self._connection_settings.api_key or os.environ.get("SPEECHMATICS_API_KEY")
|
235
229
|
if api_key is None:
|
236
230
|
raise ValueError(
|
237
231
|
"Speechmatics API key is required. "
|
@@ -244,9 +238,7 @@ class SpeechStream(stt.SpeechStream):
|
|
244
238
|
"Authorization": f"Bearer {api_key}",
|
245
239
|
**self._extra_headers,
|
246
240
|
}
|
247
|
-
url = sanitize_url(
|
248
|
-
self._connection_settings.url, self._transcription_config.language
|
249
|
-
)
|
241
|
+
url = sanitize_url(self._connection_settings.url, self._transcription_config.language)
|
250
242
|
return await self._session.ws_connect(
|
251
243
|
url,
|
252
244
|
ssl=self._connection_settings.ssl_context,
|
@@ -281,9 +273,7 @@ class SpeechStream(stt.SpeechStream):
|
|
281
273
|
usage_event = stt.SpeechEvent(
|
282
274
|
type=stt.SpeechEventType.RECOGNITION_USAGE,
|
283
275
|
alternatives=[],
|
284
|
-
recognition_usage=stt.RecognitionUsage(
|
285
|
-
audio_duration=self._speech_duration
|
286
|
-
),
|
276
|
+
recognition_usage=stt.RecognitionUsage(audio_duration=self._speech_duration),
|
287
277
|
)
|
288
278
|
self._event_ch.send_nowait(usage_event)
|
289
279
|
self._speech_duration = 0
|
@@ -295,8 +285,8 @@ class SpeechStream(stt.SpeechStream):
|
|
295
285
|
raise Exception("Speechmatics connection closed unexpectedly")
|
296
286
|
|
297
287
|
|
298
|
-
def live_transcription_to_speech_data(data: dict) ->
|
299
|
-
speech_data:
|
288
|
+
def live_transcription_to_speech_data(data: dict) -> list[stt.SpeechData]:
|
289
|
+
speech_data: list[stt.SpeechData] = []
|
300
290
|
|
301
291
|
for result in data.get("results", []):
|
302
292
|
start_time, end_time, is_eos = (
|
@@ -1,7 +1,7 @@
|
|
1
1
|
import ssl
|
2
2
|
from dataclasses import asdict, dataclass, field
|
3
3
|
from enum import Enum
|
4
|
-
from typing import Any,
|
4
|
+
from typing import Any, Optional
|
5
5
|
|
6
6
|
|
7
7
|
@dataclass
|
@@ -20,10 +20,10 @@ class TranscriptionConfig:
|
|
20
20
|
diarization: Optional[str] = None
|
21
21
|
"""Indicates type of diarization to use, if any."""
|
22
22
|
|
23
|
-
additional_vocab: Optional[
|
23
|
+
additional_vocab: Optional[dict] = None
|
24
24
|
"""Additional vocabulary that is not part of the standard language."""
|
25
25
|
|
26
|
-
punctuation_overrides: Optional[
|
26
|
+
punctuation_overrides: Optional[dict] = None
|
27
27
|
"""Permitted puctuation marks for advanced punctuation."""
|
28
28
|
|
29
29
|
enable_entities: Optional[bool] = None
|
@@ -46,11 +46,9 @@ class TranscriptionConfig:
|
|
46
46
|
"""Indicates if partials for transcription, where words are produced
|
47
47
|
immediately, is enabled."""
|
48
48
|
|
49
|
-
def asdict(self) ->
|
49
|
+
def asdict(self) -> dict[Any, Any]:
|
50
50
|
"""Returns model as a dict while excluding None values recursively."""
|
51
|
-
return asdict(
|
52
|
-
self, dict_factory=lambda x: {k: v for (k, v) in x if v is not None}
|
53
|
-
)
|
51
|
+
return asdict(self, dict_factory=lambda x: {k: v for (k, v) in x if v is not None})
|
54
52
|
|
55
53
|
|
56
54
|
@dataclass
|
@@ -5,26 +5,20 @@ import aiohttp
|
|
5
5
|
|
6
6
|
|
7
7
|
async def get_access_token(api_key: str) -> str:
|
8
|
-
mp_api_url = os.getenv(
|
9
|
-
"SPEECHMATICS_MANAGEMENT_PLATFORM_URL", "https://mp.speechmatics.com"
|
10
|
-
)
|
8
|
+
mp_api_url = os.getenv("SPEECHMATICS_MANAGEMENT_PLATFORM_URL", "https://mp.speechmatics.com")
|
11
9
|
endpoint = f"{mp_api_url}/v1/api_keys"
|
12
10
|
params = {"type": "rt", "sm-sdk": get_sdk_version()}
|
13
11
|
json_body = {"ttl": 60}
|
14
12
|
headers = {"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"}
|
15
13
|
|
16
14
|
async with aiohttp.ClientSession() as session:
|
17
|
-
async with session.post(
|
18
|
-
endpoint, params=params, json=json_body, headers=headers
|
19
|
-
) as resp:
|
15
|
+
async with session.post(endpoint, params=params, json=json_body, headers=headers) as resp:
|
20
16
|
if resp.status == 201:
|
21
17
|
try:
|
22
18
|
data = await resp.json()
|
23
19
|
return data["key_value"]
|
24
20
|
except (ValueError, KeyError) as e:
|
25
|
-
raise Exception(
|
26
|
-
f"Failed to parse Speechmatics access token response: {e}"
|
27
|
-
)
|
21
|
+
raise Exception(f"Failed to parse Speechmatics access token response: {e}")
|
28
22
|
else:
|
29
23
|
error_message = await resp.text()
|
30
24
|
raise Exception(
|
@@ -0,0 +1,39 @@
|
|
1
|
+
[build-system]
|
2
|
+
requires = ["hatchling"]
|
3
|
+
build-backend = "hatchling.build"
|
4
|
+
|
5
|
+
[project]
|
6
|
+
name = "livekit-plugins-speechmatics"
|
7
|
+
dynamic = ["version"]
|
8
|
+
description = "Agent Framework plugin for Speechmatics"
|
9
|
+
readme = "README.md"
|
10
|
+
license = "Apache-2.0"
|
11
|
+
requires-python = ">=3.9.0"
|
12
|
+
authors = [{ name = "LiveKit", email = "support@livekit.io" }]
|
13
|
+
keywords = ["webrtc", "realtime", "audio", "video", "livekit"]
|
14
|
+
classifiers = [
|
15
|
+
"Intended Audience :: Developers",
|
16
|
+
"License :: OSI Approved :: Apache Software License",
|
17
|
+
"Topic :: Multimedia :: Sound/Audio",
|
18
|
+
"Topic :: Multimedia :: Video",
|
19
|
+
"Topic :: Scientific/Engineering :: Artificial Intelligence",
|
20
|
+
"Programming Language :: Python :: 3",
|
21
|
+
"Programming Language :: Python :: 3.9",
|
22
|
+
"Programming Language :: Python :: 3.10",
|
23
|
+
"Programming Language :: Python :: 3 :: Only",
|
24
|
+
]
|
25
|
+
dependencies = ["livekit-agents>=1.0.0.dev5"]
|
26
|
+
|
27
|
+
[project.urls]
|
28
|
+
Documentation = "https://docs.livekit.io"
|
29
|
+
Website = "https://livekit.io/"
|
30
|
+
Source = "https://github.com/livekit/agents"
|
31
|
+
|
32
|
+
[tool.hatch.version]
|
33
|
+
path = "livekit/plugins/speechmatics/version.py"
|
34
|
+
|
35
|
+
[tool.hatch.build.targets.wheel]
|
36
|
+
packages = ["livekit"]
|
37
|
+
|
38
|
+
[tool.hatch.build.targets.sdist]
|
39
|
+
include = ["/livekit"]
|
@@ -1,66 +0,0 @@
|
|
1
|
-
Metadata-Version: 2.2
|
2
|
-
Name: livekit-plugins-speechmatics
|
3
|
-
Version: 0.0.2
|
4
|
-
Summary: Agent Framework plugin for Speechmatics
|
5
|
-
Home-page: https://github.com/livekit/agents
|
6
|
-
License: Apache-2.0
|
7
|
-
Project-URL: Documentation, https://docs.livekit.io
|
8
|
-
Project-URL: Website, https://livekit.io/
|
9
|
-
Project-URL: Source, https://github.com/livekit/agents
|
10
|
-
Keywords: webrtc,realtime,audio,video,livekit
|
11
|
-
Classifier: Intended Audience :: Developers
|
12
|
-
Classifier: License :: OSI Approved :: Apache Software License
|
13
|
-
Classifier: Topic :: Multimedia :: Sound/Audio
|
14
|
-
Classifier: Topic :: Multimedia :: Video
|
15
|
-
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
16
|
-
Classifier: Programming Language :: Python :: 3
|
17
|
-
Classifier: Programming Language :: Python :: 3.9
|
18
|
-
Classifier: Programming Language :: Python :: 3.10
|
19
|
-
Classifier: Programming Language :: Python :: 3 :: Only
|
20
|
-
Requires-Python: >=3.9.0
|
21
|
-
Description-Content-Type: text/markdown
|
22
|
-
Requires-Dist: livekit-agents<1.0.0,>=0.12.16
|
23
|
-
Dynamic: classifier
|
24
|
-
Dynamic: description
|
25
|
-
Dynamic: description-content-type
|
26
|
-
Dynamic: home-page
|
27
|
-
Dynamic: keywords
|
28
|
-
Dynamic: license
|
29
|
-
Dynamic: project-url
|
30
|
-
Dynamic: requires-dist
|
31
|
-
Dynamic: requires-python
|
32
|
-
Dynamic: summary
|
33
|
-
|
34
|
-
# LiveKit Plugins Speechmatics
|
35
|
-
|
36
|
-
Agent Framework plugin for Speechmatics.
|
37
|
-
|
38
|
-
## Installation
|
39
|
-
|
40
|
-
```bash
|
41
|
-
pip install livekit-plugins-speechmatics
|
42
|
-
```
|
43
|
-
|
44
|
-
Usage:
|
45
|
-
|
46
|
-
```python
|
47
|
-
agent = VoicePipelineAgent(
|
48
|
-
stt=speechmatics.STT(),
|
49
|
-
turn_detector=turn_detector.EOUModel(),
|
50
|
-
min_endpointing_delay=0.5,
|
51
|
-
max_endpointing_delay=5.0,
|
52
|
-
...
|
53
|
-
)
|
54
|
-
```
|
55
|
-
|
56
|
-
Note: The plugin was built with
|
57
|
-
LiveKit's [end-of-turn detection feature](https://github.com/livekit/agents#in-house-phrase-endpointing-model) in mind,
|
58
|
-
and it doesn't implement phrase endpointing. `AddTranscript` and `AddPartialTranscript` events are emitted as soon
|
59
|
-
as they’re received from the Speechmatics STT engine. For the best user experience,
|
60
|
-
we recommend running the agent with end-of-turn detection enabled (
|
61
|
-
see [example](https://github.com/livekit-examples/voice-pipeline-agent-python/blob/main/agent.py)).
|
62
|
-
|
63
|
-
## Pre-requisites
|
64
|
-
|
65
|
-
You'll need to specify a Speechmatics API Key. It can be set as environment variable `SPEECHMATICS_API_KEY` or
|
66
|
-
`.env.local` file.
|
@@ -1,14 +0,0 @@
|
|
1
|
-
README.md
|
2
|
-
setup.py
|
3
|
-
livekit/plugins/speechmatics/__init__.py
|
4
|
-
livekit/plugins/speechmatics/log.py
|
5
|
-
livekit/plugins/speechmatics/py.typed
|
6
|
-
livekit/plugins/speechmatics/stt.py
|
7
|
-
livekit/plugins/speechmatics/types.py
|
8
|
-
livekit/plugins/speechmatics/utils.py
|
9
|
-
livekit/plugins/speechmatics/version.py
|
10
|
-
livekit_plugins_speechmatics.egg-info/PKG-INFO
|
11
|
-
livekit_plugins_speechmatics.egg-info/SOURCES.txt
|
12
|
-
livekit_plugins_speechmatics.egg-info/dependency_links.txt
|
13
|
-
livekit_plugins_speechmatics.egg-info/requires.txt
|
14
|
-
livekit_plugins_speechmatics.egg-info/top_level.txt
|
livekit_plugins_speechmatics-0.0.2/livekit_plugins_speechmatics.egg-info/dependency_links.txt
DELETED
@@ -1 +0,0 @@
|
|
1
|
-
|
@@ -1 +0,0 @@
|
|
1
|
-
livekit-agents<1.0.0,>=0.12.16
|
@@ -1 +0,0 @@
|
|
1
|
-
livekit
|
@@ -1,58 +0,0 @@
|
|
1
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
2
|
-
# you may not use this file except in compliance with the License.
|
3
|
-
# You may obtain a copy of the License at
|
4
|
-
#
|
5
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
6
|
-
#
|
7
|
-
# Unless required by applicable law or agreed to in writing, software
|
8
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
9
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
10
|
-
# See the License for the specific language governing permissions and
|
11
|
-
# limitations under the License.
|
12
|
-
|
13
|
-
import os
|
14
|
-
import pathlib
|
15
|
-
|
16
|
-
import setuptools.command.build_py
|
17
|
-
|
18
|
-
here = pathlib.Path(__file__).parent.resolve()
|
19
|
-
about = {}
|
20
|
-
with open(
|
21
|
-
os.path.join(here, "livekit", "plugins", "speechmatics", "version.py"), "r"
|
22
|
-
) as f:
|
23
|
-
exec(f.read(), about)
|
24
|
-
|
25
|
-
|
26
|
-
setuptools.setup(
|
27
|
-
name="livekit-plugins-speechmatics",
|
28
|
-
version=about["__version__"],
|
29
|
-
description="Agent Framework plugin for Speechmatics",
|
30
|
-
long_description=(here / "README.md").read_text(encoding="utf-8"),
|
31
|
-
long_description_content_type="text/markdown",
|
32
|
-
url="https://github.com/livekit/agents",
|
33
|
-
cmdclass={},
|
34
|
-
classifiers=[
|
35
|
-
"Intended Audience :: Developers",
|
36
|
-
"License :: OSI Approved :: Apache Software License",
|
37
|
-
"Topic :: Multimedia :: Sound/Audio",
|
38
|
-
"Topic :: Multimedia :: Video",
|
39
|
-
"Topic :: Scientific/Engineering :: Artificial Intelligence",
|
40
|
-
"Programming Language :: Python :: 3",
|
41
|
-
"Programming Language :: Python :: 3.9",
|
42
|
-
"Programming Language :: Python :: 3.10",
|
43
|
-
"Programming Language :: Python :: 3 :: Only",
|
44
|
-
],
|
45
|
-
keywords=["webrtc", "realtime", "audio", "video", "livekit"],
|
46
|
-
license="Apache-2.0",
|
47
|
-
packages=setuptools.find_namespace_packages(include=["livekit.*"]),
|
48
|
-
python_requires=">=3.9.0",
|
49
|
-
install_requires=[
|
50
|
-
"livekit-agents>=0.12.16,<1.0.0",
|
51
|
-
],
|
52
|
-
package_data={},
|
53
|
-
project_urls={
|
54
|
-
"Documentation": "https://docs.livekit.io",
|
55
|
-
"Website": "https://livekit.io/",
|
56
|
-
"Source": "https://github.com/livekit/agents",
|
57
|
-
},
|
58
|
-
)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|