voice-bird-cli 0.2.7__tar.gz → 0.3.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (29)
  1. voice_bird_cli-0.3.2/LICENSE +21 -0
  2. voice_bird_cli-0.3.2/PKG-INFO +134 -0
  3. voice_bird_cli-0.3.2/README.md +113 -0
  4. voice_bird_cli-0.3.2/pyproject.toml +37 -0
  5. voice_bird_cli-0.3.2/python/voice_bird_cli/__init__.py +4 -0
  6. voice_bird_cli-0.3.2/python/voice_bird_cli/__main__.py +36 -0
  7. voice_bird_cli-0.3.2/python/voice_bird_cli.egg-info/PKG-INFO +134 -0
  8. voice_bird_cli-0.3.2/python/voice_bird_cli.egg-info/SOURCES.txt +10 -0
  9. voice_bird_cli-0.3.2/python/voice_bird_cli.egg-info/dependency_links.txt +1 -0
  10. voice_bird_cli-0.3.2/python/voice_bird_cli.egg-info/entry_points.txt +2 -0
  11. voice_bird_cli-0.3.2/python/voice_bird_cli.egg-info/top_level.txt +1 -0
  12. voice_bird_cli-0.3.2/setup.cfg +4 -0
  13. voice_bird_cli-0.2.7/PKG-INFO +0 -74
  14. voice_bird_cli-0.2.7/pyproject.toml +0 -34
  15. voice_bird_cli-0.2.7/python/voice_bird_cli/__init__.py +0 -1
  16. voice_bird_cli-0.2.7/python/voice_bird_cli/__main__.py +0 -50
  17. voice_bird_cli-0.2.7/voice-bird-cli/Cargo.lock +0 -2673
  18. voice_bird_cli-0.2.7/voice-bird-cli/Cargo.toml +0 -58
  19. voice_bird_cli-0.2.7/voice-bird-cli/README.md +0 -53
  20. voice_bird_cli-0.2.7/voice-bird-cli/src/app.rs +0 -226
  21. voice_bird_cli-0.2.7/voice-bird-cli/src/audio.rs +0 -223
  22. voice_bird_cli-0.2.7/voice-bird-cli/src/config.rs +0 -56
  23. voice_bird_cli-0.2.7/voice-bird-cli/src/logger.rs +0 -47
  24. voice_bird_cli-0.2.7/voice-bird-cli/src/main.rs +0 -315
  25. voice_bird_cli-0.2.7/voice-bird-cli/src/platform/macos.rs +0 -289
  26. voice_bird_cli-0.2.7/voice-bird-cli/src/platform/mod.rs +0 -71
  27. voice_bird_cli-0.2.7/voice-bird-cli/src/platform/windows.rs +0 -380
  28. voice_bird_cli-0.2.7/voice-bird-cli/src/streaming.rs +0 -243
  29. voice_bird_cli-0.2.7/voice-bird-cli/src/ui.rs +0 -327
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2026 Voice Bird contributors
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
@@ -0,0 +1,134 @@
1
+ Metadata-Version: 2.4
2
+ Name: voice-bird-cli
3
+ Version: 0.3.2
4
+ Summary: Voice Bird CLI - local-first voice transcription TUI
5
+ Author: Voice Bird contributors
6
+ License-Expression: MIT
7
+ Project-URL: Homepage, https://github.com/voice-bird/voice-bird-cli
8
+ Project-URL: Repository, https://github.com/voice-bird/voice-bird-cli
9
+ Project-URL: Issues, https://github.com/voice-bird/voice-bird-cli/issues
10
+ Keywords: voice,transcription,whisper,cli,tui
11
+ Classifier: Development Status :: 4 - Beta
12
+ Classifier: Environment :: Console
13
+ Classifier: Intended Audience :: End Users/Desktop
14
+ Classifier: Programming Language :: Rust
15
+ Classifier: Programming Language :: Python :: 3
16
+ Classifier: Topic :: Multimedia :: Sound/Audio :: Speech
17
+ Requires-Python: >=3.9
18
+ Description-Content-Type: text/markdown
19
+ License-File: LICENSE
20
+ Dynamic: license-file
21
+
22
+ # Voice Bird CLI
23
+
24
+ Voice Bird CLI is a terminal voice transcription app. It runs **locally by default** with Whisper models, so local recordings stay on your machine. When you want hosted transcription, you can opt in per source to VoiceBird Web cloud mode.
25
+
26
+ ![Voice Bird CLI basic flow](docs/assets/basic-flow.svg)
27
+
28
+ ## Basic Flow
29
+
30
+ 1. Pick a microphone, system-output loopback device, or app audio source.
31
+ 2. Choose local or cloud mode for that source.
32
+ 3. Press `Enter` to start a transcription slot.
33
+ 4. Watch committed and tentative transcript text stream into the TUI.
34
+ 5. In local mode, review session files under `~/voice-bird/sessions/<timestamp>-<source>/`.
35
+
36
+ Local sessions contain:
37
+
38
+ | File | Content |
39
+ | --- | --- |
40
+ | `audio.wav` | 16 kHz mono recording |
41
+ | `transcript.jsonl` | Append-only transcript log, useful after crashes |
42
+ | `transcript.json` | Finalized transcript segments and metadata |
43
+ | `transcript.txt` | Plain-text transcript |
44
+ | `meta.json` | Device, source, model, engine, and duration |
45
+
46
+ ## Getting Started
47
+
48
+ Install one of the CLI packages, then run:
49
+
50
+ ```bash
51
+ voice-bird-cli
52
+ ```
53
+
54
+ On first launch, Voice Bird picks a local Whisper model and downloads it into your OS cache directory. The default model is `distil-small.en`. Settings are stored in `~/.config/voice-bird/config.toml` on Linux/macOS and `%APPDATA%\voice-bird\config.toml` on Windows.
55
+
56
+ Press `m` to change models. The picker includes `nemotron-3.5-asr-streaming-0.6b`, NVIDIA's latest Nemotron 3.5 ASR streaming model via the local `parakeet-rs` engine. Select it, let the package download/unpack, then start recording; the engine label and `meta.json` should show `nemotron`.
57
+
58
+ macOS users may need to grant Screen Recording permission for system or app audio capture. Apple Silicon users can optionally build the WhisperKit sidecar for ANE-accelerated local inference:
59
+
60
+ ```bash
61
+ cargo run -p xtask -- build-sidecar
62
+ ```
63
+
64
+ Without the sidecar, Voice Bird falls back to `whisper-rs` with whisper.cpp.
65
+
66
+ ## Install
67
+
68
+ Cargo installs the native Rust binary directly:
69
+
70
+ ```bash
71
+ cargo install voice-bird-cli
72
+ ```
73
+
74
+ PyPI installs a small wrapper that installs/runs the Cargo binary:
75
+
76
+ ```bash
77
+ pipx install voice-bird-cli
78
+ # or
79
+ pip install voice-bird-cli
80
+ ```
81
+
82
+ npm installs a small wrapper that installs/runs the Cargo binary:
83
+
84
+ ```bash
85
+ npm install -g voice-bird-cli
86
+ ```
87
+
88
+ From source:
89
+
90
+ ```bash
91
+ git clone https://github.com/voice-bird/voice-bird-cli.git
92
+ cd voice-bird-cli
93
+ cargo install --path .
94
+ ```
95
+
96
+ The npm and PyPI packages require Rust Cargo on the machine. Use the Cargo or source install when you want the simplest path.
97
+
98
+ ## Local And Cloud Modes
99
+
100
+ **Free local mode** is the default. It uses local Whisper inference through `whisper-rs`, or WhisperKit on macOS when the sidecar is available. Local mode does not send audio to a server and writes session artifacts to disk. Current local models are English-focused in the app flow.
101
+
102
+ **Cloud mode** streams audio to VoiceBird Web at `wss://voicebird.app/api/audio/stream`. It is opt-in, requires a Voice Bird API key, and is useful when local hardware cannot keep up or when you want cloud language support. Cloud recordings live in your VoiceBird Web account instead of the local sessions folder.
103
+
104
+ Your Voice Bird API key is stored in plaintext in `config.toml`; on Unix the app sets the file to `0600` best-effort.
105
+
106
+ ## Usage
107
+
108
+ ```bash
109
+ voice-bird-cli # start the TUI
110
+ voice-bird-cli --recover <session-dir> # rebuild transcript.{json,txt} after a crash
111
+ ```
112
+
113
+ ## Keys
114
+
115
+ | Key | Action |
116
+ | --- | --- |
117
+ | `↑` / `↓` | Select device or app |
118
+ | `←` / `→` | Move between panes |
119
+ | `Enter` | Start the selected source |
120
+ | `Space` | Clear selected app pairing |
121
+ | `Tab` | Move between transcript slots |
122
+ | `r` | Refresh devices and apps |
123
+ | `c` | Toggle cloud mode for the focused source |
124
+ | `l` | Change language for cloud mode |
125
+ | `m` | Change model |
126
+ | `e` | Export the latest local transcript |
127
+ | `p` | Change local session path |
128
+ | `x` | Clear stopped transcript slot |
129
+ | `q` | Quit |
130
+ | `?` | Help |
131
+
132
+ ## License
133
+
134
+ MIT
@@ -0,0 +1,113 @@
1
+ # Voice Bird CLI
2
+
3
+ Voice Bird CLI is a terminal voice transcription app. It runs **locally by default** with Whisper models, so local recordings stay on your machine. When you want hosted transcription, you can opt in per source to VoiceBird Web cloud mode.
4
+
5
+ ![Voice Bird CLI basic flow](docs/assets/basic-flow.svg)
6
+
7
+ ## Basic Flow
8
+
9
+ 1. Pick a microphone, system-output loopback device, or app audio source.
10
+ 2. Choose local or cloud mode for that source.
11
+ 3. Press `Enter` to start a transcription slot.
12
+ 4. Watch committed and tentative transcript text stream into the TUI.
13
+ 5. In local mode, review session files under `~/voice-bird/sessions/<timestamp>-<source>/`.
14
+
15
+ Local sessions contain:
16
+
17
+ | File | Content |
18
+ | --- | --- |
19
+ | `audio.wav` | 16 kHz mono recording |
20
+ | `transcript.jsonl` | Append-only transcript log, useful after crashes |
21
+ | `transcript.json` | Finalized transcript segments and metadata |
22
+ | `transcript.txt` | Plain-text transcript |
23
+ | `meta.json` | Device, source, model, engine, and duration |
24
+
25
+ ## Getting Started
26
+
27
+ Install one of the CLI packages, then run:
28
+
29
+ ```bash
30
+ voice-bird-cli
31
+ ```
32
+
33
+ On first launch, Voice Bird picks a local Whisper model and downloads it into your OS cache directory. The default model is `distil-small.en`. Settings are stored in `~/.config/voice-bird/config.toml` on Linux/macOS and `%APPDATA%\voice-bird\config.toml` on Windows.
34
+
35
+ Press `m` to change models. The picker includes `nemotron-3.5-asr-streaming-0.6b`, NVIDIA's latest Nemotron 3.5 ASR streaming model via the local `parakeet-rs` engine. Select it, let the package download/unpack, then start recording; the engine label and `meta.json` should show `nemotron`.
36
+
37
+ macOS users may need to grant Screen Recording permission for system or app audio capture. Apple Silicon users can optionally build the WhisperKit sidecar for ANE-accelerated local inference:
38
+
39
+ ```bash
40
+ cargo run -p xtask -- build-sidecar
41
+ ```
42
+
43
+ Without the sidecar, Voice Bird falls back to `whisper-rs` with whisper.cpp.
44
+
45
+ ## Install
46
+
47
+ Cargo installs the native Rust binary directly:
48
+
49
+ ```bash
50
+ cargo install voice-bird-cli
51
+ ```
52
+
53
+ PyPI installs a small wrapper that installs/runs the Cargo binary:
54
+
55
+ ```bash
56
+ pipx install voice-bird-cli
57
+ # or
58
+ pip install voice-bird-cli
59
+ ```
60
+
61
+ npm installs a small wrapper that installs/runs the Cargo binary:
62
+
63
+ ```bash
64
+ npm install -g voice-bird-cli
65
+ ```
66
+
67
+ From source:
68
+
69
+ ```bash
70
+ git clone https://github.com/voice-bird/voice-bird-cli.git
71
+ cd voice-bird-cli
72
+ cargo install --path .
73
+ ```
74
+
75
+ The npm and PyPI packages require Rust Cargo on the machine. Use the Cargo or source install when you want the simplest path.
76
+
77
+ ## Local And Cloud Modes
78
+
79
+ **Free local mode** is the default. It uses local Whisper inference through `whisper-rs`, or WhisperKit on macOS when the sidecar is available. Local mode does not send audio to a server and writes session artifacts to disk. Current local models are English-focused in the app flow.
80
+
81
+ **Cloud mode** streams audio to VoiceBird Web at `wss://voicebird.app/api/audio/stream`. It is opt-in, requires a Voice Bird API key, and is useful when local hardware cannot keep up or when you want cloud language support. Cloud recordings live in your VoiceBird Web account instead of the local sessions folder.
82
+
83
+ Your Voice Bird API key is stored in plaintext in `config.toml`; on Unix the app sets the file to `0600` best-effort.
84
+
85
+ ## Usage
86
+
87
+ ```bash
88
+ voice-bird-cli # start the TUI
89
+ voice-bird-cli --recover <session-dir> # rebuild transcript.{json,txt} after a crash
90
+ ```
91
+
92
+ ## Keys
93
+
94
+ | Key | Action |
95
+ | --- | --- |
96
+ | `↑` / `↓` | Select device or app |
97
+ | `←` / `→` | Move between panes |
98
+ | `Enter` | Start the selected source |
99
+ | `Space` | Clear selected app pairing |
100
+ | `Tab` | Move between transcript slots |
101
+ | `r` | Refresh devices and apps |
102
+ | `c` | Toggle cloud mode for the focused source |
103
+ | `l` | Change language for cloud mode |
104
+ | `m` | Change model |
105
+ | `e` | Export the latest local transcript |
106
+ | `p` | Change local session path |
107
+ | `x` | Clear stopped transcript slot |
108
+ | `q` | Quit |
109
+ | `?` | Help |
110
+
111
+ ## License
112
+
113
+ MIT
@@ -0,0 +1,37 @@
1
+ [build-system]
2
+ requires = ["setuptools>=68", "wheel"]
3
+ build-backend = "setuptools.build_meta"
4
+
5
+ [project]
6
+ name = "voice-bird-cli"
7
+ version = "0.3.2"
8
+ description = "Voice Bird CLI - local-first voice transcription TUI"
9
+ readme = "README.md"
10
+ license = "MIT"
11
+ requires-python = ">=3.9"
12
+ authors = [
13
+ { name = "Voice Bird contributors" }
14
+ ]
15
+ keywords = ["voice", "transcription", "whisper", "cli", "tui"]
16
+ classifiers = [
17
+ "Development Status :: 4 - Beta",
18
+ "Environment :: Console",
19
+ "Intended Audience :: End Users/Desktop",
20
+ "Programming Language :: Rust",
21
+ "Programming Language :: Python :: 3",
22
+ "Topic :: Multimedia :: Sound/Audio :: Speech"
23
+ ]
24
+
25
+ [project.urls]
26
+ Homepage = "https://github.com/voice-bird/voice-bird-cli"
27
+ Repository = "https://github.com/voice-bird/voice-bird-cli"
28
+ Issues = "https://github.com/voice-bird/voice-bird-cli/issues"
29
+
30
+ [project.scripts]
31
+ voice-bird-cli = "voice_bird_cli.__main__:main"
32
+
33
+ [tool.setuptools]
34
+ package-dir = {"" = "python"}
35
+
36
+ [tool.setuptools.packages.find]
37
+ where = ["python"]
@@ -0,0 +1,4 @@
1
+ """Python wrapper for the Voice Bird CLI Rust binary."""
2
+
3
+ __all__ = ["__version__"]
4
+ __version__ = "0.3.2"
@@ -0,0 +1,36 @@
1
+ from __future__ import annotations
2
+
3
+ import os
4
+ import subprocess
5
+ import sys
6
+ from pathlib import Path
7
+
8
+
9
+ def _cargo_bin() -> Path:
10
+ name = "voice-bird-cli.exe" if os.name == "nt" else "voice-bird-cli"
11
+ return Path.home() / ".cargo" / "bin" / name
12
+
13
+
14
+ def main() -> int:
15
+ exe = _cargo_bin()
16
+ if not exe.exists():
17
+ try:
18
+ subprocess.run(
19
+ ["cargo", "install", "voice-bird-cli", "--locked"],
20
+ check=True,
21
+ )
22
+ except FileNotFoundError:
23
+ print(
24
+ "voice-bird-cli PyPI package requires Rust Cargo. "
25
+ "Install Rust from https://rustup.rs/ and run this command again.",
26
+ file=sys.stderr,
27
+ )
28
+ return 1
29
+ except subprocess.CalledProcessError as exc:
30
+ return exc.returncode
31
+
32
+ return subprocess.run([str(exe), *sys.argv[1:]]).returncode
33
+
34
+
35
+ if __name__ == "__main__":
36
+ raise SystemExit(main())
@@ -0,0 +1,134 @@
1
+ Metadata-Version: 2.4
2
+ Name: voice-bird-cli
3
+ Version: 0.3.2
4
+ Summary: Voice Bird CLI - local-first voice transcription TUI
5
+ Author: Voice Bird contributors
6
+ License-Expression: MIT
7
+ Project-URL: Homepage, https://github.com/voice-bird/voice-bird-cli
8
+ Project-URL: Repository, https://github.com/voice-bird/voice-bird-cli
9
+ Project-URL: Issues, https://github.com/voice-bird/voice-bird-cli/issues
10
+ Keywords: voice,transcription,whisper,cli,tui
11
+ Classifier: Development Status :: 4 - Beta
12
+ Classifier: Environment :: Console
13
+ Classifier: Intended Audience :: End Users/Desktop
14
+ Classifier: Programming Language :: Rust
15
+ Classifier: Programming Language :: Python :: 3
16
+ Classifier: Topic :: Multimedia :: Sound/Audio :: Speech
17
+ Requires-Python: >=3.9
18
+ Description-Content-Type: text/markdown
19
+ License-File: LICENSE
20
+ Dynamic: license-file
21
+
22
+ # Voice Bird CLI
23
+
24
+ Voice Bird CLI is a terminal voice transcription app. It runs **locally by default** with Whisper models, so local recordings stay on your machine. When you want hosted transcription, you can opt in per source to VoiceBird Web cloud mode.
25
+
26
+ ![Voice Bird CLI basic flow](docs/assets/basic-flow.svg)
27
+
28
+ ## Basic Flow
29
+
30
+ 1. Pick a microphone, system-output loopback device, or app audio source.
31
+ 2. Choose local or cloud mode for that source.
32
+ 3. Press `Enter` to start a transcription slot.
33
+ 4. Watch committed and tentative transcript text stream into the TUI.
34
+ 5. In local mode, review session files under `~/voice-bird/sessions/<timestamp>-<source>/`.
35
+
36
+ Local sessions contain:
37
+
38
+ | File | Content |
39
+ | --- | --- |
40
+ | `audio.wav` | 16 kHz mono recording |
41
+ | `transcript.jsonl` | Append-only transcript log, useful after crashes |
42
+ | `transcript.json` | Finalized transcript segments and metadata |
43
+ | `transcript.txt` | Plain-text transcript |
44
+ | `meta.json` | Device, source, model, engine, and duration |
45
+
46
+ ## Getting Started
47
+
48
+ Install one of the CLI packages, then run:
49
+
50
+ ```bash
51
+ voice-bird-cli
52
+ ```
53
+
54
+ On first launch, Voice Bird picks a local Whisper model and downloads it into your OS cache directory. The default model is `distil-small.en`. Settings are stored in `~/.config/voice-bird/config.toml` on Linux/macOS and `%APPDATA%\voice-bird\config.toml` on Windows.
55
+
56
+ Press `m` to change models. The picker includes `nemotron-3.5-asr-streaming-0.6b`, NVIDIA's latest Nemotron 3.5 ASR streaming model via the local `parakeet-rs` engine. Select it, let the package download/unpack, then start recording; the engine label and `meta.json` should show `nemotron`.
57
+
58
+ macOS users may need to grant Screen Recording permission for system or app audio capture. Apple Silicon users can optionally build the WhisperKit sidecar for ANE-accelerated local inference:
59
+
60
+ ```bash
61
+ cargo run -p xtask -- build-sidecar
62
+ ```
63
+
64
+ Without the sidecar, Voice Bird falls back to `whisper-rs` with whisper.cpp.
65
+
66
+ ## Install
67
+
68
+ Cargo installs the native Rust binary directly:
69
+
70
+ ```bash
71
+ cargo install voice-bird-cli
72
+ ```
73
+
74
+ PyPI installs a small wrapper that installs/runs the Cargo binary:
75
+
76
+ ```bash
77
+ pipx install voice-bird-cli
78
+ # or
79
+ pip install voice-bird-cli
80
+ ```
81
+
82
+ npm installs a small wrapper that installs/runs the Cargo binary:
83
+
84
+ ```bash
85
+ npm install -g voice-bird-cli
86
+ ```
87
+
88
+ From source:
89
+
90
+ ```bash
91
+ git clone https://github.com/voice-bird/voice-bird-cli.git
92
+ cd voice-bird-cli
93
+ cargo install --path .
94
+ ```
95
+
96
+ The npm and PyPI packages require Rust Cargo on the machine. Use the Cargo or source install when you want the simplest path.
97
+
98
+ ## Local And Cloud Modes
99
+
100
+ **Free local mode** is the default. It uses local Whisper inference through `whisper-rs`, or WhisperKit on macOS when the sidecar is available. Local mode does not send audio to a server and writes session artifacts to disk. Current local models are English-focused in the app flow.
101
+
102
+ **Cloud mode** streams audio to VoiceBird Web at `wss://voicebird.app/api/audio/stream`. It is opt-in, requires a Voice Bird API key, and is useful when local hardware cannot keep up or when you want cloud language support. Cloud recordings live in your VoiceBird Web account instead of the local sessions folder.
103
+
104
+ Your Voice Bird API key is stored in plaintext in `config.toml`; on Unix the app sets the file to `0600` best-effort.
105
+
106
+ ## Usage
107
+
108
+ ```bash
109
+ voice-bird-cli # start the TUI
110
+ voice-bird-cli --recover <session-dir> # rebuild transcript.{json,txt} after a crash
111
+ ```
112
+
113
+ ## Keys
114
+
115
+ | Key | Action |
116
+ | --- | --- |
117
+ | `↑` / `↓` | Select device or app |
118
+ | `←` / `→` | Move between panes |
119
+ | `Enter` | Start the selected source |
120
+ | `Space` | Clear selected app pairing |
121
+ | `Tab` | Move between transcript slots |
122
+ | `r` | Refresh devices and apps |
123
+ | `c` | Toggle cloud mode for the focused source |
124
+ | `l` | Change language for cloud mode |
125
+ | `m` | Change model |
126
+ | `e` | Export the latest local transcript |
127
+ | `p` | Change local session path |
128
+ | `x` | Clear stopped transcript slot |
129
+ | `q` | Quit |
130
+ | `?` | Help |
131
+
132
+ ## License
133
+
134
+ MIT
@@ -0,0 +1,10 @@
1
+ LICENSE
2
+ README.md
3
+ pyproject.toml
4
+ python/voice_bird_cli/__init__.py
5
+ python/voice_bird_cli/__main__.py
6
+ python/voice_bird_cli.egg-info/PKG-INFO
7
+ python/voice_bird_cli.egg-info/SOURCES.txt
8
+ python/voice_bird_cli.egg-info/dependency_links.txt
9
+ python/voice_bird_cli.egg-info/entry_points.txt
10
+ python/voice_bird_cli.egg-info/top_level.txt
@@ -0,0 +1,2 @@
1
+ [console_scripts]
2
+ voice-bird-cli = voice_bird_cli.__main__:main
@@ -0,0 +1,4 @@
1
+ [egg_info]
2
+ tag_build =
3
+ tag_date = 0
4
+
@@ -1,74 +0,0 @@
1
- Metadata-Version: 2.4
2
- Name: voice-bird-cli
3
- Version: 0.2.7
4
- Classifier: Development Status :: 3 - Alpha
5
- Classifier: Environment :: Console
6
- Classifier: Intended Audience :: Developers
7
- Classifier: License :: OSI Approved :: MIT License
8
- Classifier: Operating System :: OS Independent
9
- Classifier: Programming Language :: Python :: 3
10
- Classifier: Programming Language :: Rust
11
- Classifier: Topic :: Multimedia :: Sound/Audio
12
- Summary: Voice Bird CLI - Terminal audio streaming for voice transcription
13
- Keywords: audio,streaming,transcription,voice,cli,tui
14
- Author: Dzmitry Rekun
15
- License: MIT
16
- Requires-Python: >=3.8
17
- Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
18
- Project-URL: Homepage, https://voicebird.app
19
- Project-URL: Repository, https://github.com/RekunDzmitry/voice-bird-releases
20
-
21
- # Voice Bird CLI
22
-
23
- Terminal-based audio streaming for voice transcription.
24
-
25
- ## Installation
26
-
27
- ### Using cargo-binstall (Recommended)
28
-
29
- ```bash
30
- # Install cargo-binstall if you don't have it
31
- cargo install cargo-binstall
32
-
33
- # Install Voice Bird CLI
34
- cargo binstall voice-bird-cli
35
- ```
36
-
37
- ### Manual Download
38
-
39
- Download pre-built binaries from [GitHub Releases](https://github.com/RekunDzmitry/voice-bird-releases/releases).
40
-
41
- ## Features
42
-
43
- - Enumerate audio devices and running applications
44
- - Capture per-application audio (Windows/macOS)
45
- - Stream audio to Voice Bird server for transcription
46
- - Real-time audio level visualization
47
- - Interactive TUI interface
48
-
49
- ## Usage
50
-
51
- ```bash
52
- # Run the CLI
53
- voice-bird-cli
54
- ```
55
-
56
- ### Controls
57
-
58
- - `↑/↓` - Navigate device list
59
- - `Space` - Select/deselect audio source
60
- - `Enter` - Start/stop streaming
61
- - `c` - Configure API key
62
- - `r` - Refresh device list
63
- - `q` - Quit
64
- - `?` - Help
65
-
66
- ## Requirements
67
-
68
- - Windows 10 Build 20348+ or macOS 12+
69
- - Voice Bird API key (get one at https://voicebird.app)
70
-
71
- ## License
72
-
73
- Proprietary - See LICENSE file for details.
74
-
@@ -1,34 +0,0 @@
1
- [build-system]
2
- requires = ["maturin>=1.9,<2.0"]
3
- build-backend = "maturin"
4
-
5
- [project]
6
- name = "voice-bird-cli"
7
- version = "0.2.7"
8
- description = "Voice Bird CLI - Terminal audio streaming for voice transcription"
9
- authors = [{ name = "Dzmitry Rekun" }]
10
- readme = "voice-bird-cli/README.md"
11
- requires-python = ">=3.8"
12
- license = { text = "MIT" }
13
- keywords = ["audio", "streaming", "transcription", "voice", "cli", "tui"]
14
- classifiers = [
15
- "Development Status :: 3 - Alpha",
16
- "Environment :: Console",
17
- "Intended Audience :: Developers",
18
- "License :: OSI Approved :: MIT License",
19
- "Operating System :: OS Independent",
20
- "Programming Language :: Python :: 3",
21
- "Programming Language :: Rust",
22
- "Topic :: Multimedia :: Sound/Audio",
23
- ]
24
-
25
- [project.urls]
26
- Homepage = "https://voicebird.app"
27
- Repository = "https://github.com/RekunDzmitry/voice-bird-releases"
28
-
29
- [tool.maturin]
30
- bindings = "bin"
31
- manifest-path = "voice-bird-cli/Cargo.toml"
32
- module-name = "voice_bird_cli"
33
- python-source = "python"
34
- strip = true
@@ -1 +0,0 @@
1
- """Voice Bird CLI - Terminal audio streaming for voice transcription."""
@@ -1,50 +0,0 @@
1
- from __future__ import annotations
2
-
3
- import os
4
- import sys
5
- import sysconfig
6
-
7
-
8
- def find_voice_bird_cli() -> str:
9
- """Return the voice-bird-cli binary path."""
10
- exe = "voice-bird-cli" + (sysconfig.get_config_var("EXE") or "")
11
-
12
- scripts_path = os.path.join(sysconfig.get_path("scripts"), exe)
13
- if os.path.isfile(scripts_path):
14
- return scripts_path
15
-
16
- if sys.version_info >= (3, 10):
17
- user_scheme = sysconfig.get_preferred_scheme("user")
18
- elif os.name == "nt":
19
- user_scheme = "nt_user"
20
- elif sys.platform == "darwin" and sys._framework:
21
- user_scheme = "osx_framework_user"
22
- else:
23
- user_scheme = "posix_user"
24
-
25
- user_path = os.path.join(sysconfig.get_path("scripts", scheme=user_scheme), exe)
26
- if os.path.isfile(user_path):
27
- return user_path
28
-
29
- pkg_root = os.path.dirname(os.path.dirname(__file__))
30
- target_path = os.path.join(pkg_root, "bin", exe)
31
- if os.path.isfile(target_path):
32
- return target_path
33
-
34
- raise FileNotFoundError(
35
- f"Could not find {exe}. Searched:\n"
36
- f" {scripts_path}\n"
37
- f" {user_path}\n"
38
- f" {target_path}"
39
- )
40
-
41
-
42
- if __name__ == "__main__":
43
- bin_path = find_voice_bird_cli()
44
- if sys.platform == "win32":
45
- import subprocess
46
-
47
- completed_process = subprocess.run([bin_path, *sys.argv[1:]])
48
- sys.exit(completed_process.returncode)
49
- else:
50
- os.execvp(bin_path, [bin_path, *sys.argv[1:]])