BatchalignHK 0.7.18.post8__tar.gz → 0.7.18.post11__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/PKG-INFO +10 -31
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/requires.txt +1 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/PKG-INFO +10 -31
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/README.md +6 -29
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/resolve.py +1 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/wave2vec_fa.py +1 -1
- batchalignhk-0.7.18.post11/batchalign/version +3 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/setup.py +4 -0
- batchalignhk-0.7.18.post8/batchalign/version +0 -3
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/SOURCES.txt +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/dependency_links.txt +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/entry_points.txt +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/top_level.txt +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/LICENSE +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/MANIFEST.in +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/__main__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/cli.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/dispatch.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/constants.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/document.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/errors.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/base.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/file.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/generator.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/lexer.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/parser.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/file.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/config.yaml +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/infer.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/run.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/cantonese_infer.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/dataset.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/execute.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/infer.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/prep.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/train.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/infer_fa.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_asr.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/eval.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/num2chinese.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/tencent.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/base.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/dispatch.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/coref.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/ud.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/pipeline.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/gtrans.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/seamless.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/conftest.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/test_document.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/__init__.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/config.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/dp.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/utils.py +0 -0
- {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/setup.cfg +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: BatchalignHK
|
|
3
|
-
Version: 0.7.18.post8
|
|
3
|
+
Version: 0.7.18.post11
|
|
4
4
|
Summary: Python Speech Language Sample Analysis
|
|
5
5
|
Author: Brian MacWhinney, Houjun Liu
|
|
6
6
|
Author-email: macw@cmu.edu, houjun@cmu.edu
|
|
@@ -14,6 +14,7 @@ Requires-Dist: praatio<6.1.0,>=6.0.0
|
|
|
14
14
|
Requires-Dist: torch>=2.6.0
|
|
15
15
|
Requires-Dist: torchaudio
|
|
16
16
|
Requires-Dist: opencc-python-reimplemented
|
|
17
|
+
Requires-Dist: pydub
|
|
17
18
|
Requires-Dist: plotly>=5.3.0
|
|
18
19
|
Requires-Dist: transformers>=4.37
|
|
19
20
|
Requires-Dist: tokenizers>=0.14.1
|
|
@@ -44,6 +45,7 @@ Dynamic: author-email
|
|
|
44
45
|
Dynamic: classifier
|
|
45
46
|
Dynamic: description
|
|
46
47
|
Dynamic: description-content-type
|
|
48
|
+
Dynamic: license-file
|
|
47
49
|
Dynamic: provides-extra
|
|
48
50
|
Dynamic: requires-dist
|
|
49
51
|
Dynamic: summary
|
|
@@ -60,46 +62,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
|
60
62
|
|
|
61
63
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
|
62
64
|
|
|
63
|
-
### Get Python
|
|
64
|
-
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
|
65
|
-
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
|
66
|
-
- To install Python, follow the instructions...
|
|
67
|
-
- for macOS
|
|
68
|
-
1. Install Brew: [visit this link](https://brew.sh/)
|
|
69
|
-
2. Install Python and Pipx: execute `brew install python@3.11 pipx`
|
|
70
|
-
3. Copy the pipx path to yours: execute `pipx ensurepath`
|
|
71
|
-
- for Windows
|
|
72
|
-
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
|
73
|
-
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
|
74
|
-
- your distribution's instructions for Linux
|
|
75
|
-
|
|
76
|
-
For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
|
|
77
|
-
|
|
78
65
|
### Install and Update the Package
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
#### macOS
|
|
66
|
+
Batchalign is on PyPi (as `batchalign`). We recommend the use of UV to install Batchalign:
|
|
82
67
|
|
|
83
|
-
|
|
68
|
+
#### macOS / Linux
|
|
84
69
|
|
|
85
70
|
```
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
#### Linux
|
|
90
|
-
|
|
91
|
-
```
|
|
92
|
-
pip install -U batchalign
|
|
71
|
+
curl -LsSf https://astral.sh/uv/install.sh | sh
|
|
72
|
+
UV_PYTHON=3.11 uv tool install batchalign
|
|
93
73
|
```
|
|
94
74
|
|
|
95
75
|
#### Windows
|
|
96
76
|
|
|
97
77
|
```
|
|
98
|
-
|
|
78
|
+
powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
|
|
79
|
+
uv tool install batchalign
|
|
99
80
|
```
|
|
100
81
|
|
|
101
|
-
Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
|
|
102
|
-
|
|
103
82
|
### Rock and Roll
|
|
104
83
|
There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
|
|
105
84
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: BatchalignHK
|
|
3
|
-
Version: 0.7.18.post8
|
|
3
|
+
Version: 0.7.18.post11
|
|
4
4
|
Summary: Python Speech Language Sample Analysis
|
|
5
5
|
Author: Brian MacWhinney, Houjun Liu
|
|
6
6
|
Author-email: macw@cmu.edu, houjun@cmu.edu
|
|
@@ -14,6 +14,7 @@ Requires-Dist: praatio<6.1.0,>=6.0.0
|
|
|
14
14
|
Requires-Dist: torch>=2.6.0
|
|
15
15
|
Requires-Dist: torchaudio
|
|
16
16
|
Requires-Dist: opencc-python-reimplemented
|
|
17
|
+
Requires-Dist: pydub
|
|
17
18
|
Requires-Dist: plotly>=5.3.0
|
|
18
19
|
Requires-Dist: transformers>=4.37
|
|
19
20
|
Requires-Dist: tokenizers>=0.14.1
|
|
@@ -44,6 +45,7 @@ Dynamic: author-email
|
|
|
44
45
|
Dynamic: classifier
|
|
45
46
|
Dynamic: description
|
|
46
47
|
Dynamic: description-content-type
|
|
48
|
+
Dynamic: license-file
|
|
47
49
|
Dynamic: provides-extra
|
|
48
50
|
Dynamic: requires-dist
|
|
49
51
|
Dynamic: summary
|
|
@@ -60,46 +62,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
|
60
62
|
|
|
61
63
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
|
62
64
|
|
|
63
|
-
### Get Python
|
|
64
|
-
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
|
65
|
-
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
|
66
|
-
- To install Python, follow the instructions...
|
|
67
|
-
- for macOS
|
|
68
|
-
1. Install Brew: [visit this link](https://brew.sh/)
|
|
69
|
-
2. Install Python and Pipx: execute `brew install python@3.11 pipx`
|
|
70
|
-
3. Copy the pipx path to yours: execute `pipx ensurepath`
|
|
71
|
-
- for Windows
|
|
72
|
-
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
|
73
|
-
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
|
74
|
-
- your distribution's instructions for Linux
|
|
75
|
-
|
|
76
|
-
For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
|
|
77
|
-
|
|
78
65
|
### Install and Update the Package
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
#### macOS
|
|
66
|
+
Batchalign is on PyPi (as `batchalign`). We recommend the use of UV to install Batchalign:
|
|
82
67
|
|
|
83
|
-
|
|
68
|
+
#### macOS / Linux
|
|
84
69
|
|
|
85
70
|
```
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
#### Linux
|
|
90
|
-
|
|
91
|
-
```
|
|
92
|
-
pip install -U batchalign
|
|
71
|
+
curl -LsSf https://astral.sh/uv/install.sh | sh
|
|
72
|
+
UV_PYTHON=3.11 uv tool install batchalign
|
|
93
73
|
```
|
|
94
74
|
|
|
95
75
|
#### Windows
|
|
96
76
|
|
|
97
77
|
```
|
|
98
|
-
|
|
78
|
+
powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
|
|
79
|
+
uv tool install batchalign
|
|
99
80
|
```
|
|
100
81
|
|
|
101
|
-
Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
|
|
102
|
-
|
|
103
82
|
### Rock and Roll
|
|
104
83
|
There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
|
|
105
84
|
|
|
@@ -10,46 +10,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
|
10
10
|
|
|
11
11
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
|
12
12
|
|
|
13
|
-
### Get Python
|
|
14
|
-
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
|
15
|
-
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
|
16
|
-
- To install Python, follow the instructions...
|
|
17
|
-
- for macOS
|
|
18
|
-
1. Install Brew: [visit this link](https://brew.sh/)
|
|
19
|
-
2. Install Python and Pipx: execute `brew install python@3.11 pipx`
|
|
20
|
-
3. Copy the pipx path to yours: execute `pipx ensurepath`
|
|
21
|
-
- for Windows
|
|
22
|
-
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
|
23
|
-
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
|
24
|
-
- your distribution's instructions for Linux
|
|
25
|
-
|
|
26
|
-
For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
|
|
27
|
-
|
|
28
13
|
### Install and Update the Package
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
#### macOS
|
|
14
|
+
Batchalign is on PyPi (as `batchalign`). We recommend the use of UV to install Batchalign:
|
|
32
15
|
|
|
33
|
-
|
|
16
|
+
#### macOS / Linux
|
|
34
17
|
|
|
35
18
|
```
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
#### Linux
|
|
40
|
-
|
|
41
|
-
```
|
|
42
|
-
pip install -U batchalign
|
|
19
|
+
curl -LsSf https://astral.sh/uv/install.sh | sh
|
|
20
|
+
UV_PYTHON=3.11 uv tool install batchalign
|
|
43
21
|
```
|
|
44
22
|
|
|
45
23
|
#### Windows
|
|
46
24
|
|
|
47
25
|
```
|
|
48
|
-
|
|
26
|
+
powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
|
|
27
|
+
uv tool install batchalign
|
|
49
28
|
```
|
|
50
29
|
|
|
51
|
-
Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
|
|
52
|
-
|
|
53
30
|
### Rock and Roll
|
|
54
31
|
There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
|
|
55
32
|
|
|
@@ -13,6 +13,7 @@ resolver = {
|
|
|
13
13
|
"whisper": {
|
|
14
14
|
'eng': ("talkbank/CHATWhisper-en-large-v1", "openai/whisper-large-v2"),
|
|
15
15
|
'yue': ("alvanlii/whisper-small-cantonese", "alvanlii/whisper-small-cantonese"),
|
|
16
|
+
"heb": ("ivrit-ai/whisper-large-v3", "ivrit-ai/whisper-large-v3")
|
|
16
17
|
}
|
|
17
18
|
}
|
|
18
19
|
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/wave2vec_fa.py
RENAMED
|
@@ -80,7 +80,7 @@ class Wave2VecFAEngine(BatchalignEngine):
|
|
|
80
80
|
# breakpoint()
|
|
81
81
|
if (grp[-1][1][1] - grp[0][1][0]) < 20*1000:
|
|
82
82
|
res = self.__wav2vec(audio=f.chunk(grp[0][1][0], grp[-1][1][1]), text=transcript)
|
|
83
|
-
except
|
|
83
|
+
except:
|
|
84
84
|
# utterance contains nothing
|
|
85
85
|
continue
|
|
86
86
|
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/entry_points.txt
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/top_level.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/generator.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/file.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/generator.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/parser.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/config.yaml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/utils.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/dataset.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/execute.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/infer.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/prep.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/train.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/infer_fa.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_asr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_fa.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/eval.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/num2chinese.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/tencent.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisper.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisperx.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/cleanup.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/retrace.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/whisper_fa.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/coref.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/en/irr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/apm.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/ud.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/speaker/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/gtrans.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/seamless.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/utils.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/rev_utr.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/whisper_utr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utterance/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/fixures.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/test_pipeline.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|