batchalign 0.7.4__tar.gz → 0.7.5a2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {batchalign-0.7.4/batchalign.egg-info → batchalign-0.7.5a2}/PKG-INFO +5 -5
- {batchalign-0.7.4 → batchalign-0.7.5a2}/README.md +4 -4
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/cli/cli.py +18 -13
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/utils.py +1 -1
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/morphosyntax/ud.py +4 -2
- batchalign-0.7.5a2/batchalign/version +3 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2/batchalign.egg-info}/PKG-INFO +5 -5
- batchalign-0.7.4/batchalign/version +0 -3
- {batchalign-0.7.4 → batchalign-0.7.5a2}/LICENSE +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/MANIFEST.in +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/__main__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/cli/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/cli/dispatch.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/constants.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/document.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/errors.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/base.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/file.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/generator.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/lexer.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/chat/parser.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/textgrid/file.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/resolve.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/speaker/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/speaker/config.yaml +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/speaker/infer.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/speaker/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/training/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/training/run.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/training/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/dataset.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/execute.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/infer.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/prep.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/utterance/train.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/whisper/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/whisper/infer_asr.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/analysis/eval.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/base.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/dispatch.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/pipeline.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/conftest.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/test_document.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/utils/__init__.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/utils/config.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/utils/dp.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/utils/utils.py +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign.egg-info/SOURCES.txt +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign.egg-info/dependency_links.txt +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign.egg-info/entry_points.txt +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign.egg-info/requires.txt +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign.egg-info/top_level.txt +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/setup.cfg +0 -0
- {batchalign-0.7.4 → batchalign-0.7.5a2}/setup.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: batchalign
|
3
|
-
Version: 0.7.4
|
3
|
+
Version: 0.7.5a2
|
4
4
|
Summary: Python Speech Language Sample Analysis
|
5
5
|
Author: Brian MacWhinney, Houjun Liu
|
6
6
|
Author-email: macw@cmu.edu, houjun@cmu.edu
|
@@ -85,15 +85,15 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
85
85
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
86
86
|
|
87
87
|
### Get Python
|
88
|
-
- We support Python versions 3.9, 3.10, and 3.
|
89
|
-
-
|
88
|
+
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
89
|
+
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
90
90
|
- To install Python, follow the instructions...
|
91
91
|
- for macOS
|
92
92
|
1. Install Brew: [visit this link](https://brew.sh/)
|
93
93
|
2. Install Python: execute `brew install python@3.11`
|
94
94
|
- for Windows
|
95
95
|
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
96
|
-
2. If later commands report `pip module not found`, [this page may help](https://
|
96
|
+
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
97
97
|
- your distribution's instructions for Linux
|
98
98
|
|
99
99
|
### Install and Update the Package
|
@@ -156,7 +156,7 @@ batchalign morphotag ~/ba_input ~/ba_output
|
|
156
156
|
#### forced alignment
|
157
157
|
|
158
158
|
```
|
159
|
-
batchalign align
|
159
|
+
batchalign align ~/ba_input ~/ba_output
|
160
160
|
```
|
161
161
|
|
162
162
|
|
@@ -11,15 +11,15 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
11
11
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
12
12
|
|
13
13
|
### Get Python
|
14
|
-
- We support Python versions 3.9, 3.10, and 3.
|
15
|
-
-
|
14
|
+
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
15
|
+
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
16
16
|
- To install Python, follow the instructions...
|
17
17
|
- for macOS
|
18
18
|
1. Install Brew: [visit this link](https://brew.sh/)
|
19
19
|
2. Install Python: execute `brew install python@3.11`
|
20
20
|
- for Windows
|
21
21
|
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
22
|
-
2. If later commands report `pip module not found`, [this page may help](https://
|
22
|
+
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
23
23
|
- your distribution's instructions for Linux
|
24
24
|
|
25
25
|
### Install and Update the Package
|
@@ -82,7 +82,7 @@ batchalign morphotag ~/ba_input ~/ba_output
|
|
82
82
|
#### forced alignment
|
83
83
|
|
84
84
|
```
|
85
|
-
batchalign align
|
85
|
+
batchalign align ~/ba_input ~/ba_output
|
86
86
|
```
|
87
87
|
|
88
88
|
|
@@ -49,15 +49,7 @@ def common_options(f):
|
|
49
49
|
click.argument("in_dir",
|
50
50
|
type=click.Path(exists=True, file_okay=False)),
|
51
51
|
click.argument("out_dir",
|
52
|
-
type=click.Path(exists=True, file_okay=False)),
|
53
|
-
click.option("--lang",
|
54
|
-
help="sample language in three-letter ISO 3166-1 alpha-3 code",
|
55
|
-
show_default=True,
|
56
|
-
default="eng",
|
57
|
-
type=str),
|
58
|
-
click.option("-n", "--num_speakers", type=int,
|
59
|
-
help="number of speakers in the language sample", default=2),
|
60
|
-
|
52
|
+
type=click.Path(exists=True, file_okay=False))
|
61
53
|
]
|
62
54
|
|
63
55
|
options.reverse()
|
@@ -115,8 +107,9 @@ batchalign.add_command(train, "models")
|
|
115
107
|
@common_options
|
116
108
|
@click.option("--whisper/--rev",
|
117
109
|
default=False, help="For utterance timing recovery, OpenAI Whisper (ASR) instead of Rev.AI (default).")
|
110
|
+
|
118
111
|
@click.pass_context
|
119
|
-
def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
|
112
|
+
def align(ctx, in_dir, out_dir, whisper, **kwargs):
|
120
113
|
"""Align transcripts against corresponding media files."""
|
121
114
|
def loader(file):
|
122
115
|
return CHATFile(path=os.path.abspath(file)).doc
|
@@ -124,7 +117,7 @@ def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
|
|
124
117
|
def writer(doc, output):
|
125
118
|
CHATFile(doc=doc).write(output)
|
126
119
|
|
127
|
-
_dispatch("align",
|
120
|
+
_dispatch("align", "eng", 1,
|
128
121
|
["cha"], ctx,
|
129
122
|
in_dir, out_dir,
|
130
123
|
loader, writer, C,
|
@@ -143,6 +136,12 @@ def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
|
|
143
136
|
default=False, help="Perform speaker diarization (this flag is ignored with Rev.AI)")
|
144
137
|
@click.option("--wor/--nowor",
|
145
138
|
default=False, help="Should we write word level alignment line? Default to no.")
|
139
|
+
@click.option("--lang",
|
140
|
+
help="sample language in three-letter ISO 3166-1 alpha-3 code",
|
141
|
+
show_default=True,
|
142
|
+
default="eng",
|
143
|
+
type=str)
|
144
|
+
@click.option("-n", "--num_speakers", type=int, help="number of speakers in the language sample", default=2)
|
146
145
|
@click.pass_context
|
147
146
|
def transcribe(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
148
147
|
"""Create a transcript from audio files."""
|
@@ -189,7 +188,7 @@ def transcribe(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
|
189
188
|
file_okay=True, dir_okay=False),
|
190
189
|
help="Comma seperated manual lexicon override")
|
191
190
|
@click.pass_context
|
192
|
-
def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
191
|
+
def morphotag(ctx, in_dir, out_dir, **kwargs):
|
193
192
|
"""Perform morphosyntactic analysis on transcripts."""
|
194
193
|
|
195
194
|
def loader(file):
|
@@ -213,7 +212,7 @@ def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
|
213
212
|
def writer(doc, output):
|
214
213
|
CHATFile(doc=doc, special_mor_=doc.ba_special_.get("special_mor_notation", False)).write(output)
|
215
214
|
|
216
|
-
_dispatch("morphotag",
|
215
|
+
_dispatch("morphotag", "eng", 1, ["cha"], ctx,
|
217
216
|
in_dir, out_dir,
|
218
217
|
loader, writer, C)
|
219
218
|
|
@@ -222,6 +221,12 @@ def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
|
222
221
|
|
223
222
|
@batchalign.command()
|
224
223
|
@common_options
|
224
|
+
@click.option("--lang",
|
225
|
+
help="sample language in three-letter ISO 3166-1 alpha-3 code",
|
226
|
+
show_default=True,
|
227
|
+
default="eng",
|
228
|
+
type=str)
|
229
|
+
@click.option("-n", "--num_speakers", type=int, help="number of speakers in the language sample", default=2)
|
225
230
|
@click.pass_context
|
226
231
|
def utseg(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
|
227
232
|
"""Perform morphosyntactic analysis on transcripts."""
|
@@ -146,7 +146,7 @@ def annotation_clean(content, special=False):
|
|
146
146
|
cleaned_word = cleaned_word.replace("~","").replace("&~","")
|
147
147
|
cleaned_word = cleaned_word.replace(">","").replace("<","")
|
148
148
|
cleaned_word = cleaned_word.replace("〕","").replace("//","").replace(";","")
|
149
|
-
cleaned_word = re.sub(r"
|
149
|
+
cleaned_word = re.sub(r"@[^abcefpoqs]", '', cleaned_word)
|
150
150
|
cleaned_word = re.sub(r"&.", '', cleaned_word)
|
151
151
|
|
152
152
|
return cleaned_word
|
@@ -212,7 +212,7 @@ def handler__NOUN(word, lang=None):
|
|
212
212
|
def handler__PROPN(word, lang=None):
|
213
213
|
# code as noun
|
214
214
|
parsed = handler__NOUN(word)
|
215
|
-
return parsed.replace("
|
215
|
+
return parsed.replace("noun", "propn")
|
216
216
|
|
217
217
|
def handler__VERB(word, lang=None):
|
218
218
|
# get the features
|
@@ -635,7 +635,9 @@ def tokenizer_processor(tokenized, lang, sent):
|
|
635
635
|
before,after = conform(i).split("'")
|
636
636
|
res.append((f'{before}\'', False))
|
637
637
|
res.append((after, False))
|
638
|
-
elif ("en" in lang) and matches_in(i, "'"):
|
638
|
+
elif (("en" in lang) and matches_in(i, "'") and
|
639
|
+
not (len(conform(i).split("'")) > 1 and
|
640
|
+
conform(i).split("'")[0].strip() == "o")):
|
639
641
|
res.append((conform(i), True))
|
640
642
|
elif ("nl" in lang) and conform(i).endswith("'s"):
|
641
643
|
res.append((conform(i), False))
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: batchalign
|
3
|
-
Version: 0.7.4
|
3
|
+
Version: 0.7.5a2
|
4
4
|
Summary: Python Speech Language Sample Analysis
|
5
5
|
Author: Brian MacWhinney, Houjun Liu
|
6
6
|
Author-email: macw@cmu.edu, houjun@cmu.edu
|
@@ -85,15 +85,15 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
|
|
85
85
|
The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
|
86
86
|
|
87
87
|
### Get Python
|
88
|
-
- We support Python versions 3.9, 3.10, and 3.
|
89
|
-
-
|
88
|
+
- We support Python versions 3.9, 3.10, 3.11 and 3.12.
|
89
|
+
- First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
|
90
90
|
- To install Python, follow the instructions...
|
91
91
|
- for macOS
|
92
92
|
1. Install Brew: [visit this link](https://brew.sh/)
|
93
93
|
2. Install Python: execute `brew install python@3.11`
|
94
94
|
- for Windows
|
95
95
|
1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
|
96
|
-
2. If later commands report `pip module not found`, [this page may help](https://
|
96
|
+
2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
|
97
97
|
- your distribution's instructions for Linux
|
98
98
|
|
99
99
|
### Install and Update the Package
|
@@ -156,7 +156,7 @@ batchalign morphotag ~/ba_input ~/ba_output
|
|
156
156
|
#### forced alignment
|
157
157
|
|
158
158
|
```
|
159
|
-
batchalign align
|
159
|
+
batchalign align ~/ba_input ~/ba_output
|
160
160
|
```
|
161
161
|
|
162
162
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/support/filled_pauses.eng
RENAMED
File without changes
|
{batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/pipelines/cleanup/support/replacements.eng
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/formats/chat/test_chat_generator.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/cleanup/test_disfluency.py
RENAMED
File without changes
|
{batchalign-0.7.4 → batchalign-0.7.5a2}/batchalign/tests/pipelines/cleanup/test_parse_support.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|