batchalign 0.7.3b9__tar.gz → 0.7.3b11__tar.gz
This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- {batchalign-0.7.3b9/batchalign.egg-info → batchalign-0.7.3b11}/PKG-INFO +1 -1
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/cli/dispatch.py +1 -1
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/document.py +3 -3
- batchalign-0.7.3b11/batchalign/version +3 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11/batchalign.egg-info}/PKG-INFO +1 -1
- batchalign-0.7.3b9/batchalign/version +0 -3
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/LICENSE +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/MANIFEST.in +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/README.md +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/__main__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/cli/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/cli/cli.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/constants.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/errors.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/base.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/file.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/generator.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/lexer.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/parser.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/chat/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/textgrid/file.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/resolve.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/speaker/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/speaker/config.yaml +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/speaker/infer.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/speaker/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/training/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/training/run.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/training/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/dataset.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/execute.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/infer.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/prep.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/utterance/train.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/whisper/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/whisper/infer_asr.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/analysis/eval.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/base.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/dispatch.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/morphosyntax/ud.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/pipeline.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/conftest.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/test_document.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/utils/__init__.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/utils/config.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/utils/dp.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/utils/utils.py +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign.egg-info/SOURCES.txt +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign.egg-info/dependency_links.txt +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign.egg-info/entry_points.txt +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign.egg-info/requires.txt +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign.egg-info/top_level.txt +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/setup.cfg +0 -0
- {batchalign-0.7.3b9 → batchalign-0.7.3b11}/setup.py +0 -0
@@ -88,7 +88,7 @@ def _dispatch(command, lang, num_speakers,
|
|
88
88
|
# HACK check for @Options:\tdummy in the file
|
89
89
|
# and simply copy it
|
90
90
|
if ext == "cha":
|
91
|
-
with open(inp_path, 'r') as df:
|
91
|
+
with open(inp_path, 'r', encoding="utf-8") as df:
|
92
92
|
data = df.read()
|
93
93
|
if "@Options:\tdummy" in data:
|
94
94
|
shutil.copy2(inp_path, str(repathed))
|
@@ -203,9 +203,9 @@ class Utterance(BaseModel):
|
|
203
203
|
t = re.sub(r"^\+\.\.\.", "", t.strip()).strip()
|
204
204
|
# this is here thrice to prevent stuff from not
|
205
205
|
# matching once because .sub seems to only match once
|
206
|
-
t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
207
|
-
t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
208
|
-
t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
206
|
+
# t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
207
|
+
# t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
208
|
+
# t = re.sub(r"^[^\w\d\s<]+", "", t.strip()).strip()
|
209
209
|
t = re.sub(r",", " , ", t.strip()).strip()
|
210
210
|
t = re.sub(r" +", " ", t.strip()).strip()
|
211
211
|
return t
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/support/filled_pauses.eng
RENAMED
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/pipelines/cleanup/support/replacements.eng
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_generator.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/chat/test_chat_parser.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/formats/textgrid/test_textgrid.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/asr/test_asr_pipeline.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/cleanup/test_disfluency.py
RENAMED
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/cleanup/test_parse_support.py
RENAMED
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/fa/test_fa_pipeline.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.3b9 → batchalign-0.7.3b11}/batchalign/tests/pipelines/test_pipeline_models.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|