batchalign 0.7.9.post3__tar.gz → 0.7.10__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {batchalign-0.7.9.post3/batchalign.egg-info → batchalign-0.7.10}/PKG-INFO +1 -1
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/generator.py +29 -1
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utterance/ud_utterance.py +2 -0
- batchalign-0.7.10/batchalign/version +3 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10/batchalign.egg-info}/PKG-INFO +1 -1
- batchalign-0.7.9.post3/batchalign/version +0 -3
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/LICENSE +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/MANIFEST.in +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/README.md +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/__main__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/cli.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/dispatch.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/constants.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/document.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/errors.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/base.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/file.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/lexer.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/parser.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/file.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/resolve.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/config.yaml +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/infer.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/run.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/dataset.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/execute.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/infer.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/prep.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/train.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/infer_asr.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/analysis/eval.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/base.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/dispatch.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/coref.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/ud.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/pipeline.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/conftest.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/test_document.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/__init__.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/config.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/dp.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/utils.py +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/SOURCES.txt +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/dependency_links.txt +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/entry_points.txt +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/requires.txt +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/top_level.txt +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/setup.cfg +0 -0
- {batchalign-0.7.9.post3 → batchalign-0.7.10}/setup.py +0 -0
@@ -1,5 +1,6 @@
|
|
1
1
|
from batchalign.document import *
|
2
2
|
from batchalign.constants import *
|
3
|
+
import numbers
|
3
4
|
|
4
5
|
import warnings
|
5
6
|
|
@@ -104,6 +105,32 @@ def generate_chat_utterance(utterance: Utterance, special_mor=False, write_wor=T
|
|
104
105
|
|
105
106
|
return "\n".join(result)
|
106
107
|
|
108
|
+
def check_utterances_ordered(doc):
    """Check whether the aligned utterances of a document are in time order.

    Walks ``doc.content`` in order and looks at every ``Utterance`` that has
    a truthy ``alignment``. The document is considered ordered when each
    such utterance ends no earlier than it starts, and starts no earlier
    than the previous aligned utterance ended.

    Parameters
    ----------
    doc : Document
        The CHAT document to check.

    Returns
    -------
    bool
        Whether the utterance timings are ordered or not. Utterances
        without an alignment, or whose alignment bounds are not numeric,
        are ignored rather than treated as out of order.
    """

    # End time of the most recently accepted aligned utterance. Starting at
    # -1 lets a first utterance that begins at time 0 pass the check.
    last_end = -1

    for item in doc.content:
        # Only aligned utterances take part in the ordering check.
        if not (isinstance(item, Utterance) and item.alignment):
            continue

        start, end = item.alignment

        # Use the isinstance() results directly. The previous form,
        # `isinstance(...) != None`, was always True because a bool never
        # equals None, so non-numeric bounds (e.g. None) slipped through
        # and could fail in the comparisons below.
        if not (isinstance(start, numbers.Number)
                and isinstance(end, numbers.Number)):
            continue

        # An utterance that ends before it starts, or that starts before
        # the previous one ended, breaks the ordering.
        if end < start or start < last_end:
            return False

        last_end = end

    return True
|
133
|
+
|
107
134
|
def generate_chat_preamble(doc, birthdays=[]):
|
108
135
|
"""Generate header for a Batchalign document.
|
109
136
|
|
@@ -124,7 +151,8 @@ def generate_chat_preamble(doc, birthdays=[]):
|
|
124
151
|
header = []
|
125
152
|
header.append("@Languages:\t"+", ".join(doc.langs))
|
126
153
|
header.append("@Participants:\t"+", ".join([f"{i.id} {i.name}" for i in doc.tiers]))
|
127
|
-
|
154
|
+
if not check_utterances_ordered(doc):
|
155
|
+
header.append("@Options:\tbullets")
|
128
156
|
header.append("\n".join([f"@ID:\t{i.lang}|{i.corpus}|{i.id}|{i.birthday}|{i.additional[0]}|{i.additional[1]}|{i.additional[2]}|{i.name}|{i.additional[3]}|{i.additional[4]}|" for i in doc.tiers]))
|
129
157
|
for i in birthdays:
|
130
158
|
header.append(f"@{i.id}:\t{i.content}")
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/filled_pauses.eng
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/replacements.eng
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/ja/verbforms.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_file.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_generator.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_lexer.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_parser.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_utils.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/textgrid/test_textgrid.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/analysis/test_eval.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_pipeline.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_utils.py
RENAMED
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/cleanup/test_disfluency.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/fa/test_fa_pipeline.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/test_pipeline_models.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|