batchalign 0.7.6a5__tar.gz → 0.7.6a7__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {batchalign-0.7.6a5/batchalign.egg-info → batchalign-0.7.6a7}/PKG-INFO +1 -1
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/whisper/infer_asr.py +98 -17
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/morphosyntax/ud.py +2 -0
- batchalign-0.7.6a7/batchalign/version +3 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7/batchalign.egg-info}/PKG-INFO +1 -1
- batchalign-0.7.6a5/batchalign/version +0 -3
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/LICENSE +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/MANIFEST.in +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/README.md +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/__main__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/cli/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/cli/cli.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/cli/dispatch.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/constants.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/document.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/errors.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/base.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/file.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/generator.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/lexer.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/parser.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/chat/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/textgrid/file.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/resolve.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/speaker/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/speaker/config.yaml +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/speaker/infer.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/speaker/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/training/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/training/run.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/training/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/dataset.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/execute.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/infer.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/prep.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/utterance/train.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/whisper/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/analysis/eval.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/base.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/dispatch.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/morphosyntax/coref.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/pipeline.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/conftest.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/test_document.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/utils/__init__.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/utils/config.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/utils/dp.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/utils/utils.py +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign.egg-info/SOURCES.txt +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign.egg-info/dependency_links.txt +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign.egg-info/entry_points.txt +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign.egg-info/requires.txt +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign.egg-info/top_level.txt +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/setup.cfg +0 -0
- {batchalign-0.7.6a5 → batchalign-0.7.6a7}/setup.py +0 -0
@@ -64,19 +64,89 @@ class WhisperASRModel(object):
|
|
64
64
|
|
65
65
|
def __init__(self, model, base="openai/whisper-large-v3", language="english", target_sample_rate=16000):
|
66
66
|
L.debug("Initializing whisper model...")
|
67
|
-
self.pipe = pipeline(
|
68
|
-
"automatic-speech-recognition",
|
69
|
-
model=model,
|
70
|
-
tokenizer=WhisperTokenizer.from_pretrained(base),
|
71
|
-
chunk_length_s=25,
|
72
|
-
stride_length_s=3,
|
73
|
-
device=DEVICE,
|
74
|
-
torch_dtype=torch.float32,
|
75
|
-
return_timestamps="word",
|
76
|
-
)
|
77
|
-
L.debug("Done, initalizing processor and config...")
|
78
67
|
self.__config = GenerationConfig.from_pretrained(base)
|
79
68
|
self.__config.no_repeat_ngram_size = 4
|
69
|
+
|
70
|
+
if language == "Cantonese":
|
71
|
+
self.pipe = pipeline(
|
72
|
+
"automatic-speech-recognition",
|
73
|
+
model=model,
|
74
|
+
# tokenizer=WhisperTokenizer.from_pretrained(base),
|
75
|
+
chunk_length_s=30,
|
76
|
+
# stride_length_s=3,
|
77
|
+
device=DEVICE,
|
78
|
+
# torch_dtype=torch.float32,
|
79
|
+
return_timestamps="word",
|
80
|
+
)
|
81
|
+
self.__config = GenerationConfig.from_model_config(self.pipe.model.config)
|
82
|
+
self.__config.no_repeat_ngram_size = 4
|
83
|
+
self.__config.use_cache = False
|
84
|
+
|
85
|
+
forced_decoder_ids = self.pipe.tokenizer.get_decoder_prompt_ids(language="yue", task="transcribe")
|
86
|
+
|
87
|
+
suppress_tokens = []
|
88
|
+
|
89
|
+
# Define other parameters
|
90
|
+
return_attention_mask = False
|
91
|
+
pad_token_id = 50257
|
92
|
+
bos_token_id = 50257
|
93
|
+
eos_token_id = 50257
|
94
|
+
decoder_start_token_id = 50258
|
95
|
+
begin_suppress_tokens = [
|
96
|
+
220,
|
97
|
+
50257
|
98
|
+
],
|
99
|
+
alignment_heads = [
|
100
|
+
[5, 3],
|
101
|
+
[5, 9],
|
102
|
+
[8, 0],
|
103
|
+
[8, 4],
|
104
|
+
[8, 8],
|
105
|
+
[9, 0],
|
106
|
+
[9, 7],
|
107
|
+
[9, 9],
|
108
|
+
[10, 5]
|
109
|
+
]
|
110
|
+
lang_to_id = {"<|yue|>": 50325}
|
111
|
+
task_to_id = {"transcribe": 50359}
|
112
|
+
is_multilingual = True
|
113
|
+
max_initial_timestamp_index = 50
|
114
|
+
no_timestamps_token_id = 50363
|
115
|
+
prev_sot_token_id = 50361
|
116
|
+
max_length = 448
|
117
|
+
|
118
|
+
# Assign values to generation config
|
119
|
+
self.__config.forced_decoder_ids = forced_decoder_ids
|
120
|
+
self.__config.suppress_tokens = suppress_tokens
|
121
|
+
self.__config.pad_token_id = pad_token_id
|
122
|
+
self.__config.bos_token_id = bos_token_id
|
123
|
+
self.__config.eos_token_id = eos_token_id
|
124
|
+
self.__config.decoder_start_token_id = decoder_start_token_id
|
125
|
+
self.__config.lang_to_id = lang_to_id
|
126
|
+
self.__config.task_to_id = task_to_id
|
127
|
+
self.__config.alignment_heads = alignment_heads
|
128
|
+
self.__config.alignment_heads = alignment_heads
|
129
|
+
self.__config.begin_suppress_tokens = begin_suppress_tokens
|
130
|
+
self.__config.is_multilingual = is_multilingual
|
131
|
+
self.__config.max_initial_timestamp_index = max_initial_timestamp_index
|
132
|
+
self.__config.no_timestamps_token_id = no_timestamps_token_id
|
133
|
+
self.__config.prev_sot_token_id = prev_sot_token_id
|
134
|
+
self.__config.max_length =max_length
|
135
|
+
|
136
|
+
self.pipe.model.generation_config = self.__config
|
137
|
+
|
138
|
+
else:
|
139
|
+
self.pipe = pipeline(
|
140
|
+
"automatic-speech-recognition",
|
141
|
+
model=model,
|
142
|
+
tokenizer=WhisperTokenizer.from_pretrained(base),
|
143
|
+
chunk_length_s=25,
|
144
|
+
stride_length_s=3,
|
145
|
+
device=DEVICE,
|
146
|
+
torch_dtype=torch.float32,
|
147
|
+
return_timestamps="word",
|
148
|
+
)
|
149
|
+
L.debug("Done, initalizing processor and config...")
|
80
150
|
processor = WhisperProcessor.from_pretrained(base)
|
81
151
|
L.debug("Whisper initialization done.")
|
82
152
|
|
@@ -147,14 +217,25 @@ class WhisperASRModel(object):
|
|
147
217
|
})
|
148
218
|
|
149
219
|
L.debug("Whisper Transcribing...")
|
220
|
+
config = {
|
221
|
+
"repetition_penalty": 1.001,
|
222
|
+
"generation_config": self.__config,
|
223
|
+
"task": "transcribe",
|
224
|
+
"language": self.lang
|
225
|
+
}
|
226
|
+
|
227
|
+
if self.lang == "Cantonese":
|
228
|
+
config = {
|
229
|
+
"repetition_penalty": 1.001,
|
230
|
+
# "generation_config": self.__config,
|
231
|
+
# "task": "transcribe",
|
232
|
+
# "language": self.lang
|
233
|
+
}
|
234
|
+
|
150
235
|
words = self.pipe(data.cpu().numpy(),
|
151
236
|
batch_size=1,
|
152
|
-
generate_kwargs
|
153
|
-
|
154
|
-
"generation_config": self.__config,
|
155
|
-
"task": "transcribe",
|
156
|
-
"language": self.lang
|
157
|
-
})
|
237
|
+
generate_kwargs=config)
|
238
|
+
|
158
239
|
# "do_sample": True,
|
159
240
|
# "temperature": 0.1
|
160
241
|
# })
|
@@ -202,6 +202,8 @@ def handler__NOUN(word, lang=None):
|
|
202
202
|
case = feats.get("Case", "").replace(",", "")
|
203
203
|
type = feats.get("PronType", "")
|
204
204
|
|
205
|
+
if word.get("deprel") == "obj" and case.strip() == "":
|
206
|
+
case = "Acc"
|
205
207
|
|
206
208
|
# clear defaults
|
207
209
|
if gender_str == "-Com,Neut" or gender_str == "-Com" or gender_str == "-ComNeut": gender_str=""
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/support/filled_pauses.eng
RENAMED
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/pipelines/cleanup/support/replacements.eng
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/chat/test_chat_generator.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/formats/textgrid/test_textgrid.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/asr/test_asr_pipeline.py
RENAMED
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/cleanup/test_disfluency.py
RENAMED
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/cleanup/test_parse_support.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{batchalign-0.7.6a5 → batchalign-0.7.6a7}/batchalign/tests/pipelines/test_pipeline_models.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|