BatchalignHK 0.7.19.post21__tar.gz → 0.7.19.post23__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/PKG-INFO +1 -1
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/PKG-INFO +1 -1
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/analysis/eval.py +46 -3
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/dp.py +6 -5
- batchalignhk-0.7.19.post23/batchalign/version +3 -0
- batchalignhk-0.7.19.post21/batchalign/version +0 -3
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/SOURCES.txt +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/dependency_links.txt +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/entry_points.txt +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/requires.txt +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/top_level.txt +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/LICENSE +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/MANIFEST.in +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/README.md +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/__main__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/cli/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/cli/cli.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/cli/dispatch.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/constants.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/document.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/errors.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/core.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/exception.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/logging.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/realtime_meeting.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/speech_recognizer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/speech_synthesizer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/speech_transcriber.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/stream_input_tts.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/token.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/util.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/version.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_abnf.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_app.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_cookiejar.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_core.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_exceptions.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_handshake.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_http.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_logging.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_socket.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_ssl_compat.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_url.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/echo-server.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_abnf.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_app.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_cookiejar.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_http.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_url.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/tests/test_websocket.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/base.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/file.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/generator.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/lexer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/parser.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/file.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/generator.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/parser.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/resolve.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/config.yaml +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/infer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/training/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/training/run.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/training/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/cantonese_infer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/dataset.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/execute.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/infer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/prep.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/train.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/wave2vec/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/wave2vec/infer_fa.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/infer_asr.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/infer_fa.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/analysis/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/aliyun.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/num2chinese.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/oai_whisper.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/rev.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/tencent.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/whisper.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/whisperx.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/base.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/cleanup.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/parse_support.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/retrace.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/support/test.test +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/dispatch.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/wave2vec_fa.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/whisper_fa.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/coref.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/ud.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/pipeline.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/speaker/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/gtrans.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/seamless.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/rev_utr.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/tencent_utr.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/whisper_utr.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utterance/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/conftest.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/fixures.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/test_pipeline.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/test_document.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/__init__.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/abbrev.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/config.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/names.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/utils/utils.py +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/setup.cfg +0 -0
- {batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/setup.py +0 -0
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/analysis/eval.py
RENAMED
|
@@ -38,9 +38,47 @@ def conform(x):
|
|
|
38
38
|
elif "wanna" == i.strip():
|
|
39
39
|
result.append("want")
|
|
40
40
|
result.append("to")
|
|
41
|
+
elif "ii" == i.strip():
|
|
42
|
+
result.append("i")
|
|
43
|
+
result.append("i")
|
|
44
|
+
elif "i'd" == i.strip():
|
|
45
|
+
result.append("i")
|
|
46
|
+
result.append("had")
|
|
47
|
+
elif "tshirts" == i.strip():
|
|
48
|
+
result.append("t")
|
|
49
|
+
result.append("shirts")
|
|
50
|
+
elif "tshirts" == i.strip():
|
|
51
|
+
result.append("t")
|
|
52
|
+
result.append("shirts")
|
|
53
|
+
elif "anytime" == i.strip():
|
|
54
|
+
result.append("any")
|
|
55
|
+
result.append("time")
|
|
56
|
+
elif "alright" == i.strip():
|
|
57
|
+
result.append("all")
|
|
58
|
+
result.append("right")
|
|
59
|
+
elif "sorta" == i.strip():
|
|
60
|
+
result.append("sort")
|
|
61
|
+
result.append("of")
|
|
62
|
+
elif "alrightie" == i.strip():
|
|
63
|
+
result.append("all")
|
|
64
|
+
result.append("right")
|
|
65
|
+
elif "mm" == i.strip():
|
|
66
|
+
result.append("hm")
|
|
67
|
+
elif "ai" == i.strip():
|
|
68
|
+
result.append("a")
|
|
69
|
+
result.append("i")
|
|
70
|
+
elif "this'll" == i.strip():
|
|
71
|
+
result.append("this")
|
|
72
|
+
result.append("will")
|
|
41
73
|
elif "gotta" == i.strip():
|
|
42
74
|
result.append("got")
|
|
43
75
|
result.append("to")
|
|
76
|
+
elif "eh" == i.strip():
|
|
77
|
+
result.append("uh")
|
|
78
|
+
elif "kinda" == i.strip():
|
|
79
|
+
result.append("a")
|
|
80
|
+
result.append("kind")
|
|
81
|
+
result.append("of")
|
|
44
82
|
elif "farmhouse" == i.strip():
|
|
45
83
|
result.append("farm")
|
|
46
84
|
result.append("house")
|
|
@@ -57,6 +95,11 @@ def conform(x):
|
|
|
57
95
|
|
|
58
96
|
return result
|
|
59
97
|
|
|
98
|
+
def match_fn(x,y):
|
|
99
|
+
return (y == x or
|
|
100
|
+
y.replace("(", "").replace(")", "") == x.replace("(", "").replace(")", "") or
|
|
101
|
+
re.sub(r"\((.*)\)",r"", y) == x or re.sub(r"\((.*)\)",r"", x) == y)
|
|
102
|
+
|
|
60
103
|
class EvaluationEngine(BatchalignEngine):
|
|
61
104
|
tasks = [ Task.WER ]
|
|
62
105
|
|
|
@@ -69,8 +112,8 @@ class EvaluationEngine(BatchalignEngine):
|
|
|
69
112
|
forms = [i.replace("-", "") for i in forms if i.strip() not in MOR_PUNCT+ENDING_PUNCT]
|
|
70
113
|
gold_forms = [i.replace("-", "") for i in gold_forms if i.strip() not in MOR_PUNCT+ENDING_PUNCT]
|
|
71
114
|
|
|
72
|
-
forms = [re.sub(r"\((.*)\)",r"", i) for i in forms]
|
|
73
|
-
gold_forms = [re.sub(r"\((.*)\)",r"", i) for i in gold_forms]
|
|
115
|
+
# forms = [re.sub(r"\((.*)\)",r"", i) for i in forms]
|
|
116
|
+
# gold_forms = [re.sub(r"\((.*)\)",r"", i) for i in gold_forms]
|
|
74
117
|
|
|
75
118
|
# if there are single letter frames, we combine them tofgether
|
|
76
119
|
# until the utterance is done or there isn't any left
|
|
@@ -111,7 +154,7 @@ class EvaluationEngine(BatchalignEngine):
|
|
|
111
154
|
forms_final = conform(forms_final)
|
|
112
155
|
|
|
113
156
|
# dp!
|
|
114
|
-
alignment = align(forms_final, gold_final, False)
|
|
157
|
+
alignment = align(forms_final, gold_final, False, match_fn)
|
|
115
158
|
|
|
116
159
|
# calculate each type of error
|
|
117
160
|
sub = 0
|
|
@@ -76,7 +76,7 @@ def __serialize_arr(src, tgt):
|
|
|
76
76
|
|
|
77
77
|
return src_serialized, tgt_serialized
|
|
78
78
|
|
|
79
|
-
def __dp(payload, reference, t):
|
|
79
|
+
def __dp(payload, reference, t, match_fn):
|
|
80
80
|
"""Performs bottom-up dynamic programming alignment
|
|
81
81
|
|
|
82
82
|
Parameters
|
|
@@ -149,7 +149,7 @@ def __dp(payload, reference, t):
|
|
|
149
149
|
# get a match.
|
|
150
150
|
|
|
151
151
|
# recall 1 indexing
|
|
152
|
-
is_match = (reference[i-1].key
|
|
152
|
+
is_match = match_fn(reference[i-1].key, payload[j-1].key)
|
|
153
153
|
|
|
154
154
|
# calculate new distances
|
|
155
155
|
new_dist1 = dist1+(0 if is_match else 2)
|
|
@@ -209,15 +209,16 @@ def __dp(payload, reference, t):
|
|
|
209
209
|
|
|
210
210
|
def align(source_payload_sequence,
|
|
211
211
|
target_reference_sequence,
|
|
212
|
-
tqdm=True
|
|
212
|
+
tqdm=True,
|
|
213
|
+
match_fn=lambda x,y: x==y):
|
|
213
214
|
"""Align two sequences"""
|
|
214
215
|
|
|
215
216
|
if (len(source_payload_sequence) > 0 and
|
|
216
217
|
type(source_payload_sequence[0]) == PayloadTarget):
|
|
217
|
-
return __dp(source_payload_sequence, target_reference_sequence, tqdm)
|
|
218
|
+
return __dp(source_payload_sequence, target_reference_sequence, tqdm, match_fn)
|
|
218
219
|
else:
|
|
219
220
|
return __dp(*__serialize_arr(source_payload_sequence,
|
|
220
|
-
target_reference_sequence), tqdm)
|
|
221
|
+
target_reference_sequence), tqdm, match_fn)
|
|
221
222
|
|
|
222
223
|
# align([1,2,3,4,4,5,5,5], [1,1,3,4,4,12,5,5,18])
|
|
223
224
|
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/entry_points.txt
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/requires.txt
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/BatchalignHK.egg-info/top_level.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/exception.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/realtime_meeting.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/speech_recognizer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/stream_input_tts.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_abnf.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_app.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_core.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_http.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_socket.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_url.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/extern/nls/websocket/_utils.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/chat/generator.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/file.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/generator.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/formats/textgrid/parser.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/config.yaml
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/infer.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/speaker/utils.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/training/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/training/utils.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/dataset.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/execute.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/infer.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/prep.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/utterance/train.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/wave2vec/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/wave2vec/infer_fa.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/infer_asr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/models/whisper/infer_fa.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/analysis/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/aliyun.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/num2chinese.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/oai_whisper.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/tencent.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/whisper.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/asr/whisperx.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/cleanup.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/cleanup/retrace.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/wave2vec_fa.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/fa/whisper_fa.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/coref.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/morphosyntax/ud.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/speaker/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/gtrans.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/seamless.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/translate/utils.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/__init__.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/rev_utr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/tencent_utr.py
RENAMED
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utr/whisper_utr.py
RENAMED
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/pipelines/utterance/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{batchalignhk-0.7.19.post21 → batchalignhk-0.7.19.post23}/batchalign/tests/pipelines/fixures.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|