BatchalignHK 0.8.0.post2__tar.gz → 0.8.0.post3__tar.gz

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
Files changed (184)
  1. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/PKG-INFO +1 -1
  2. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/PKG-INFO +1 -1
  3. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/cli/dispatch.py +81 -2
  4. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/utils.py +6 -2
  5. batchalignhk-0.8.0.post3/batchalign/version +3 -0
  6. batchalignhk-0.8.0.post2/batchalign/version +0 -3
  7. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/SOURCES.txt +0 -0
  8. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/dependency_links.txt +0 -0
  9. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/entry_points.txt +0 -0
  10. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/requires.txt +0 -0
  11. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/BatchalignHK.egg-info/top_level.txt +0 -0
  12. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/LICENSE +0 -0
  13. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/MANIFEST.in +0 -0
  14. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/README.md +0 -0
  15. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/__init__.py +0 -0
  16. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/__main__.py +0 -0
  17. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/cli/__init__.py +0 -0
  18. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/cli/cli.py +0 -0
  19. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/constants.py +0 -0
  20. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/document.py +0 -0
  21. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/errors.py +0 -0
  22. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/__init__.py +0 -0
  23. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/core.py +0 -0
  24. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/exception.py +0 -0
  25. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/logging.py +0 -0
  26. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/realtime_meeting.py +0 -0
  27. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/speech_recognizer.py +0 -0
  28. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/speech_synthesizer.py +0 -0
  29. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/speech_transcriber.py +0 -0
  30. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/stream_input_tts.py +0 -0
  31. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/token.py +0 -0
  32. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/util.py +0 -0
  33. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/version.py +0 -0
  34. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/__init__.py +0 -0
  35. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_abnf.py +0 -0
  36. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_app.py +0 -0
  37. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_cookiejar.py +0 -0
  38. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_core.py +0 -0
  39. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_exceptions.py +0 -0
  40. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_handshake.py +0 -0
  41. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_http.py +0 -0
  42. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_logging.py +0 -0
  43. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_socket.py +0 -0
  44. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_ssl_compat.py +0 -0
  45. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_url.py +0 -0
  46. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/_utils.py +0 -0
  47. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/__init__.py +0 -0
  48. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/echo-server.py +0 -0
  49. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_abnf.py +0 -0
  50. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_app.py +0 -0
  51. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_cookiejar.py +0 -0
  52. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_http.py +0 -0
  53. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_url.py +0 -0
  54. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/extern/nls/websocket/tests/test_websocket.py +0 -0
  55. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/__init__.py +0 -0
  56. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/base.py +0 -0
  57. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/__init__.py +0 -0
  58. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/file.py +0 -0
  59. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/generator.py +0 -0
  60. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/lexer.py +0 -0
  61. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/parser.py +0 -0
  62. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/chat/utils.py +0 -0
  63. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/textgrid/__init__.py +0 -0
  64. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/textgrid/file.py +0 -0
  65. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/textgrid/generator.py +0 -0
  66. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/formats/textgrid/parser.py +0 -0
  67. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/__init__.py +0 -0
  68. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/resolve.py +0 -0
  69. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/speaker/__init__.py +0 -0
  70. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/speaker/config.yaml +0 -0
  71. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/speaker/infer.py +0 -0
  72. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/speaker/utils.py +0 -0
  73. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/training/__init__.py +0 -0
  74. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/training/run.py +0 -0
  75. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/training/utils.py +0 -0
  76. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utils.py +0 -0
  77. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/__init__.py +0 -0
  78. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/cantonese_infer.py +0 -0
  79. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/dataset.py +0 -0
  80. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/execute.py +0 -0
  81. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/infer.py +0 -0
  82. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/prep.py +0 -0
  83. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/utterance/train.py +0 -0
  84. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/wave2vec/__init__.py +0 -0
  85. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/wave2vec/infer_fa.py +0 -0
  86. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/whisper/__init__.py +0 -0
  87. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/whisper/infer_asr.py +0 -0
  88. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/models/whisper/infer_fa.py +0 -0
  89. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/__init__.py +0 -0
  90. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/analysis/__init__.py +0 -0
  91. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/analysis/eval.py +0 -0
  92. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/__init__.py +0 -0
  93. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/aliyun.py +0 -0
  94. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/funaudio.py +0 -0
  95. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2chinese.py +0 -0
  96. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/__init__.py +0 -0
  97. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/deu.py +0 -0
  98. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/ell.py +0 -0
  99. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/eng.py +0 -0
  100. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/eus.py +0 -0
  101. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/fra.py +0 -0
  102. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/hrv.py +0 -0
  103. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/ind.py +0 -0
  104. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/jpn.py +0 -0
  105. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/nld.py +0 -0
  106. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/por.py +0 -0
  107. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/spa.py +0 -0
  108. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/num2lang/tha.py +0 -0
  109. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/oai_whisper.py +0 -0
  110. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/rev.py +0 -0
  111. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/tencent.py +0 -0
  112. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/whisper.py +0 -0
  113. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/asr/whisperx.py +0 -0
  114. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/avqi/__init__.py +0 -0
  115. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/avqi/engine.py +0 -0
  116. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/base.py +0 -0
  117. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/__init__.py +0 -0
  118. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  119. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  120. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  121. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/retrace.py +0 -0
  122. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  123. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  124. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/cleanup/support/test.test +0 -0
  125. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/diarization/__init__.py +0 -0
  126. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/diarization/pyannote.py +0 -0
  127. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/dispatch.py +0 -0
  128. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/fa/__init__.py +0 -0
  129. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/fa/iic_fa.py +0 -0
  130. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/fa/wave2vec_fa.py +0 -0
  131. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/fa/wave2vec_fa_canto.py +0 -0
  132. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  133. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  134. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/coref.py +0 -0
  135. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
  136. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
  137. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
  138. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  139. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  140. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  141. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/opensmile/__init__.py +0 -0
  142. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/opensmile/engine.py +0 -0
  143. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/pipeline.py +0 -0
  144. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/speaker/__init__.py +0 -0
  145. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  146. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/translate/__init__.py +0 -0
  147. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/translate/gtrans.py +0 -0
  148. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/translate/seamless.py +0 -0
  149. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/translate/utils.py +0 -0
  150. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/__init__.py +0 -0
  151. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/funaudio_utr.py +0 -0
  152. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/rev_utr.py +0 -0
  153. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/tencent_utr.py +0 -0
  154. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/utils.py +0 -0
  155. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  156. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utterance/__init__.py +0 -0
  157. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
  158. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/__init__.py +0 -0
  159. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/conftest.py +0 -0
  160. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  161. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  162. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  163. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  164. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  165. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  166. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  167. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  168. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  169. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  170. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  171. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  172. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/fixures.py +0 -0
  173. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  174. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  175. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/tests/test_document.py +0 -0
  176. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/__init__.py +0 -0
  177. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/abbrev.py +0 -0
  178. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/compounds.py +0 -0
  179. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/config.py +0 -0
  180. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/dp.py +0 -0
  181. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/names.py +0 -0
  182. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/batchalign/utils/utils.py +0 -0
  183. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/setup.cfg +0 -0
  184. {batchalignhk-0.8.0.post2 → batchalignhk-0.8.0.post3}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: BatchalignHK
3
- Version: 0.8.0.post2
3
+ Version: 0.8.0.post3
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: BatchalignHK
3
- Version: 0.8.0.post2
3
+ Version: 0.8.0.post3
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -158,8 +158,87 @@ def _worker_task(file_info, command, lang, num_speakers, loader_info, writer_inf
158
158
  doc = pipeline(doc, callback=progress_callback, **kw)
159
159
  CHATFile(doc=doc).write(output, write_wor=kwargs.get("wor", True))
160
160
 
161
+ elif command in ["transcribe", "transcribe_s"]:
162
+ from batchalign.document import CustomLine, CustomLineType
163
+ # For transcribe, the "loader" just passes the file path
164
+ doc = file
165
+
166
+ # Process through pipeline
167
+ doc = pipeline(doc, callback=progress_callback)
168
+
169
+ # Write output with ASR comment
170
+ asr = kwargs.get("asr", "rev")
171
+ with open(Path(__file__).parent.parent / "version", 'r') as df:
172
+ VERSION_NUMBER = df.readline().strip()
173
+ doc.content.insert(0, CustomLine(id="Comment", type=CustomLineType.INDEPENDENT,
174
+ content=f"Batchalign {VERSION_NUMBER}, ASR Engine {asr}. Unchecked output of ASR model."))
175
+ CHATFile(doc=doc).write(output
176
+ .replace(".wav", ".cha")
177
+ .replace(".WAV", ".cha")
178
+ .replace(".mp4", ".cha")
179
+ .replace(".MP4", ".cha")
180
+ .replace(".mp3", ".cha")
181
+ .replace(".MP3", ".cha"),
182
+ write_wor=kwargs.get("wor", False))
183
+
184
+ elif command == "translate":
185
+ cf = CHATFile(path=os.path.abspath(file), special_mor_=True)
186
+ doc = cf.doc
187
+ doc = pipeline(doc, callback=progress_callback)
188
+ CHATFile(doc=doc).write(output)
189
+
190
+ elif command == "utseg":
191
+ doc = CHATFile(path=os.path.abspath(file)).doc
192
+ doc = pipeline(doc, callback=progress_callback)
193
+ CHATFile(doc=doc).write(output)
194
+
195
+ elif command == "coref":
196
+ cf = CHATFile(path=os.path.abspath(file))
197
+ doc = cf.doc
198
+ doc = pipeline(doc, callback=progress_callback)
199
+ CHATFile(doc=doc).write(output)
200
+
201
+ elif command == "benchmark":
202
+ # Find gold transcript
203
+ from pathlib import Path as P
204
+ p = P(file)
205
+ cha = p.with_suffix(".cha")
206
+ if not cha.exists():
207
+ raise FileNotFoundError(f"No gold .cha transcript found for benchmarking. audio: {p.name}, desired cha: {cha.name}, looked in: {str(cha)}")
208
+
209
+ gold_doc = CHATFile(path=str(cha), special_mor_=True).doc
210
+ doc = pipeline(file, callback=progress_callback, gold=gold_doc)
211
+
212
+ # Write benchmark results
213
+ import os
214
+ os.remove(P(output).with_suffix(".cha"))
215
+ with open(P(output).with_suffix(".wer.txt"), 'w') as df:
216
+ df.write(str(doc["wer"]))
217
+ with open(P(output).with_suffix(".diff"), 'w') as df:
218
+ df.write(str(doc["diff"]))
219
+ CHATFile(doc=doc["doc"]).write(str(P(output).with_suffix(".asr.cha")),
220
+ write_wor=kwargs.get("wor", False))
221
+
222
+ elif command == "opensmile":
223
+ from batchalign.document import Document
224
+ doc = Document.new(media_path=file, lang=lang)
225
+ results = pipeline(doc, callback=progress_callback, feature_set=kwargs.get("feature_set", "eGeMAPSv02"))
226
+
227
+ # Write opensmile results
228
+ if results.get('success', False):
229
+ output_csv = Path(output).with_suffix('.opensmile.csv')
230
+ features_df = results.get('features_df')
231
+ if features_df is not None:
232
+ features_df.to_csv(output_csv, header=['value'], index_label='feature')
233
+ else:
234
+ error_file = Path(output).with_suffix('.error.txt')
235
+ with open(error_file, 'w') as f:
236
+ f.write(f"OpenSMILE extraction failed: {results.get('error', 'Unknown error')}\n")
237
+
161
238
  else:
162
239
  loader, writer = loader_info, writer_info
240
+ if loader is None or writer is None:
241
+ raise ValueError(f"Command '{command}' requires loader and writer functions, but they are None. This may indicate an unimplemented command or configuration issue.")
163
242
  doc = loader(os.path.abspath(file))
164
243
  kw = {}
165
244
  if isinstance(doc, tuple) and len(doc) > 1:
@@ -456,8 +535,8 @@ def _dispatch(command, lang, num_speakers,
456
535
  command=command,
457
536
  lang=lang,
458
537
  num_speakers=num_speakers,
459
- loader_info=None,
460
- writer_info=None,
538
+ loader_info=loader,
539
+ writer_info=writer,
461
540
  progress_queue=progress_queue,
462
541
  verbose=ctx.obj["verbose"],
463
542
  **kwargs)
@@ -93,11 +93,15 @@ def retokenize_with_engine(intermediate_output, engine):
93
93
  ----------
94
94
  intermediate_output : List
95
95
  Rev.AI style output.
96
-
96
+
97
97
  engine : UtteranceEngine
98
98
  The utterance Engine to use.
99
99
  """
100
-
100
+
101
+ # Safety check: if engine is None or not callable, fall back to regular retokenize
102
+ if engine is None or not callable(engine):
103
+ return retokenize(intermediate_output)
104
+
101
105
  final_outputs = []
102
106
 
103
107
  for speaker, utterance in intermediate_output:
@@ -0,0 +1,3 @@
1
+ 0.8.0-post.3
2
+ Jan 16th, 2025
3
+ Patch regression?
@@ -1,3 +0,0 @@
1
- 0.8.0-post.2
2
- Jan 15th, 2025
3
- Memory Safegaurds