BatchalignHK 0.7.20.post3__tar.gz → 0.7.20.post5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (161)
  1. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/PKG-INFO +4 -4
  2. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/requires.txt +2 -1
  3. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/PKG-INFO +4 -4
  4. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/lexer.py +9 -10
  5. batchalignhk-0.7.20.post5/batchalign/version +3 -0
  6. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/setup.py +2 -1
  7. batchalignhk-0.7.20.post3/batchalign/version +0 -3
  8. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/SOURCES.txt +0 -0
  9. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/dependency_links.txt +0 -0
  10. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/entry_points.txt +0 -0
  11. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/BatchalignHK.egg-info/top_level.txt +0 -0
  12. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/LICENSE +0 -0
  13. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/MANIFEST.in +0 -0
  14. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/README.md +0 -0
  15. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/__init__.py +0 -0
  16. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/__main__.py +0 -0
  17. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/cli/__init__.py +0 -0
  18. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/cli/cli.py +0 -0
  19. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/cli/dispatch.py +0 -0
  20. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/constants.py +0 -0
  21. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/document.py +0 -0
  22. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/errors.py +0 -0
  23. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/__init__.py +0 -0
  24. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/core.py +0 -0
  25. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/exception.py +0 -0
  26. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/logging.py +0 -0
  27. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/realtime_meeting.py +0 -0
  28. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/speech_recognizer.py +0 -0
  29. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/speech_synthesizer.py +0 -0
  30. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/speech_transcriber.py +0 -0
  31. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/stream_input_tts.py +0 -0
  32. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/token.py +0 -0
  33. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/util.py +0 -0
  34. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/version.py +0 -0
  35. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/__init__.py +0 -0
  36. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_abnf.py +0 -0
  37. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_app.py +0 -0
  38. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_cookiejar.py +0 -0
  39. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_core.py +0 -0
  40. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_exceptions.py +0 -0
  41. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_handshake.py +0 -0
  42. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_http.py +0 -0
  43. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_logging.py +0 -0
  44. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_socket.py +0 -0
  45. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_ssl_compat.py +0 -0
  46. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_url.py +0 -0
  47. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/_utils.py +0 -0
  48. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/__init__.py +0 -0
  49. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/echo-server.py +0 -0
  50. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_abnf.py +0 -0
  51. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_app.py +0 -0
  52. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_cookiejar.py +0 -0
  53. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_http.py +0 -0
  54. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_url.py +0 -0
  55. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/extern/nls/websocket/tests/test_websocket.py +0 -0
  56. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/__init__.py +0 -0
  57. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/base.py +0 -0
  58. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/__init__.py +0 -0
  59. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/file.py +0 -0
  60. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/generator.py +0 -0
  61. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/parser.py +0 -0
  62. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/chat/utils.py +0 -0
  63. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/textgrid/__init__.py +0 -0
  64. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/textgrid/file.py +0 -0
  65. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/textgrid/generator.py +0 -0
  66. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/formats/textgrid/parser.py +0 -0
  67. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/__init__.py +0 -0
  68. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/resolve.py +0 -0
  69. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/speaker/__init__.py +0 -0
  70. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/speaker/config.yaml +0 -0
  71. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/speaker/infer.py +0 -0
  72. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/speaker/utils.py +0 -0
  73. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/training/__init__.py +0 -0
  74. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/training/run.py +0 -0
  75. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/training/utils.py +0 -0
  76. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utils.py +0 -0
  77. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/__init__.py +0 -0
  78. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/cantonese_infer.py +0 -0
  79. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/dataset.py +0 -0
  80. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/execute.py +0 -0
  81. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/infer.py +0 -0
  82. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/prep.py +0 -0
  83. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/utterance/train.py +0 -0
  84. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/wave2vec/__init__.py +0 -0
  85. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/wave2vec/infer_fa.py +0 -0
  86. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/whisper/__init__.py +0 -0
  87. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/whisper/infer_asr.py +0 -0
  88. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/models/whisper/infer_fa.py +0 -0
  89. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/__init__.py +0 -0
  90. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/analysis/__init__.py +0 -0
  91. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/analysis/eval.py +0 -0
  92. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/__init__.py +0 -0
  93. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/aliyun.py +0 -0
  94. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/num2chinese.py +0 -0
  95. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/oai_whisper.py +0 -0
  96. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/rev.py +0 -0
  97. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/tencent.py +0 -0
  98. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/utils.py +0 -0
  99. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/whisper.py +0 -0
  100. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/asr/whisperx.py +0 -0
  101. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/base.py +0 -0
  102. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/__init__.py +0 -0
  103. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  104. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  105. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  106. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/retrace.py +0 -0
  107. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  108. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  109. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/cleanup/support/test.test +0 -0
  110. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/dispatch.py +0 -0
  111. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/fa/__init__.py +0 -0
  112. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/fa/wave2vec_fa.py +0 -0
  113. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  114. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  115. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/coref.py +0 -0
  116. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
  117. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
  118. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
  119. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  120. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  121. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  122. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/pipeline.py +0 -0
  123. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/speaker/__init__.py +0 -0
  124. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  125. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/translate/__init__.py +0 -0
  126. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/translate/gtrans.py +0 -0
  127. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/translate/seamless.py +0 -0
  128. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/translate/utils.py +0 -0
  129. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utr/__init__.py +0 -0
  130. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utr/rev_utr.py +0 -0
  131. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utr/tencent_utr.py +0 -0
  132. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utr/utils.py +0 -0
  133. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  134. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utterance/__init__.py +0 -0
  135. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
  136. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/__init__.py +0 -0
  137. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/conftest.py +0 -0
  138. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  139. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  140. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  141. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  142. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  143. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  144. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  145. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  146. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  147. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  148. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  149. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  150. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/fixures.py +0 -0
  151. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  152. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  153. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/tests/test_document.py +0 -0
  154. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/__init__.py +0 -0
  155. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/abbrev.py +0 -0
  156. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/compounds.py +0 -0
  157. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/config.py +0 -0
  158. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/dp.py +0 -0
  159. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/names.py +0 -0
  160. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/batchalign/utils/utils.py +0 -0
  161. {batchalignhk-0.7.20.post3 → batchalignhk-0.7.20.post5}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.4
1
+ Metadata-Version: 2.2
2
2
  Name: BatchalignHK
3
- Version: 0.7.20.post3
3
+ Version: 0.7.20.post5
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -16,13 +16,14 @@ Requires-Dist: torchaudio
16
16
  Requires-Dist: opencc-python-reimplemented
17
17
  Requires-Dist: pydub
18
18
  Requires-Dist: plotly>=5.3.0
19
- Requires-Dist: transformers>=4.37
19
+ Requires-Dist: transformers>=4.38.2
20
20
  Requires-Dist: tokenizers>=0.14.1
21
21
  Requires-Dist: pycountry>=22.3
22
22
  Requires-Dist: stanza[transformers]>=1.10.1
23
23
  Requires-Dist: scipy~=1.11
24
24
  Requires-Dist: rev_ai>=2.18.0
25
25
  Requires-Dist: rich~=13.6
26
+ Requires-Dist: omegaconf
26
27
  Requires-Dist: click~=8.1
27
28
  Requires-Dist: matplotlib<4.0.0,>=3.8.0
28
29
  Requires-Dist: pyfiglet==1.0.2
@@ -52,7 +53,6 @@ Dynamic: author-email
52
53
  Dynamic: classifier
53
54
  Dynamic: description
54
55
  Dynamic: description-content-type
55
- Dynamic: license-file
56
56
  Dynamic: provides-extra
57
57
  Dynamic: requires-dist
58
58
  Dynamic: summary
@@ -6,13 +6,14 @@ torchaudio
6
6
  opencc-python-reimplemented
7
7
  pydub
8
8
  plotly>=5.3.0
9
- transformers>=4.37
9
+ transformers>=4.38.2
10
10
  tokenizers>=0.14.1
11
11
  pycountry>=22.3
12
12
  stanza[transformers]>=1.10.1
13
13
  scipy~=1.11
14
14
  rev_ai>=2.18.0
15
15
  rich~=13.6
16
+ omegaconf
16
17
  click~=8.1
17
18
  matplotlib<4.0.0,>=3.8.0
18
19
  pyfiglet==1.0.2
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.4
1
+ Metadata-Version: 2.2
2
2
  Name: BatchalignHK
3
- Version: 0.7.20.post3
3
+ Version: 0.7.20.post5
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -16,13 +16,14 @@ Requires-Dist: torchaudio
16
16
  Requires-Dist: opencc-python-reimplemented
17
17
  Requires-Dist: pydub
18
18
  Requires-Dist: plotly>=5.3.0
19
- Requires-Dist: transformers>=4.37
19
+ Requires-Dist: transformers>=4.38.2
20
20
  Requires-Dist: tokenizers>=0.14.1
21
21
  Requires-Dist: pycountry>=22.3
22
22
  Requires-Dist: stanza[transformers]>=1.10.1
23
23
  Requires-Dist: scipy~=1.11
24
24
  Requires-Dist: rev_ai>=2.18.0
25
25
  Requires-Dist: rich~=13.6
26
+ Requires-Dist: omegaconf
26
27
  Requires-Dist: click~=8.1
27
28
  Requires-Dist: matplotlib<4.0.0,>=3.8.0
28
29
  Requires-Dist: pyfiglet==1.0.2
@@ -52,7 +53,6 @@ Dynamic: author-email
52
53
  Dynamic: classifier
53
54
  Dynamic: description
54
55
  Dynamic: description-content-type
55
- Dynamic: license-file
56
56
  Dynamic: provides-extra
57
57
  Dynamic: requires-dist
58
58
  Dynamic: summary
@@ -47,7 +47,7 @@ class UtteranceLexer:
47
47
  decoded.append((i, type))
48
48
  return decoded
49
49
 
50
- def __get_until(self, end_tokens=[' ']):
50
+ def _get_until(self, end_tokens=[' ']):
51
51
  has_read_nonempty = False
52
52
  tokens = []
53
53
  while True:
@@ -79,7 +79,8 @@ class UtteranceLexer:
79
79
  # self.__clauses.append((form.strip(), TokenType.FEAT))
80
80
  elif form.strip() in NORMAL_GROUP_MARKS:
81
81
  # basically ignore the form
82
- pass
82
+ self.__clauses.append((self.__clauses.pop(-1)[0], TokenType.REGULAR))
83
+ # pass
83
84
  # self.__clauses.append((form.strip(), TokenType.FEAT))
84
85
  elif form[0] == "[" and form[:2] != "[:":
85
86
  # we ignore all other things which are simple annotations
@@ -97,13 +98,13 @@ class UtteranceLexer:
97
98
  self.__clauses.append((annotation_clean(form).strip(), TokenType.REGULAR))
98
99
 
99
100
  def __pull(self):
100
- form, num, delim = self.__get_until()
101
+ form, num, delim = self._get_until()
101
102
 
102
103
  self.__handle(form, num, delim)
103
104
 
104
105
  return form
105
106
 
106
- def __get_group(self, form, type):
107
+ def _get_group(self, form, type):
107
108
  text = ""
108
109
  group = [form]
109
110
 
@@ -113,11 +114,10 @@ class UtteranceLexer:
113
114
 
114
115
  # scan forward until we have the first actual form, if
115
116
  # its a selection group
116
- if type == ">" and annotation_clean(form, special=True) == "":
117
- form, num, delim = self.__get_until()
117
+ if type == ">" and annotation_clean(form, special=True) == "" and form != "<":
118
+ form, num, delim = self._get_until()
118
119
  group = [group.pop(0).strip()+annotation_clean(form)]
119
120
 
120
-
121
121
  # decrement nesting first
122
122
  if form not in REPEAT_GROUP_MARKS and form not in NORMAL_GROUP_MARKS:
123
123
  if type == ">" and ">" in form:
@@ -127,7 +127,7 @@ class UtteranceLexer:
127
127
 
128
128
  # grab forward the entire group
129
129
  while (type not in form) or (nesting != -1):
130
- form, num, delim = self.__get_until()
130
+ form, num, delim = self._get_until()
131
131
 
132
132
  sform = copy.deepcopy(form)
133
133
  for i in REPEAT_GROUP_MARKS + NORMAL_GROUP_MARKS:
@@ -157,7 +157,6 @@ class UtteranceLexer:
157
157
  words = [re.compile(r"[^A-Za-zÀ-ÖØ-öø-ÿ']").sub("", i).strip() for i in group
158
158
  if re.compile(r"[^A-Za-zÀ-ÖØ-öø-ÿ']").sub("", i).strip()!= ""]
159
159
 
160
-
161
160
  if type == "]":
162
161
  return words, special[0], text
163
162
  else:
@@ -167,7 +166,7 @@ class UtteranceLexer:
167
166
  orig_form = form
168
167
 
169
168
  # scan the group
170
- words, special, text = self.__get_group(form, type)
169
+ words, special, text = self._get_group(form, type)
171
170
  text = form + text
172
171
 
173
172
  if len(text.strip()) == 0:
@@ -0,0 +1,3 @@
1
+ 0.7.20-post.5
2
+ July 25th, 2025
3
+ Patch lexer fixes (wip?)
@@ -38,13 +38,14 @@ setup(
38
38
  "pydub",
39
39
  # "imblearn",
40
40
  "plotly>=5.3.0",
41
- "transformers>=4.37",
41
+ "transformers>=4.38.2",
42
42
  "tokenizers>=0.14.1",
43
43
  "pycountry>=22.3",
44
44
  "stanza[transformers]>=1.10.1",
45
45
  "scipy~=1.11",
46
46
  "rev_ai>=2.18.0",
47
47
  "rich~=13.6",
48
+ "omegaconf",
48
49
  "click~=8.1",
49
50
  "matplotlib>=3.8.0,<4.0.0",
50
51
  "pyfiglet==1.0.2",
@@ -1,3 +0,0 @@
1
- 0.7.20-post.3
2
- July 21th, 2025
3
- Some benchmarking abbreviations