BatchalignHK 0.7.18.post8__tar.gz → 0.7.18.post11__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (122)
  1. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/PKG-INFO +10 -31
  2. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/requires.txt +1 -0
  3. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/PKG-INFO +10 -31
  4. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/README.md +6 -29
  5. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/resolve.py +1 -0
  6. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/wave2vec_fa.py +1 -1
  7. batchalignhk-0.7.18.post11/batchalign/version +3 -0
  8. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/setup.py +4 -0
  9. batchalignhk-0.7.18.post8/batchalign/version +0 -3
  10. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/SOURCES.txt +0 -0
  11. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/dependency_links.txt +0 -0
  12. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/entry_points.txt +0 -0
  13. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/BatchalignHK.egg-info/top_level.txt +0 -0
  14. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/LICENSE +0 -0
  15. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/MANIFEST.in +0 -0
  16. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/__init__.py +0 -0
  17. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/__main__.py +0 -0
  18. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/__init__.py +0 -0
  19. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/cli.py +0 -0
  20. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/cli/dispatch.py +0 -0
  21. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/constants.py +0 -0
  22. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/document.py +0 -0
  23. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/errors.py +0 -0
  24. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/__init__.py +0 -0
  25. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/base.py +0 -0
  26. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/__init__.py +0 -0
  27. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/file.py +0 -0
  28. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/generator.py +0 -0
  29. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/lexer.py +0 -0
  30. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/parser.py +0 -0
  31. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/chat/utils.py +0 -0
  32. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/__init__.py +0 -0
  33. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/file.py +0 -0
  34. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/generator.py +0 -0
  35. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/formats/textgrid/parser.py +0 -0
  36. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/__init__.py +0 -0
  37. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/__init__.py +0 -0
  38. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/config.yaml +0 -0
  39. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/infer.py +0 -0
  40. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/speaker/utils.py +0 -0
  41. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/__init__.py +0 -0
  42. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/run.py +0 -0
  43. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/training/utils.py +0 -0
  44. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utils.py +0 -0
  45. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/__init__.py +0 -0
  46. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/cantonese_infer.py +0 -0
  47. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/dataset.py +0 -0
  48. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/execute.py +0 -0
  49. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/infer.py +0 -0
  50. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/prep.py +0 -0
  51. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/utterance/train.py +0 -0
  52. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/__init__.py +0 -0
  53. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/wave2vec/infer_fa.py +0 -0
  54. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/__init__.py +0 -0
  55. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_asr.py +0 -0
  56. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/models/whisper/infer_fa.py +0 -0
  57. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/__init__.py +0 -0
  58. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/__init__.py +0 -0
  59. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/analysis/eval.py +0 -0
  60. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/__init__.py +0 -0
  61. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/num2chinese.py +0 -0
  62. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/rev.py +0 -0
  63. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/tencent.py +0 -0
  64. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/utils.py +0 -0
  65. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisper.py +0 -0
  66. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/asr/whisperx.py +0 -0
  67. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/base.py +0 -0
  68. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/__init__.py +0 -0
  69. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  70. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  71. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  72. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/retrace.py +0 -0
  73. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  74. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  75. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/cleanup/support/test.test +0 -0
  76. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/dispatch.py +0 -0
  77. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/__init__.py +0 -0
  78. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  79. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  80. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/coref.py +0 -0
  81. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
  82. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
  83. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
  84. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  85. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  86. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  87. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/pipeline.py +0 -0
  88. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/speaker/__init__.py +0 -0
  89. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  90. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/__init__.py +0 -0
  91. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/gtrans.py +0 -0
  92. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/seamless.py +0 -0
  93. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/translate/utils.py +0 -0
  94. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/__init__.py +0 -0
  95. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/rev_utr.py +0 -0
  96. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/utils.py +0 -0
  97. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  98. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utterance/__init__.py +0 -0
  99. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
  100. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/__init__.py +0 -0
  101. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/conftest.py +0 -0
  102. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  103. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  104. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  105. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  106. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  107. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  108. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  109. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  110. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  111. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  112. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  113. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  114. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/fixures.py +0 -0
  115. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  116. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  117. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/tests/test_document.py +0 -0
  118. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/__init__.py +0 -0
  119. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/config.py +0 -0
  120. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/dp.py +0 -0
  121. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/batchalign/utils/utils.py +0 -0
  122. {batchalignhk-0.7.18.post8 → batchalignhk-0.7.18.post11}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.2
1
+ Metadata-Version: 2.4
2
2
  Name: BatchalignHK
3
- Version: 0.7.18.post8
3
+ Version: 0.7.18.post11
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -14,6 +14,7 @@ Requires-Dist: praatio<6.1.0,>=6.0.0
14
14
  Requires-Dist: torch>=2.6.0
15
15
  Requires-Dist: torchaudio
16
16
  Requires-Dist: opencc-python-reimplemented
17
+ Requires-Dist: pydub
17
18
  Requires-Dist: plotly>=5.3.0
18
19
  Requires-Dist: transformers>=4.37
19
20
  Requires-Dist: tokenizers>=0.14.1
@@ -44,6 +45,7 @@ Dynamic: author-email
44
45
  Dynamic: classifier
45
46
  Dynamic: description
46
47
  Dynamic: description-content-type
48
+ Dynamic: license-file
47
49
  Dynamic: provides-extra
48
50
  Dynamic: requires-dist
49
51
  Dynamic: summary
@@ -60,46 +62,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
60
62
 
61
63
  The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
62
64
 
63
- ### Get Python
64
- - We support Python versions 3.9, 3.10, 3.11 and 3.12.
65
- - First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
66
- - To install Python, follow the instructions...
67
- - for macOS
68
- 1. Install Brew: [visit this link](https://brew.sh/)
69
- 2. Install Python and Pipx: execute `brew install python@3.11 pipx`
70
- 3. Copy the pipx path to yours: execute `pipx ensurepath`
71
- - for Windows
72
- 1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
73
- 2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
74
- - your distribution's instructions for Linux
75
-
76
- For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
77
-
78
65
  ### Install and Update the Package
79
- You can get Batchalign from PyPi, and you can update the package in the same way:
80
-
81
- #### macOS
66
+ Batchalign is on PyPI (as `batchalign`). We recommend using uv to install Batchalign:
82
67
 
83
- Since Batchalign is a command line program, we recommend using `pipx`, the newly standard environment-based Python program installer, on macOS:
68
+ #### macOS / Linux
84
69
 
85
70
  ```
86
- pipx install batchalign --python $(brew --prefix)/bin/python3.11
87
- ```
88
-
89
- #### Linux
90
-
91
- ```
92
- pip install -U batchalign
71
+ curl -LsSf https://astral.sh/uv/install.sh | sh
72
+ UV_PYTHON=3.11 uv tool install batchalign
93
73
  ```
94
74
 
95
75
  #### Windows
96
76
 
97
77
  ```
98
- py -m pip install -U batchalign
78
+ powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
79
+ uv tool install batchalign
99
80
  ```
100
81
 
101
- Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
102
-
103
82
  ### Rock and Roll
104
83
  There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
105
84
 
@@ -4,6 +4,7 @@ praatio<6.1.0,>=6.0.0
4
4
  torch>=2.6.0
5
5
  torchaudio
6
6
  opencc-python-reimplemented
7
+ pydub
7
8
  plotly>=5.3.0
8
9
  transformers>=4.37
9
10
  tokenizers>=0.14.1
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.2
1
+ Metadata-Version: 2.4
2
2
  Name: BatchalignHK
3
- Version: 0.7.18.post8
3
+ Version: 0.7.18.post11
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -14,6 +14,7 @@ Requires-Dist: praatio<6.1.0,>=6.0.0
14
14
  Requires-Dist: torch>=2.6.0
15
15
  Requires-Dist: torchaudio
16
16
  Requires-Dist: opencc-python-reimplemented
17
+ Requires-Dist: pydub
17
18
  Requires-Dist: plotly>=5.3.0
18
19
  Requires-Dist: transformers>=4.37
19
20
  Requires-Dist: tokenizers>=0.14.1
@@ -44,6 +45,7 @@ Dynamic: author-email
44
45
  Dynamic: classifier
45
46
  Dynamic: description
46
47
  Dynamic: description-content-type
48
+ Dynamic: license-file
47
49
  Dynamic: provides-extra
48
50
  Dynamic: requires-dist
49
51
  Dynamic: summary
@@ -60,46 +62,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
60
62
 
61
63
  The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
62
64
 
63
- ### Get Python
64
- - We support Python versions 3.9, 3.10, 3.11 and 3.12.
65
- - First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
66
- - To install Python, follow the instructions...
67
- - for macOS
68
- 1. Install Brew: [visit this link](https://brew.sh/)
69
- 2. Install Python and Pipx: execute `brew install python@3.11 pipx`
70
- 3. Copy the pipx path to yours: execute `pipx ensurepath`
71
- - for Windows
72
- 1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
73
- 2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
74
- - your distribution's instructions for Linux
75
-
76
- For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
77
-
78
65
  ### Install and Update the Package
79
- You can get Batchalign from PyPi, and you can update the package in the same way:
80
-
81
- #### macOS
66
+ Batchalign is on PyPI (as `batchalign`). We recommend using uv to install Batchalign:
82
67
 
83
- Since Batchalign is a command line program, we recommend using `pipx`, the newly standard environment-based Python program installer, on macOS:
68
+ #### macOS / Linux
84
69
 
85
70
  ```
86
- pipx install batchalign --python $(brew --prefix)/bin/python3.11
87
- ```
88
-
89
- #### Linux
90
-
91
- ```
92
- pip install -U batchalign
71
+ curl -LsSf https://astral.sh/uv/install.sh | sh
72
+ UV_PYTHON=3.11 uv tool install batchalign
93
73
  ```
94
74
 
95
75
  #### Windows
96
76
 
97
77
  ```
98
- py -m pip install -U batchalign
78
+ powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
79
+ uv tool install batchalign
99
80
  ```
100
81
 
101
- Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
102
-
103
82
  ### Rock and Roll
104
83
  There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
105
84
 
@@ -10,46 +10,23 @@ The TalkBank Project, of which Batchalign is a part, is supported by NIH grant H
10
10
 
11
11
  The following instructions provide a quick start to installing Batchalign. For most users aiming to process CHAT and audio with Batchalign, we recommend more detailed usage instructions: for [usage](https://talkbank.org/info/BA2-usage.pdf) and [human transcript cleanup](https://talkbank.org/info/BA2-cleanup.pdf). The following provides a quick start guide for the program.
12
12
 
13
- ### Get Python
14
- - We support Python versions 3.9, 3.10, 3.11 and 3.12.
15
- - First, check to see if you have Python by running `python`. If it reports any of the versions above, skip the following step.
16
- - To install Python, follow the instructions...
17
- - for macOS
18
- 1. Install Brew: [visit this link](https://brew.sh/)
19
- 2. Install Python and Pipx: execute `brew install python@3.11 pipx`
20
- 3. Copy the pipx path to yours: execute `pipx ensurepath`
21
- - for Windows
22
- 1. Install Python 3.11: [via this link](https://www.python.org/ftp/python/3.11.7/python-3.11.7-amd64.exe)
23
- 2. If later commands report `pip module not found`, [this page may help](https://github.com/TalkBank/batchalign2/wiki/Troubleshooting-Tips#get-pip-on-windows)
24
- - your distribution's instructions for Linux
25
-
26
- For first-time users of Python, note that if you didn't install Python 3.11 (as we recommended above), it may be complex to change Python versions downstream and may cause additional problems. We recommend explicitly installing Python 3.11 by installing it explicitly via specifying a version number as we show above.
27
-
28
13
  ### Install and Update the Package
29
- You can get Batchalign from PyPi, and you can update the package in the same way:
30
-
31
- #### macOS
14
+ Batchalign is on PyPI (as `batchalign`). We recommend using uv to install Batchalign:
32
15
 
33
- Since Batchalign is a command line program, we recommend using `pipx`, the newly standard environment-based Python program installer, on macOS:
16
+ #### macOS / Linux
34
17
 
35
18
  ```
36
- pipx install batchalign --python $(brew --prefix)/bin/python3.11
37
- ```
38
-
39
- #### Linux
40
-
41
- ```
42
- pip install -U batchalign
19
+ curl -LsSf https://astral.sh/uv/install.sh | sh
20
+ UV_PYTHON=3.11 uv tool install batchalign
43
21
  ```
44
22
 
45
23
  #### Windows
46
24
 
47
25
  ```
48
- py -m pip install -U batchalign
26
+ powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex"
27
+ uv tool install batchalign
49
28
  ```
50
29
 
51
- Note that if your system reports `pip: command not found`, replace every use of `pip` in the instructions with `pip3` and try again.
52
-
53
30
  ### Rock and Roll
54
31
  There are two main ways of interacting with Batchalign. Batchalign can be used as a program to batch-process CHAT (hence the name), or as a Python LSA library.
55
32
 
@@ -13,6 +13,7 @@ resolver = {
13
13
  "whisper": {
14
14
  'eng': ("talkbank/CHATWhisper-en-large-v1", "openai/whisper-large-v2"),
15
15
  'yue': ("alvanlii/whisper-small-cantonese", "alvanlii/whisper-small-cantonese"),
16
+ "heb": ("ivrit-ai/whisper-large-v3", "ivrit-ai/whisper-large-v3")
16
17
  }
17
18
  }
18
19
 
@@ -80,7 +80,7 @@ class Wave2VecFAEngine(BatchalignEngine):
80
80
  # breakpoint()
81
81
  if (grp[-1][1][1] - grp[0][1][0]) < 20*1000:
82
82
  res = self.__wav2vec(audio=f.chunk(grp[0][1][0], grp[-1][1][1]), text=transcript)
83
- except (IndexError, RuntimeError) as e:
83
+ except:
84
84
  # utterance contains nothing
85
85
  continue
86
86
 
@@ -0,0 +1,3 @@
1
+ 0.7.18-post.11
2
+ April 30th, 2025
3
+ align
@@ -33,6 +33,10 @@ setup(
33
33
  "torchaudio",
34
34
  # "pyAudioAnalysis",
35
35
  "opencc-python-reimplemented",
36
+ # "hmmlearn==0.3.0",
37
+ # "eyed3",
38
+ "pydub",
39
+ # "imblearn",
36
40
  "plotly>=5.3.0",
37
41
  "transformers>=4.37",
38
42
  "tokenizers>=0.14.1",
@@ -1,3 +0,0 @@
1
- 0.7.18-post.8
2
- April 27th, 2025
3
- skip multilang