batchalign 0.7.22.post9__tar.gz → 0.7.22.post11__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (138) hide show
  1. {batchalign-0.7.22.post9/batchalign.egg-info → batchalign-0.7.22.post11}/PKG-INFO +1 -1
  2. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/__init__.py +15 -0
  3. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/eus.py +31 -0
  4. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/hrv.py +111 -0
  5. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/ind.py +23 -0
  6. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/nld.py +31 -0
  7. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/por.py +41 -0
  8. batchalign-0.7.22.post11/batchalign/pipelines/asr/num2lang/tha.py +23 -0
  9. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/utils.py +5 -0
  10. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/dispatch.py +1 -1
  11. batchalign-0.7.22.post11/batchalign/version +3 -0
  12. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11/batchalign.egg-info}/PKG-INFO +1 -1
  13. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign.egg-info/SOURCES.txt +7 -0
  14. batchalign-0.7.22.post9/batchalign/version +0 -3
  15. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/LICENSE +0 -0
  16. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/MANIFEST.in +0 -0
  17. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/README.md +0 -0
  18. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/__init__.py +0 -0
  19. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/__main__.py +0 -0
  20. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/cli/__init__.py +0 -0
  21. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/cli/cli.py +0 -0
  22. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/cli/dispatch.py +0 -0
  23. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/constants.py +0 -0
  24. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/document.py +0 -0
  25. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/errors.py +0 -0
  26. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/__init__.py +0 -0
  27. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/base.py +0 -0
  28. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/__init__.py +0 -0
  29. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/file.py +0 -0
  30. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/generator.py +0 -0
  31. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/lexer.py +0 -0
  32. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/parser.py +0 -0
  33. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/chat/utils.py +0 -0
  34. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/textgrid/__init__.py +0 -0
  35. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/textgrid/file.py +0 -0
  36. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/textgrid/generator.py +0 -0
  37. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/formats/textgrid/parser.py +0 -0
  38. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/__init__.py +0 -0
  39. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/resolve.py +0 -0
  40. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/speaker/__init__.py +0 -0
  41. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/speaker/config.yaml +0 -0
  42. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/speaker/infer.py +0 -0
  43. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/speaker/utils.py +0 -0
  44. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/training/__init__.py +0 -0
  45. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/training/run.py +0 -0
  46. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/training/utils.py +0 -0
  47. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utils.py +0 -0
  48. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/__init__.py +0 -0
  49. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/cantonese_infer.py +0 -0
  50. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/dataset.py +0 -0
  51. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/execute.py +0 -0
  52. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/infer.py +0 -0
  53. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/prep.py +0 -0
  54. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/utterance/train.py +0 -0
  55. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/wave2vec/__init__.py +0 -0
  56. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/wave2vec/infer_fa.py +0 -0
  57. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/whisper/__init__.py +0 -0
  58. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/whisper/infer_asr.py +0 -0
  59. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/models/whisper/infer_fa.py +0 -0
  60. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/__init__.py +0 -0
  61. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/analysis/__init__.py +0 -0
  62. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/analysis/eval.py +0 -0
  63. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/__init__.py +0 -0
  64. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/num2chinese.py +0 -0
  65. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/oai_whisper.py +0 -0
  66. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/rev.py +0 -0
  67. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/whisper.py +0 -0
  68. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/asr/whisperx.py +0 -0
  69. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/avqi/__init__.py +0 -0
  70. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/avqi/engine.py +0 -0
  71. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/base.py +0 -0
  72. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/__init__.py +0 -0
  73. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  74. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  75. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  76. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/retrace.py +0 -0
  77. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  78. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  79. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/cleanup/support/test.test +0 -0
  80. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/diarization/__init__.py +0 -0
  81. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/diarization/pyannote.py +0 -0
  82. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/fa/__init__.py +0 -0
  83. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/fa/wave2vec_fa.py +0 -0
  84. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  85. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  86. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/coref.py +0 -0
  87. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
  88. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
  89. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
  90. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  91. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  92. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  93. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/opensmile/__init__.py +0 -0
  94. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/opensmile/engine.py +0 -0
  95. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/pipeline.py +0 -0
  96. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/speaker/__init__.py +0 -0
  97. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  98. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/translate/__init__.py +0 -0
  99. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/translate/gtrans.py +0 -0
  100. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/translate/seamless.py +0 -0
  101. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/translate/utils.py +0 -0
  102. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utr/__init__.py +0 -0
  103. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utr/rev_utr.py +0 -0
  104. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utr/utils.py +0 -0
  105. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  106. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utterance/__init__.py +0 -0
  107. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
  108. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/__init__.py +0 -0
  109. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/conftest.py +0 -0
  110. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  111. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  112. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  113. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  114. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  115. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  116. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  117. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  118. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  119. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  120. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  121. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  122. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/fixures.py +0 -0
  123. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  124. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  125. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/tests/test_document.py +0 -0
  126. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/__init__.py +0 -0
  127. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/abbrev.py +0 -0
  128. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/compounds.py +0 -0
  129. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/config.py +0 -0
  130. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/dp.py +0 -0
  131. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/names.py +0 -0
  132. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign/utils/utils.py +0 -0
  133. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign.egg-info/dependency_links.txt +0 -0
  134. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign.egg-info/entry_points.txt +0 -0
  135. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign.egg-info/requires.txt +0 -0
  136. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/batchalign.egg-info/top_level.txt +0 -0
  137. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/setup.cfg +0 -0
  138. {batchalign-0.7.22.post9 → batchalign-0.7.22.post11}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: batchalign
3
- Version: 0.7.22.post9
3
+ Version: 0.7.22.post11
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -0,0 +1,15 @@
1
+ from .eus import EUS
2
+ from .hrv import HRV
3
+ from .nld import NLD
4
+ from .ind import IND
5
+ from .por import POR
6
+ from .tha import THA
7
+
8
+ NUM2LANG = {
9
+ "eus": EUS,
10
+ "hrv": HRV,
11
+ "nld": NLD,
12
+ "ind": IND,
13
+ "por": POR,
14
+ "tha": THA
15
+ }
@@ -0,0 +1,31 @@
1
+ EUS = {
2
+ "1":"bat",
3
+ "2":"bi",
4
+ "3":"hiru",
5
+ "4":"lau",
6
+ "5":"bost",
7
+ "6":"sei",
8
+ "7":"zazpi",
9
+ "8":"zortzi",
10
+ "9":"bederatzi",
11
+ "10":"hamar",
12
+ "11":"hamika",
13
+ "12":"hamabi",
14
+ "13":"hamahiru",
15
+ "14":"hamalau",
16
+ "15":"hamabost",
17
+ "16":"hamasei",
18
+ "17":"hamazazpi",
19
+ "18":"hemezortzi",
20
+ "19":"hemeretzi",
21
+ "20":"hogei",
22
+ "21":"hogeita-bat",
23
+ "22":"hogeita-bi",
24
+ "23":"hogeita-hiru",
25
+ "24":"hogeita-lau",
26
+ "25":"hogeita-bost",
27
+ "26":"hogeita-sei",
28
+ "27":"hogeita-zazpi",
29
+ "28":"hogeita-zortzi",
30
+ "29":"hogeita-bederatzi"
31
+ }
@@ -0,0 +1,111 @@
1
+ HRV = {
2
+ "1": "eins",
3
+ "2": "zwei",
4
+ "3": "drei",
5
+ "4": "vier",
6
+ "5": "fünf",
7
+ "6": "sechs",
8
+ "7": "sieben",
9
+ "8": "acht",
10
+ "9": "neun",
11
+ "10": "zehn",
12
+ "11": "elf",
13
+ "12": "zwölf",
14
+ "13": "dreizehn",
15
+ "14": "vierzehn",
16
+ "15": "fünfzehn",
17
+ "16": "sechzehn",
18
+ "17": "siebzehn",
19
+ "18": "achtzehn",
20
+ "19": "neunzehn",
21
+ "20": "zwanzig",
22
+ "21": "einundzwanzig",
23
+ "22": "zweiundzwanzig",
24
+ "23": "dreiundzwanzig",
25
+ "24": "vierundzwanzig",
26
+ "25": "fünfundzwanzig",
27
+ "26": "sechsundzwanzig",
28
+ "27": "siebenundzwanzig",
29
+ "28": "achtundzwanzig",
30
+ "29": "neunundzwanzig",
31
+ "30": "dreißig",
32
+ "31": "einunddreißig",
33
+ "32": "zweiunddreißig",
34
+ "33": "dreiunddreißig",
35
+ "34": "vierunddreißig",
36
+ "35": "fünfunddreißig",
37
+ "36": "sechsunddreißig",
38
+ "37": "siebenunddreißig",
39
+ "38": "achtunddreißig",
40
+ "39": "neununddreißig",
41
+ "40": "vierzig",
42
+ "41": "einundvierzig",
43
+ "42": "zweiundvierzig",
44
+ "43": "dreiundvierzig",
45
+ "44": "vierundvierzig",
46
+ "45": "fünfundvierzig",
47
+ "46": "sechsundvierzig",
48
+ "47": "siebenundvierzig",
49
+ "48": "achtundvierzig",
50
+ "49": "neunundvierzig",
51
+ "50": "fünfzig",
52
+ "51": "einundfünfzig",
53
+ "52": "zweiundfünfzig",
54
+ "53": "dreiundfünfzig",
55
+ "54": "vierundfünfzig",
56
+ "55": "fünfundfünfzig",
57
+ "56": "sechsundfünfzig",
58
+ "57": "siebenundfünfzig",
59
+ "58": "achtundfünfzig",
60
+ "59": "neunundfünfzig",
61
+ "60": "sechzig",
62
+ "61": "einundsechzig",
63
+ "62": "zweiundsechzig",
64
+ "63": "dreiundsechzig",
65
+ "64": "vierundsechzig",
66
+ "65": "fünfundsechzig",
67
+ "66": "sechsundsechzig",
68
+ "67": "siebenundsechzig",
69
+ "68": "achtundsechzig",
70
+ "69": "neunundsechzig",
71
+ "70": "siebzig",
72
+ "71": "einundsiebzig",
73
+ "72": "zweiundsiebzig",
74
+ "73": "dreiundsiebzig",
75
+ "74": "vierundsiebzig",
76
+ "75": "fünfundsiebzig",
77
+ "76": "sechsundsiebzig",
78
+ "77": "siebenundsiebzig",
79
+ "78": "achtundsiebzig",
80
+ "79": "neunundsiebzig",
81
+ "80": "achtzig",
82
+ "81": "einundachtzig",
83
+ "82": "zweiundachtzig",
84
+ "83": "dreiundachtzig",
85
+ "84": "vierundachtzig",
86
+ "85": "fünfundachtzig",
87
+ "86": "sechsundachtzig",
88
+ "87": "siebenundachtzig",
89
+ "88": "achtundachtzig",
90
+ "89": "neunundachtzig",
91
+ "90": "neunzig",
92
+ "91": "einundneunzig",
93
+ "92": "zweiundneunzig",
94
+ "93": "dreiundneunzig",
95
+ "94": "vierundneunzig",
96
+ "95": "fünfundneunzig",
97
+ "96": "sechsundneunzig",
98
+ "97": "siebenundneunzig",
99
+ "98": "achtundneunzig",
100
+ "99": "neunundneunzig",
101
+ "100": "hundert",
102
+ "200": "zwei-hundert",
103
+ "300": "drei-hundert",
104
+ "400": "vier-hundert",
105
+ "500": "fünf-hundert",
106
+ "600": "sechs-hundert",
107
+ "700": "sieben-hundert",
108
+ "800": "acht-hundert",
109
+ "900": "neun-hundert",
110
+ "1000": "tausend"
111
+ }
@@ -0,0 +1,23 @@
1
+ IND = {
2
+ "1":"satu",
3
+ "2":"dua",
4
+ "3":"tiga",
5
+ "4":"empat",
6
+ "5":"lima",
7
+ "6":"enam",
8
+ "7":"tujuh",
9
+ "8":"delapan",
10
+ "9":"sembilan",
11
+ "10":"sepuluh",
12
+ "11":"sebelas",
13
+ "12":"dua-belas",
14
+ "13":"tiga-belas",
15
+ "14":"empat-belas",
16
+ "15":"lima-belas",
17
+ "16":"enam-belas",
18
+ "17":"tujuh-belas",
19
+ "18":"delapan-belas",
20
+ "19":"sembilan-belas",
21
+ "20":"dua-puluh",
22
+ "21":"dua-puluh-satu"
23
+ }
@@ -0,0 +1,31 @@
1
+ NLD = {
2
+ "1":"een",
3
+ "2":"twee",
4
+ "3":"drie",
5
+ "4":"vier",
6
+ "5":"vijf",
7
+ "6":"zes",
8
+ "7":"zeven",
9
+ "8":"acht",
10
+ "9":"negen",
11
+ "10":"tien",
12
+ "11":"elf",
13
+ "12":"twaalf",
14
+ "13":"dertien",
15
+ "14":"veertien",
16
+ "15":"vijftien",
17
+ "16":"zestien",
18
+ "17":"zeventien",
19
+ "18":"achttien",
20
+ "19":"negentien",
21
+ "20":"twintig",
22
+ "21":"eenentwintig",
23
+ "22":"tweeëntwintig",
24
+ "23":"drieëntwintig",
25
+ "24":"vierentwintig",
26
+ "25":"vijfentwintig",
27
+ "26":"zesentwintig",
28
+ "27":"zevenentwintig",
29
+ "28":"achtentwintig",
30
+ "29":"negenentwintig"
31
+ }
@@ -0,0 +1,41 @@
1
+ POR = {
2
+ "1":"um",
3
+ "2":"dois",
4
+ "3":"três",
5
+ "4":"quatro",
6
+ "5":"cinco",
7
+ "6":"seis",
8
+ "7":"sete",
9
+ "8":"oito",
10
+ "9":"nove",
11
+ "10":"dez",
12
+ "11":"onze",
13
+ "12":"doze",
14
+ "13":"treze",
15
+ "14":"quatorze",
16
+ "15":"quinze",
17
+ "16":"dezesseis",
18
+ "17":"dezessete",
19
+ "18":"dezoito",
20
+ "19":"dezenove",
21
+ "20":"vinte",
22
+ "21":"vinte-e-um",
23
+ "22":"vinte-e-dois",
24
+ "23":"vinte-e-três",
25
+ "24":"vinte-e-quatro",
26
+ "25":"vinte-e-cinco",
27
+ "26":"vinte-e-seis",
28
+ "27":"vinte-e-sete",
29
+ "28":"vinte-e-oito",
30
+ "29":"vinte-e-nove",
31
+ "30":"trinta",
32
+ "40":"quarenta",
33
+ "50":"cinquenta",
34
+ "60":"sessenta",
35
+ "70":"setenta",
36
+ "80":"oitenta",
37
+ "90":"noventa",
38
+ "100":"cem",
39
+ "101":"cento-e-um",
40
+ "121":"cento-e-vinte-e-um"
41
+ }
@@ -0,0 +1,23 @@
1
+ THA = {
2
+ "1":"หนึ่ง",
3
+ "2":"สอง",
4
+ "3":"สาม",
5
+ "4":"สี่",
6
+ "5":"ห้า",
7
+ "6":"หก",
8
+ "7":"เจ็ด",
9
+ "8":"แปด",
10
+ "9":"เก้า",
11
+ "10":"สิบ",
12
+ "11":"สิบเอ็ด",
13
+ "12":"สิบสอง",
14
+ "13":"สิบสาม",
15
+ "14":"สิบสี่",
16
+ "15":"สิบห้า",
17
+ "16":"สิบหก",
18
+ "17":"สิบเจ็ด",
19
+ "18":"สิบแปด",
20
+ "19":"สิบเก้า",
21
+ "20":"ยี่สิบ",
22
+ "21":"ยี่สิบเอ็ด"
23
+ }
@@ -1,6 +1,7 @@
1
1
  import re
2
2
  from batchalign.document import *
3
3
  from batchalign.utils import *
4
+ from batchalign.pipelines.asr.num2lang import NUM2LANG
4
5
 
5
6
  from batchalign.constants import ENDING_PUNCT
6
7
  from batchalign.pipelines.asr.num2chinese import num2chinese
@@ -229,6 +230,10 @@ def process_generation(output, lang="eng", utterance_engine=None):
229
230
  elif lang == "yue":
230
231
  return num2chinese(i, simp=False)
231
232
  else:
233
+ if NUM2LANG.get(lang) is not None:
234
+ n2l = NUM2LANG.get(lang)
235
+ for a,b in list(reversed(n2l.items())):
236
+ i = i.replace(a,b).strip()
232
237
  return i
233
238
  except:
234
239
  return i
@@ -137,7 +137,7 @@ def dispatch_pipeline(pkg_str, lang, num_speakers=None, **arg_overrides):
137
137
  elif engine == "gtrans":
138
138
  engines.append(GoogleTranslateEngine())
139
139
  elif engine == "whisper_oai":
140
- engines.append(OAIWhisperEngine())
140
+ engines.append(OAIWhisperEngine(lang=lang))
141
141
  elif engine == "pyannote":
142
142
  engines.append(PyannoteEngine())
143
143
  elif engine == "opensmile_egemaps":
@@ -0,0 +1,3 @@
1
+ 0.7.22-post.11
2
+ October 26th, 2025
3
+ change numbers
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: batchalign
3
- Version: 0.7.22.post9
3
+ Version: 0.7.22.post11
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -64,6 +64,13 @@ batchalign/pipelines/asr/rev.py
64
64
  batchalign/pipelines/asr/utils.py
65
65
  batchalign/pipelines/asr/whisper.py
66
66
  batchalign/pipelines/asr/whisperx.py
67
+ batchalign/pipelines/asr/num2lang/__init__.py
68
+ batchalign/pipelines/asr/num2lang/eus.py
69
+ batchalign/pipelines/asr/num2lang/hrv.py
70
+ batchalign/pipelines/asr/num2lang/ind.py
71
+ batchalign/pipelines/asr/num2lang/nld.py
72
+ batchalign/pipelines/asr/num2lang/por.py
73
+ batchalign/pipelines/asr/num2lang/tha.py
67
74
  batchalign/pipelines/avqi/__init__.py
68
75
  batchalign/pipelines/avqi/engine.py
69
76
  batchalign/pipelines/cleanup/__init__.py
@@ -1,3 +0,0 @@
1
- 0.7.22-post.9
2
- October 21st, 2025
3
- oai whisper for benchmakring