batchalign 0.7.3b17__tar.gz → 0.7.5a1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108)
  1. {batchalign-0.7.3b17/batchalign.egg-info → batchalign-0.7.5a1}/PKG-INFO +4 -4
  2. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/cli/cli.py +18 -13
  3. batchalign-0.7.5a1/batchalign/version +3 -0
  4. {batchalign-0.7.3b17 → batchalign-0.7.5a1/batchalign.egg-info}/PKG-INFO +4 -4
  5. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign.egg-info/requires.txt +3 -3
  6. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/setup.py +3 -3
  7. batchalign-0.7.3b17/batchalign/version +0 -3
  8. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/LICENSE +0 -0
  9. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/MANIFEST.in +0 -0
  10. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/README.md +0 -0
  11. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/__init__.py +0 -0
  12. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/__main__.py +0 -0
  13. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/cli/__init__.py +0 -0
  14. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/cli/dispatch.py +0 -0
  15. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/constants.py +0 -0
  16. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/document.py +0 -0
  17. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/errors.py +0 -0
  18. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/__init__.py +0 -0
  19. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/base.py +0 -0
  20. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/__init__.py +0 -0
  21. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/file.py +0 -0
  22. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/generator.py +0 -0
  23. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/lexer.py +0 -0
  24. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/parser.py +0 -0
  25. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/chat/utils.py +0 -0
  26. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/textgrid/__init__.py +0 -0
  27. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/textgrid/file.py +0 -0
  28. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/textgrid/generator.py +0 -0
  29. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/formats/textgrid/parser.py +0 -0
  30. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/__init__.py +0 -0
  31. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/resolve.py +0 -0
  32. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/speaker/__init__.py +0 -0
  33. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/speaker/config.yaml +0 -0
  34. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/speaker/infer.py +0 -0
  35. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/speaker/utils.py +0 -0
  36. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/training/__init__.py +0 -0
  37. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/training/run.py +0 -0
  38. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/training/utils.py +0 -0
  39. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utils.py +0 -0
  40. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/__init__.py +0 -0
  41. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/dataset.py +0 -0
  42. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/execute.py +0 -0
  43. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/infer.py +0 -0
  44. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/prep.py +0 -0
  45. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/utterance/train.py +0 -0
  46. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/whisper/__init__.py +0 -0
  47. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/whisper/infer_asr.py +0 -0
  48. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/models/whisper/infer_fa.py +0 -0
  49. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/__init__.py +0 -0
  50. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/analysis/__init__.py +0 -0
  51. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/analysis/eval.py +0 -0
  52. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/asr/__init__.py +0 -0
  53. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/asr/rev.py +0 -0
  54. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/asr/utils.py +0 -0
  55. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/asr/whisper.py +0 -0
  56. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/asr/whisperx.py +0 -0
  57. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/base.py +0 -0
  58. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/__init__.py +0 -0
  59. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  60. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  61. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  62. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/retrace.py +0 -0
  63. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  64. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  65. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/cleanup/support/test.test +0 -0
  66. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/dispatch.py +0 -0
  67. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/fa/__init__.py +0 -0
  68. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  69. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  70. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  71. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  72. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  73. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/pipeline.py +0 -0
  74. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/speaker/__init__.py +0 -0
  75. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  76. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utr/__init__.py +0 -0
  77. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utr/rev_utr.py +0 -0
  78. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utr/utils.py +0 -0
  79. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  80. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utterance/__init__.py +0 -0
  81. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/pipelines/utterance/ud_utterance.py +0 -0
  82. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/__init__.py +0 -0
  83. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/conftest.py +0 -0
  84. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  85. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  86. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  87. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  88. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  89. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  90. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  91. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  92. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  93. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  94. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  95. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  96. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/fixures.py +0 -0
  97. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  98. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  99. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/tests/test_document.py +0 -0
  100. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/utils/__init__.py +0 -0
  101. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/utils/config.py +0 -0
  102. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/utils/dp.py +0 -0
  103. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign/utils/utils.py +0 -0
  104. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign.egg-info/SOURCES.txt +0 -0
  105. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign.egg-info/dependency_links.txt +0 -0
  106. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign.egg-info/entry_points.txt +0 -0
  107. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/batchalign.egg-info/top_level.txt +0 -0
  108. {batchalign-0.7.3b17 → batchalign-0.7.5a1}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: batchalign
3
- Version: 0.7.3b17
3
+ Version: 0.7.5a1
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -11,15 +11,15 @@ License-File: LICENSE
11
11
  Requires-Dist: pydantic>=2.4
12
12
  Requires-Dist: nltk>=3.8
13
13
  Requires-Dist: praatio<6.1.0,>=6.0.0
14
- Requires-Dist: torch<2.2.0,>=2.0.1
15
- Requires-Dist: torchaudio<2.2.0,>=2.1.0
14
+ Requires-Dist: torch>=2.0.1
15
+ Requires-Dist: torchaudio>=2.1.0
16
16
  Requires-Dist: pyAudioAnalysis==0.3.14
17
17
  Requires-Dist: hmmlearn==0.3.0
18
18
  Requires-Dist: eyed3~=0.9.7
19
19
  Requires-Dist: pydub<0.26.0,>=0.25.1
20
20
  Requires-Dist: imblearn
21
21
  Requires-Dist: plotly>=5.18.0
22
- Requires-Dist: transformers~=4.37
22
+ Requires-Dist: transformers>=4.37
23
23
  Requires-Dist: tokenizers>=0.14.1
24
24
  Requires-Dist: pycountry>=22.3
25
25
  Requires-Dist: stanza>=1.7
@@ -49,15 +49,7 @@ def common_options(f):
49
49
  click.argument("in_dir",
50
50
  type=click.Path(exists=True, file_okay=False)),
51
51
  click.argument("out_dir",
52
- type=click.Path(exists=True, file_okay=False)),
53
- click.option("--lang",
54
- help="sample language in three-letter ISO 3166-1 alpha-3 code",
55
- show_default=True,
56
- default="eng",
57
- type=str),
58
- click.option("-n", "--num_speakers", type=int,
59
- help="number of speakers in the language sample", default=2),
60
-
52
+ type=click.Path(exists=True, file_okay=False))
61
53
  ]
62
54
 
63
55
  options.reverse()
@@ -115,8 +107,9 @@ batchalign.add_command(train, "models")
115
107
  @common_options
116
108
  @click.option("--whisper/--rev",
117
109
  default=False, help="For utterance timing recovery, OpenAI Whisper (ASR) instead of Rev.AI (default).")
110
+
118
111
  @click.pass_context
119
- def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
112
+ def align(ctx, in_dir, out_dir, whisper, **kwargs):
120
113
  """Align transcripts against corresponding media files."""
121
114
  def loader(file):
122
115
  return CHATFile(path=os.path.abspath(file)).doc
@@ -124,7 +117,7 @@ def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
124
117
  def writer(doc, output):
125
118
  CHATFile(doc=doc).write(output)
126
119
 
127
- _dispatch("align", lang, num_speakers,
120
+ _dispatch("align", "eng", 1,
128
121
  ["cha"], ctx,
129
122
  in_dir, out_dir,
130
123
  loader, writer, C,
@@ -143,6 +136,12 @@ def align(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
143
136
  default=False, help="Perform speaker diarization (this flag is ignored with Rev.AI)")
144
137
  @click.option("--wor/--nowor",
145
138
  default=False, help="Should we write word level alignment line? Default to no.")
139
+ @click.option("--lang",
140
+ help="sample language in three-letter ISO 3166-1 alpha-3 code",
141
+ show_default=True,
142
+ default="eng",
143
+ type=str)
144
+ @click.option("-n", "--num_speakers", type=int, help="number of speakers in the language sample", default=2)
146
145
  @click.pass_context
147
146
  def transcribe(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
148
147
  """Create a transcript from audio files."""
@@ -189,7 +188,7 @@ def transcribe(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
189
188
  file_okay=True, dir_okay=False),
190
189
  help="Comma seperated manual lexicon override")
191
190
  @click.pass_context
192
- def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
191
+ def morphotag(ctx, in_dir, out_dir, **kwargs):
193
192
  """Perform morphosyntactic analysis on transcripts."""
194
193
 
195
194
  def loader(file):
@@ -213,7 +212,7 @@ def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
213
212
  def writer(doc, output):
214
213
  CHATFile(doc=doc, special_mor_=doc.ba_special_.get("special_mor_notation", False)).write(output)
215
214
 
216
- _dispatch("morphotag", lang, num_speakers, ["cha"], ctx,
215
+ _dispatch("morphotag", "eng", 1, ["cha"], ctx,
217
216
  in_dir, out_dir,
218
217
  loader, writer, C)
219
218
 
@@ -222,6 +221,12 @@ def morphotag(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
222
221
 
223
222
  @batchalign.command()
224
223
  @common_options
224
+ @click.option("--lang",
225
+ help="sample language in three-letter ISO 3166-1 alpha-3 code",
226
+ show_default=True,
227
+ default="eng",
228
+ type=str)
229
+ @click.option("-n", "--num_speakers", type=int, help="number of speakers in the language sample", default=2)
225
230
  @click.pass_context
226
231
  def utseg(ctx, in_dir, out_dir, lang, num_speakers, **kwargs):
227
232
  """Perform morphosyntactic analysis on transcripts."""
@@ -0,0 +1,3 @@
1
+ 0.7.5-alpha.1
2
+ September 3rd, 2024
3
+ Removes unneeded options
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: batchalign
3
- Version: 0.7.3b17
3
+ Version: 0.7.5a1
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -11,15 +11,15 @@ License-File: LICENSE
11
11
  Requires-Dist: pydantic>=2.4
12
12
  Requires-Dist: nltk>=3.8
13
13
  Requires-Dist: praatio<6.1.0,>=6.0.0
14
- Requires-Dist: torch<2.2.0,>=2.0.1
15
- Requires-Dist: torchaudio<2.2.0,>=2.1.0
14
+ Requires-Dist: torch>=2.0.1
15
+ Requires-Dist: torchaudio>=2.1.0
16
16
  Requires-Dist: pyAudioAnalysis==0.3.14
17
17
  Requires-Dist: hmmlearn==0.3.0
18
18
  Requires-Dist: eyed3~=0.9.7
19
19
  Requires-Dist: pydub<0.26.0,>=0.25.1
20
20
  Requires-Dist: imblearn
21
21
  Requires-Dist: plotly>=5.18.0
22
- Requires-Dist: transformers~=4.37
22
+ Requires-Dist: transformers>=4.37
23
23
  Requires-Dist: tokenizers>=0.14.1
24
24
  Requires-Dist: pycountry>=22.3
25
25
  Requires-Dist: stanza>=1.7
@@ -1,15 +1,15 @@
1
1
  pydantic>=2.4
2
2
  nltk>=3.8
3
3
  praatio<6.1.0,>=6.0.0
4
- torch<2.2.0,>=2.0.1
5
- torchaudio<2.2.0,>=2.1.0
4
+ torch>=2.0.1
5
+ torchaudio>=2.1.0
6
6
  pyAudioAnalysis==0.3.14
7
7
  hmmlearn==0.3.0
8
8
  eyed3~=0.9.7
9
9
  pydub<0.26.0,>=0.25.1
10
10
  imblearn
11
11
  plotly>=5.18.0
12
- transformers~=4.37
12
+ transformers>=4.37
13
13
  tokenizers>=0.14.1
14
14
  pycountry>=22.3
15
15
  stanza>=1.7
@@ -29,15 +29,15 @@ setup(
29
29
  "pydantic>=2.4",
30
30
  "nltk>=3.8",
31
31
  "praatio>=6.0.0,<6.1.0",
32
- "torch>=2.0.1,<2.2.0",
33
- "torchaudio>=2.1.0,<2.2.0",
32
+ "torch>=2.0.1",
33
+ "torchaudio>=2.1.0",
34
34
  "pyAudioAnalysis==0.3.14",
35
35
  "hmmlearn==0.3.0",
36
36
  "eyed3~=0.9.7",
37
37
  "pydub>=0.25.1,<0.26.0",
38
38
  "imblearn",
39
39
  "plotly>=5.18.0",
40
- "transformers~=4.37",
40
+ "transformers>=4.37",
41
41
  "tokenizers>=0.14.1",
42
42
  "pycountry>=22.3",
43
43
  "stanza>=1.7",
@@ -1,3 +0,0 @@
1
- 0.7.3-beta.17
2
- August 21st, 2024
3
- manual rules with mor
File without changes
File without changes
File without changes
File without changes