batchalign 0.7.9.post3__tar.gz → 0.7.10__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (112) hide show
  1. {batchalign-0.7.9.post3/batchalign.egg-info → batchalign-0.7.10}/PKG-INFO +1 -1
  2. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/generator.py +29 -1
  3. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utterance/ud_utterance.py +2 -0
  4. batchalign-0.7.10/batchalign/version +3 -0
  5. {batchalign-0.7.9.post3 → batchalign-0.7.10/batchalign.egg-info}/PKG-INFO +1 -1
  6. batchalign-0.7.9.post3/batchalign/version +0 -3
  7. {batchalign-0.7.9.post3 → batchalign-0.7.10}/LICENSE +0 -0
  8. {batchalign-0.7.9.post3 → batchalign-0.7.10}/MANIFEST.in +0 -0
  9. {batchalign-0.7.9.post3 → batchalign-0.7.10}/README.md +0 -0
  10. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/__init__.py +0 -0
  11. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/__main__.py +0 -0
  12. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/__init__.py +0 -0
  13. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/cli.py +0 -0
  14. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/cli/dispatch.py +0 -0
  15. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/constants.py +0 -0
  16. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/document.py +0 -0
  17. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/errors.py +0 -0
  18. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/__init__.py +0 -0
  19. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/base.py +0 -0
  20. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/__init__.py +0 -0
  21. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/file.py +0 -0
  22. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/lexer.py +0 -0
  23. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/parser.py +0 -0
  24. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/chat/utils.py +0 -0
  25. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/__init__.py +0 -0
  26. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/file.py +0 -0
  27. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/generator.py +0 -0
  28. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/formats/textgrid/parser.py +0 -0
  29. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/__init__.py +0 -0
  30. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/resolve.py +0 -0
  31. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/__init__.py +0 -0
  32. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/config.yaml +0 -0
  33. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/infer.py +0 -0
  34. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/speaker/utils.py +0 -0
  35. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/__init__.py +0 -0
  36. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/run.py +0 -0
  37. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/training/utils.py +0 -0
  38. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utils.py +0 -0
  39. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/__init__.py +0 -0
  40. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/dataset.py +0 -0
  41. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/execute.py +0 -0
  42. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/infer.py +0 -0
  43. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/prep.py +0 -0
  44. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/utterance/train.py +0 -0
  45. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/__init__.py +0 -0
  46. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/infer_asr.py +0 -0
  47. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/models/whisper/infer_fa.py +0 -0
  48. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/__init__.py +0 -0
  49. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/analysis/__init__.py +0 -0
  50. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/analysis/eval.py +0 -0
  51. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/__init__.py +0 -0
  52. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/rev.py +0 -0
  53. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/utils.py +0 -0
  54. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/whisper.py +0 -0
  55. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/asr/whisperx.py +0 -0
  56. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/base.py +0 -0
  57. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/__init__.py +0 -0
  58. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/cleanup.py +0 -0
  59. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/disfluencies.py +0 -0
  60. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/parse_support.py +0 -0
  61. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/retrace.py +0 -0
  62. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/filled_pauses.eng +0 -0
  63. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/replacements.eng +0 -0
  64. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/cleanup/support/test.test +0 -0
  65. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/dispatch.py +0 -0
  66. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/fa/__init__.py +0 -0
  67. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/fa/whisper_fa.py +0 -0
  68. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/__init__.py +0 -0
  69. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/coref.py +0 -0
  70. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/en/irr.py +0 -0
  71. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/apm.py +0 -0
  72. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/apmn.py +0 -0
  73. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/fr/case.py +0 -0
  74. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/ja/verbforms.py +0 -0
  75. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/morphosyntax/ud.py +0 -0
  76. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/pipeline.py +0 -0
  77. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/speaker/__init__.py +0 -0
  78. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/speaker/nemo_speaker.py +0 -0
  79. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/__init__.py +0 -0
  80. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/rev_utr.py +0 -0
  81. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/utils.py +0 -0
  82. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utr/whisper_utr.py +0 -0
  83. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/pipelines/utterance/__init__.py +0 -0
  84. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/__init__.py +0 -0
  85. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/conftest.py +0 -0
  86. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_file.py +0 -0
  87. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_generator.py +0 -0
  88. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_lexer.py +0 -0
  89. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_parser.py +0 -0
  90. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/chat/test_chat_utils.py +0 -0
  91. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/formats/textgrid/test_textgrid.py +0 -0
  92. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/analysis/test_eval.py +0 -0
  93. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_pipeline.py +0 -0
  94. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/asr/test_asr_utils.py +0 -0
  95. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/cleanup/test_disfluency.py +0 -0
  96. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/cleanup/test_parse_support.py +0 -0
  97. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/fa/test_fa_pipeline.py +0 -0
  98. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/fixures.py +0 -0
  99. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/test_pipeline.py +0 -0
  100. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/pipelines/test_pipeline_models.py +0 -0
  101. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/tests/test_document.py +0 -0
  102. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/__init__.py +0 -0
  103. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/config.py +0 -0
  104. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/dp.py +0 -0
  105. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign/utils/utils.py +0 -0
  106. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/SOURCES.txt +0 -0
  107. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/dependency_links.txt +0 -0
  108. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/entry_points.txt +0 -0
  109. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/requires.txt +0 -0
  110. {batchalign-0.7.9.post3 → batchalign-0.7.10}/batchalign.egg-info/top_level.txt +0 -0
  111. {batchalign-0.7.9.post3 → batchalign-0.7.10}/setup.cfg +0 -0
  112. {batchalign-0.7.9.post3 → batchalign-0.7.10}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: batchalign
3
- Version: 0.7.9.post3
3
+ Version: 0.7.10
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -1,5 +1,6 @@
1
1
  from batchalign.document import *
2
2
  from batchalign.constants import *
3
+ import numbers
3
4
 
4
5
  import warnings
5
6
 
@@ -104,6 +105,32 @@ def generate_chat_utterance(utterance: Utterance, special_mor=False, write_wor=T
104
105
 
105
106
  return "\n".join(result)
106
107
 
108
def check_utterances_ordered(doc):
    """Check whether the aligned utterances of a document are in time order.

    Walks ``doc.content`` once and compares the ``(start, end)`` alignment of
    each aligned utterance against the end of the previously accepted one.

    Parameters
    ----------
    doc : Document
        The CHAT document to check.

    Returns
    -------
    bool
        ``False`` as soon as an utterance ends before it starts, or starts
        before the previous aligned utterance ended; ``True`` otherwise
        (including when no utterance carries a usable alignment).
    """

    # End time of the last utterance that passed the checks; -1 means that
    # no aligned utterance has been seen yet.
    previous_end = -1

    for item in doc.content:
        # Non-utterance entries and utterances without alignment carry no
        # timing information, so they cannot break the ordering.
        if not (isinstance(item, Utterance) and item.alignment):
            continue

        start, end = item.alignment

        # isinstance() already yields a bool; comparing that bool to None is
        # always true and would let non-numeric bounds (e.g. None) reach the
        # "<" comparisons below and raise TypeError. Skip such bounds instead.
        if not (isinstance(start, numbers.Number)
                and isinstance(end, numbers.Number)):
            continue

        # Either an inverted interval or an overlap with the previous
        # utterance means the timings are not ordered.
        if end < start or start < previous_end:
            return False

        previous_end = end

    return True
133
+
107
134
  def generate_chat_preamble(doc, birthdays=[]):
108
135
  """Generate header for a Batchalign document.
109
136
 
@@ -124,7 +151,8 @@ def generate_chat_preamble(doc, birthdays=[]):
124
151
  header = []
125
152
  header.append("@Languages:\t"+", ".join(doc.langs))
126
153
  header.append("@Participants:\t"+", ".join([f"{i.id} {i.name}" for i in doc.tiers]))
127
- # header.append("@Options:\tmulti")
154
+ if not check_utterances_ordered(doc):
155
+ header.append("@Options:\tbullets")
128
156
  header.append("\n".join([f"@ID:\t{i.lang}|{i.corpus}|{i.id}|{i.birthday}|{i.additional[0]}|{i.additional[1]}|{i.additional[2]}|{i.name}|{i.additional[3]}|{i.additional[4]}|" for i in doc.tiers]))
129
157
  for i in birthdays:
130
158
  header.append(f"@{i.id}:\t{i.content}")
@@ -294,6 +294,8 @@ class StanzaUtteranceEngine(BatchalignEngine):
294
294
  contents.append(i)
295
295
  continue
296
296
 
297
+ if len(i.content) == 0:
298
+ continue
297
299
  new_uts = process_ut(i, nlp)
298
300
  contents += new_uts
299
301
 
@@ -0,0 +1,3 @@
1
+ 0.7.10
2
+ January 20th, 2025
3
+ insert options multi automatically
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: batchalign
3
- Version: 0.7.9.post3
3
+ Version: 0.7.10
4
4
  Summary: Python Speech Language Sample Analysis
5
5
  Author: Brian MacWhinney, Houjun Liu
6
6
  Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -1,3 +0,0 @@
1
- 0.7.9.post.3
2
- January 14th, 2025
3
- fix croatian
File without changes
File without changes
File without changes
File without changes