nkululeko 0.90.4__tar.gz → 0.91.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (171):
  1. {nkululeko-0.90.4 → nkululeko-0.91.0}/CHANGELOG.md +5 -0
  2. {nkululeko-0.90.4/nkululeko.egg-info → nkululeko-0.91.0}/PKG-INFO +6 -1
  3. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/constants.py +1 -1
  4. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/segment.py +2 -32
  5. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/segmenting/seg_silero.py +35 -9
  6. {nkululeko-0.90.4 → nkululeko-0.91.0/nkululeko.egg-info}/PKG-INFO +6 -1
  7. {nkululeko-0.90.4 → nkululeko-0.91.0}/LICENSE +0 -0
  8. {nkululeko-0.90.4 → nkululeko-0.91.0}/README.md +0 -0
  9. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/aesdd/process_database.py +0 -0
  10. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/androids/process_database.py +0 -0
  11. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/ased/process_database.py +0 -0
  12. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/asvp-esd/process_database.py +0 -0
  13. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/baved/process_database.py +0 -0
  14. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/cafe/process_database.py +0 -0
  15. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/clac/process_database.py +0 -0
  16. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/cmu-mosei/process_database.py +0 -0
  17. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/demos/process_database.py +0 -0
  18. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/ekorpus/process_database.py +0 -0
  19. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emns/process_database.py +0 -0
  20. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emofilm/convert_to_16k.py +0 -0
  21. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emofilm/process_database.py +0 -0
  22. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emorynlp/process_database.py +0 -0
  23. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emov-db/process_database.py +0 -0
  24. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emovo/process_database.py +0 -0
  25. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/emozionalmente/create.py +0 -0
  26. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/enterface/process_database.py +0 -0
  27. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/esd/process_database.py +0 -0
  28. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/gerparas/process_database.py +0 -0
  29. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/iemocap/process_database.py +0 -0
  30. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/jl/process_database.py +0 -0
  31. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/jtes/process_database.py +0 -0
  32. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/meld/process_database.py +0 -0
  33. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/mesd/process_database.py +0 -0
  34. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/mess/process_database.py +0 -0
  35. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/mlendsnd/process_database.py +0 -0
  36. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/msp-improv/process_database2.py +0 -0
  37. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/msp-podcast/process_database.py +0 -0
  38. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/oreau2/process_database.py +0 -0
  39. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/portuguese/process_database.py +0 -0
  40. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/ravdess/process_database.py +0 -0
  41. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/ravdess/process_database_speaker.py +0 -0
  42. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/savee/process_database.py +0 -0
  43. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/shemo/process_database.py +0 -0
  44. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/subesco/process_database.py +0 -0
  45. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/tess/process_database.py +0 -0
  46. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/thorsten-emotional/process_database.py +0 -0
  47. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/urdu/process_database.py +0 -0
  48. {nkululeko-0.90.4 → nkululeko-0.91.0}/data/vivae/process_database.py +0 -0
  49. {nkululeko-0.90.4 → nkululeko-0.91.0}/docs/source/conf.py +0 -0
  50. {nkululeko-0.90.4 → nkululeko-0.91.0}/meta/demos/demo_best_model.py +0 -0
  51. {nkululeko-0.90.4 → nkululeko-0.91.0}/meta/demos/my_experiment.py +0 -0
  52. {nkululeko-0.90.4 → nkululeko-0.91.0}/meta/demos/my_experiment_local.py +0 -0
  53. {nkululeko-0.90.4 → nkululeko-0.91.0}/meta/demos/plot_faster_anim.py +0 -0
  54. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/__init__.py +0 -0
  55. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/aug_train.py +0 -0
  56. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augment.py +0 -0
  57. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augmenting/__init__.py +0 -0
  58. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augmenting/augmenter.py +0 -0
  59. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augmenting/randomsplicer.py +0 -0
  60. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augmenting/randomsplicing.py +0 -0
  61. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/augmenting/resampler.py +0 -0
  62. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/__init__.py +0 -0
  63. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_age.py +0 -0
  64. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_arousal.py +0 -0
  65. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_dominance.py +0 -0
  66. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_gender.py +0 -0
  67. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_mos.py +0 -0
  68. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_pesq.py +0 -0
  69. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_sdr.py +0 -0
  70. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_snr.py +0 -0
  71. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_stoi.py +0 -0
  72. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/ap_valence.py +0 -0
  73. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/autopredict/estimate_snr.py +0 -0
  74. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/cacheddataset.py +0 -0
  75. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/data/__init__.py +0 -0
  76. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/data/dataset.py +0 -0
  77. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/data/dataset_csv.py +0 -0
  78. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/demo-ft.py +0 -0
  79. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/demo.py +0 -0
  80. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/demo_feats.py +0 -0
  81. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/demo_predictor.py +0 -0
  82. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/ensemble.py +0 -0
  83. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/experiment.py +0 -0
  84. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/explore.py +0 -0
  85. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/export.py +0 -0
  86. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/__init__.py +0 -0
  87. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_agender.py +0 -0
  88. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_agender_agender.py +0 -0
  89. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_analyser.py +0 -0
  90. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_ast.py +0 -0
  91. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_auddim.py +0 -0
  92. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_audmodel.py +0 -0
  93. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_clap.py +0 -0
  94. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_hubert.py +0 -0
  95. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_import.py +0 -0
  96. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_mld.py +0 -0
  97. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_mos.py +0 -0
  98. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_opensmile.py +0 -0
  99. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_oxbow.py +0 -0
  100. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_praat.py +0 -0
  101. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_snr.py +0 -0
  102. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_spectra.py +0 -0
  103. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_spkrec.py +0 -0
  104. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_squim.py +0 -0
  105. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_trill.py +0 -0
  106. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_wav2vec2.py +0 -0
  107. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_wavlm.py +0 -0
  108. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feats_whisper.py +0 -0
  109. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/featureset.py +0 -0
  110. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/feinberg_praat.py +0 -0
  111. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feat_extract/transformer_feature_extractor.py +0 -0
  112. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/feature_extractor.py +0 -0
  113. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/file_checker.py +0 -0
  114. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/filter_data.py +0 -0
  115. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/fixedsegment.py +0 -0
  116. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/glob_conf.py +0 -0
  117. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/losses/__init__.py +0 -0
  118. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/losses/loss_ccc.py +0 -0
  119. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/losses/loss_softf1loss.py +0 -0
  120. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/modelrunner.py +0 -0
  121. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/__init__.py +0 -0
  122. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model.py +0 -0
  123. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_bayes.py +0 -0
  124. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_cnn.py +0 -0
  125. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_gmm.py +0 -0
  126. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_knn.py +0 -0
  127. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_knn_reg.py +0 -0
  128. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_lin_reg.py +0 -0
  129. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_mlp.py +0 -0
  130. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_mlp_regression.py +0 -0
  131. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_svm.py +0 -0
  132. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_svr.py +0 -0
  133. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_tree.py +0 -0
  134. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_tree_reg.py +0 -0
  135. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_tuned.py +0 -0
  136. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_xgb.py +0 -0
  137. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/models/model_xgr.py +0 -0
  138. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/multidb.py +0 -0
  139. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/nkuluflag.py +0 -0
  140. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/nkululeko.py +0 -0
  141. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/plots.py +0 -0
  142. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/predict.py +0 -0
  143. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/__init__.py +0 -0
  144. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/defines.py +0 -0
  145. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/latex_writer.py +0 -0
  146. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/report.py +0 -0
  147. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/report_item.py +0 -0
  148. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/reporter.py +0 -0
  149. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/reporting/result.py +0 -0
  150. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/resample.py +0 -0
  151. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/runmanager.py +0 -0
  152. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/scaler.py +0 -0
  153. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/segmenting/__init__.py +0 -0
  154. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/segmenting/seg_inaspeechsegmenter.py +0 -0
  155. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/syllable_nuclei.py +0 -0
  156. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/test.py +0 -0
  157. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/test_predictor.py +0 -0
  158. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/test_pretrain.py +0 -0
  159. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/utils/__init__.py +0 -0
  160. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/utils/files.py +0 -0
  161. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/utils/stats.py +0 -0
  162. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko/utils/util.py +0 -0
  163. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko.egg-info/SOURCES.txt +0 -0
  164. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko.egg-info/dependency_links.txt +0 -0
  165. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko.egg-info/entry_points.txt +0 -0
  166. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko.egg-info/requires.txt +0 -0
  167. {nkululeko-0.90.4 → nkululeko-0.91.0}/nkululeko.egg-info/top_level.txt +0 -0
  168. {nkululeko-0.90.4 → nkululeko-0.91.0}/pyproject.toml +0 -0
  169. {nkululeko-0.90.4 → nkululeko-0.91.0}/setup.cfg +0 -0
  170. {nkululeko-0.90.4 → nkululeko-0.91.0}/setup.py +0 -0
  171. {nkululeko-0.90.4 → nkululeko-0.91.0}/venv/bin/activate_this.py +0 -0
@@ -1,6 +1,11 @@
1
1
  Changelog
2
2
  =========
3
3
 
4
+ Version 0.91.0
5
+ --------------
6
+ * fixed duration display in segmentation
7
+ * added possibility to use original segmentations (without max. duration)
8
+
4
9
  Version 0.90.4
5
10
  --------------
6
11
  * added plot format for multidb
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: nkululeko
3
- Version: 0.90.4
3
+ Version: 0.91.0
4
4
  Summary: Machine learning audio prediction experiments based on templates
5
5
  Home-page: https://github.com/felixbur/nkululeko
6
6
  Author: Felix Burkhardt
@@ -356,6 +356,11 @@ F. Burkhardt, Johannes Wagner, Hagen Wierstorf, Florian Eyben and Björn Schulle
356
356
  Changelog
357
357
  =========
358
358
 
359
+ Version 0.91.0
360
+ --------------
361
+ * fixed duration display in segmentation
362
+ * added possibility to use original segmentations (without max. duration)
363
+
359
364
  Version 0.90.4
360
365
  --------------
361
366
  * added plot format for multidb
@@ -1,2 +1,2 @@
1
- VERSION="0.90.4"
1
+ VERSION="0.91.0"
2
2
  SAMPLING_RATE = 16000
@@ -7,9 +7,9 @@ import os
7
7
 
8
8
  import pandas as pd
9
9
 
10
- import nkululeko.glob_conf as glob_conf
11
10
  from nkululeko.constants import VERSION
12
11
  from nkululeko.experiment import Experiment
12
+ import nkululeko.glob_conf as glob_conf
13
13
  from nkululeko.reporting.report_item import ReportItem
14
14
  from nkululeko.utils.util import Util
15
15
 
@@ -78,6 +78,7 @@ def main():
78
78
 
79
79
  if "duration" not in df.columns:
80
80
  df["duration"] = df.index.to_series().map(lambda x: calc_dur(x))
81
+ df_seg["duration"] = df_seg.index.to_series().map(lambda x: calc_dur(x))
81
82
  num_before = df.shape[0]
82
83
  num_after = df_seg.shape[0]
83
84
  # plot distributions
@@ -115,36 +116,5 @@ def main():
115
116
  print("DONE")
116
117
 
117
118
 
118
- def get_segmentation(file):
119
- # print(f'segmenting {file[0]}')
120
- print(".", end="")
121
- wav = read_audio(file[0], sampling_rate=SAMPLING_RATE)
122
- speech_timestamps = get_speech_timestamps(
123
- wav, vad_model, sampling_rate=SAMPLING_RATE
124
- )
125
- files, starts, ends = [], [], []
126
- for entry in speech_timestamps:
127
- start = float(entry["start"] / 1000.0)
128
- end = float(entry["end"] / 1000.0)
129
- files.append(file[0])
130
- starts.append(start)
131
- ends.append(end)
132
- seg_index = segmented_index(files, starts, ends)
133
- return seg_index
134
-
135
-
136
- def segment_dataframe(df):
137
- dfs = []
138
- for file, values in df.iterrows():
139
- index = get_segmentation(file)
140
- dfs.append(
141
- pd.DataFrame(
142
- values.to_dict(),
143
- index,
144
- )
145
- )
146
- return audformat.utils.concat(dfs)
147
-
148
-
149
119
  if __name__ == "__main__":
150
120
  main() # use this if you want to state the config file path on command line
@@ -32,8 +32,30 @@ class Silero_segmenter:
32
32
  self.no_testing = not_testing
33
33
  self.util = Util(has_config=not_testing)
34
34
 
35
- def get_segmentation(self, file):
36
- # print(f'segmenting {file[0]}')
35
+ def get_segmentation_simple(self, file):
36
+ (
37
+ get_speech_timestamps,
38
+ save_audio,
39
+ read_audio,
40
+ VADIterator,
41
+ collect_chunks,
42
+ ) = vad_utils
43
+ SAMPLING_RATE = 16000
44
+ wav = read_audio(file[0], sampling_rate=SAMPLING_RATE)
45
+ speech_timestamps = get_speech_timestamps(
46
+ wav, vad_model, sampling_rate=SAMPLING_RATE
47
+ )
48
+ files, starts, ends = [], [], []
49
+ for entry in speech_timestamps:
50
+ start = float(entry["start"] / SAMPLING_RATE)
51
+ end = float(entry["end"] / SAMPLING_RATE)
52
+ files.append(file[0])
53
+ starts.append(start)
54
+ ends.append(end)
55
+ seg_index = segmented_index(files, starts, ends)
56
+ return seg_index
57
+
58
+ def get_segmentation(self, file, min_length, max_length):
37
59
  (
38
60
  get_speech_timestamps,
39
61
  save_audio,
@@ -42,12 +64,6 @@ class Silero_segmenter:
42
64
  collect_chunks,
43
65
  ) = vad_utils
44
66
  SAMPLING_RATE = 16000
45
- if self.no_testing:
46
- min_length = float(self.util.config_val("SEGMENT", "min_length", 2))
47
- max_length = float(self.util.config_val("SEGMENT", "max_length", 10))
48
- else:
49
- min_length = 2
50
- max_length = 10
51
67
  wav = read_audio(file[0], sampling_rate=SAMPLING_RATE)
52
68
  speech_timestamps = get_speech_timestamps(
53
69
  wav, vad_model, sampling_rate=SAMPLING_RATE
@@ -76,8 +92,18 @@ class Silero_segmenter:
76
92
 
77
93
  def segment_dataframe(self, df):
78
94
  dfs = []
95
+ max_length = eval(self.util.config_val("SEGMENT", "max_length", "False"))
96
+ if max_length:
97
+ if self.no_testing:
98
+ min_length = float(self.util.config_val("SEGMENT", "min_length", 2))
99
+ else:
100
+ min_length = 2
101
+ self.util.debug(f"segmenting with max length: {max_length+min_length}")
79
102
  for file, values in tqdm(df.iterrows()):
80
- index = self.get_segmentation(file)
103
+ if max_length:
104
+ index = self.get_segmentation(file, min_length, max_length)
105
+ else:
106
+ index = self.get_segmentation_simple(file)
81
107
  dfs.append(
82
108
  pd.DataFrame(
83
109
  values.to_dict(),
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: nkululeko
3
- Version: 0.90.4
3
+ Version: 0.91.0
4
4
  Summary: Machine learning audio prediction experiments based on templates
5
5
  Home-page: https://github.com/felixbur/nkululeko
6
6
  Author: Felix Burkhardt
@@ -356,6 +356,11 @@ F. Burkhardt, Johannes Wagner, Hagen Wierstorf, Florian Eyben and Björn Schulle
356
356
  Changelog
357
357
  =========
358
358
 
359
+ Version 0.91.0
360
+ --------------
361
+ * fixed duration display in segmentation
362
+ * added possibility to use original segmentations (without max. duration)
363
+
359
364
  Version 0.90.4
360
365
  --------------
361
366
  * added plot format for multidb
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes