PyPI - nkululeko - Versions diffs - 0.45.0__py3-none-any.whl → 0.45.2__py3-none-any.whl - Mend

nkululeko 0.45.0__py3-none-any.whl → 0.45.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

nkululeko/constants.py CHANGED Viewed

	@@ -1 +1 @@
1	- VERSION = '0.45.0'
1	+ VERSION = '0.45.2'

nkululeko/experiment.py CHANGED Viewed

@@ -247,17 +247,20 @@ class Experiment:
     def plot_distribution(self):
         """Plot the distribution of samples and speaker per target class and biological sex"""
         plot = Plots()
-        if self.util.exp_is_classification():
-            # self.df_train['labels'] = self.label_encoder.inverse_transform(self.df_train[self.target])
-            # if self.df_test.is_labeled:
-            #     self.df_test['labels'] = self.label_encoder.inverse_transform(self.df_test[self.target])
-            if self.df_test.shape[0] > 0:
-                plot.describe_df('dev_set', self.df_test, self.target, f'test_distplot')
-            plot.describe_df('train_set', self.df_train, self.target, f'train_distplot')
+        sample_selection = self.util.config_val('EXPL', 'sample_selection', 'all')
+        if sample_selection=='all':
+            df_labels = pd.concat([self.df_train, self.df_test])
+            self.util.copy_flags(self.df_train, df_labels)
+        elif sample_selection=='train':
+            df_labels = self.df_train
+            self.util.copy_flags(self.df_train, df_labels)
+        elif sample_selection=='test':
+            df_labels = self.df_test
+            self.util.copy_flags(self.df_test, df_labels)
         else:
-            if self.df_test.shape[0] > 0:
-                plot.describe_df('dev_set', self.df_test, self.target, f'test_distplot')
-            plot.describe_df('train_set', self.df_train, self.target, f'train_distplot')
+            self.util.error(f'unkown sample selection specifier {sample_selection}, should be [all | train | test]')
+        plot.describe_df(f'{sample_selection}_set', df_labels, self.target, f'{sample_selection}_distplot')
     def extract_test_feats(self):
         self.feats_test = pd.DataFrame()
@@ -303,7 +306,7 @@ class Experiment:
     #     self.df_train = self.df_train.append(df_train_aug)
-    def analyse_features(self):
+    def analyse_features(self, needs_feats):
         """
         Do a feature exploration
@@ -311,7 +314,8 @@ class Experiment:
         if self.util.config_val('EXPL', 'value_counts', False):
             self.plot_distribution()
+        if not needs_feats:
+            return
         sample_selection = self.util.config_val('EXPL', 'sample_selection', 'False')
         if sample_selection=='all':
             df_feats = pd.concat([self.feats_train, self.feats_test])
@@ -325,7 +329,7 @@ class Experiment:
         elif sample_selection=='False':
             pass
         else:
-            self.util.error(f'unkown feature_distribution specifier {sample_selection}, should be [all | train | test]')
+            self.util.error(f'unkown sample selection specifier {sample_selection}, should be [all | train | test]')
         if sample_selection in ('all', 'train', 'test'):
             feat_analyser = FeatureAnalyser(sample_selection, df_labels, df_feats)
             feat_analyser.analyse()
@@ -336,8 +340,8 @@ class Experiment:
             scatters = ast.literal_eval(glob_conf.config['EXPL']['scatter'])
             if self.util.exp_is_classification():
                 plots = Plots()
-                all_feats =self.feats_train.append(self.feats_test)
-                all_labels = self.df_train['class_label'].append(self.df_test['class_label'])
+                all_feats = pd.concat([self.feats_train, self.feats_test])
+                all_labels = pd.concat([self.df_train['class_label'], self.df_test['class_label']])
                 for scatter in scatters:
                     plots.scatter_plot(all_feats, all_labels, scatter)
             else:

nkululeko/explore.py CHANGED Viewed

@@ -42,12 +42,13 @@ def main(src_dir):
     scatter = eval(util.config_val('EXPL', 'scatter', 'False'))
     model_type = util.config_val('EXPL', 'model', False)
     plot_tree = eval(util.config_val('EXPL', 'plot_tree', 'False'))
+    needs_feats = False
     if plot_feats or tsne or scatter or model_type or plot_tree:
         # these investigations need features to explore
         expr.extract_feats()
+        needs_feats = True
     # explore
-    expr.analyse_features()
+    expr.analyse_features(needs_feats)
     print('DONE')

nkululeko/util.py CHANGED Viewed

@@ -226,4 +226,9 @@ class Util:
         elif format == 'csv':
             return audformat.utils.read_csv(name)
         else:
-            self.error(f'unkown store format: {format}')
+            self.error(f'unkown store format: {format}')
+    def copy_flags(self, df_source, df_target):
+        df_target.is_labeled = df_source.is_labeled
+        df_target.got_gender = df_source.got_gender
+        df_target.got_speaker = df_source.got_speaker

{nkululeko-0.45.0.dist-info → nkululeko-0.45.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: nkululeko
-Version: 0.45.0
+Version: 0.45.2
 Summary: Machine learning audio prediction experiments based on templates
 Home-page: https://github.com/felixbur/nkululeko
 Author: Felix Burkhardt
@@ -148,7 +148,6 @@ There's my [blog](http://blog.syntheticspeech.de/?s=nkululeko) with tutorials:
 * [Combine feature sets](http://blog.syntheticspeech.de/2022/06/30/how-to-combine-feature-sets-with-nkululeko/)
 * [Classifying continuous variables](http://blog.syntheticspeech.de/2022/01/26/nkululeko-classifying-continuous-variables/)
 * [Try out / demo a trained model](http://blog.syntheticspeech.de/2022/01/24/nkululeko-try-out-demo-a-trained-model/)
-* [Plot distributions of feature values](http://blog.syntheticspeech.de/2023/02/16/nkululeko-how-to-plot-distributions-of-feature-values/)
 * [Perform cross database experiments](http://blog.syntheticspeech.de/2021/10/05/nkululeko-perform-cross-database-experiments/)
 * [Meta parameter optimization](http://blog.syntheticspeech.de/2021/09/03/perform-optimization-with-nkululeko/)
 * [How to set up wav2vec embedding](http://blog.syntheticspeech.de/2021/12/03/how-to-set-up-wav2vec-embedding-for-nkululeko/)
@@ -242,6 +241,13 @@ Version 0.44.1
 * bugfixing: feature importance: https://github.com/felixbur/nkululeko/issues/23
 * bugfixing: loading csv database with filewise index https://github.com/felixbur/nkululeko/issues/24
+Version 0.45.2
+--------------
+* added sample_selection for sample distribution plots
+Version 0.45.1
+--------------
+* fixed dataframe.append bug
 Version 0.45.0
 --------------

{nkululeko-0.45.0.dist-info → nkululeko-0.45.2.dist-info}/RECORD RENAMED Viewed

@@ -3,14 +3,14 @@ nkululeko/augment.py,sha256=J-HxHKU7u1xZdIiVw_abYVYWOUmZI84HMQNQpcoYk9s,1385
 nkululeko/augmenter.py,sha256=whDW3mnda33Wl9TUk2yG_My6507PFCqCzBgy0027Q2c,2399
 nkululeko/balancer.py,sha256=64ftZN68sMDfkvuovCDHpAHmSJgCO6Kdk9bwmpSisec,12
 nkululeko/cacheddataset.py,sha256=bSJ_SDg7TxL89YL_pJXp-sFvdUXJtHuBTd5KSTE4AkQ,955
-nkululeko/constants.py,sha256=DvIzFa8FFrnFyfxPyiG3RFaXtX4c_fNT94jB-Kwoa-M,19
+nkululeko/constants.py,sha256=UCi6ILbrogDPyhI2hfa7nLbmAUE0U_qAdhqXFjpYGkI,19
 nkululeko/dataset.py,sha256=BRjWXtg5FWfg-mhBQABStgSB8bUj67VAl9h1Zdd5U0Q,21627
 nkululeko/dataset_csv.py,sha256=vWhs72Nc5kDDbPw90EIdAlZpX9VUxreFp509gqmOB6M,1908
 nkululeko/dataset_ravdess.py,sha256=pTt98sr4_egdUCv2fWepkZTlkQ6x3A2YshO_n302DNg,537
 nkululeko/demo.py,sha256=Y5CscOdEuUC7V4QBDCem-Rvdc5CYd9zGEl80rqFPQ_M,1789
 nkululeko/demo_predictor.py,sha256=hYuvvKyW-DxbORAq1Y63owqhRgq-Bl8qPOymVISvO7M,2286
-nkululeko/experiment.py,sha256=NwoiyCXQI7RBVzM1-SikIf0LaxyaB6bZvdjJmAF7DEE,20413
-nkululeko/explore.py,sha256=EbNXDzsF6PY1lxljSTvox9LeHiOf4cei5gqppfxQuDQ,1873
+nkululeko/experiment.py,sha256=It6uRIFl3ObAsJscVFS5II3mdVoZG3GC8e2hy_RwOUM,20481
+nkululeko/explore.py,sha256=3mx0iuGbP1w3cteG0DM0QhKZnavOeW5OcV-vzfopVuU,1934
 nkululeko/feats_analyser.py,sha256=3ECjWSbsEarnoyvQf-dsW5ax7gbf7zukf89M_DTB15I,3726
 nkululeko/feats_audmodel.py,sha256=w-cV9Fgk_9wAV5u4ELzxvB9KM06IptPFneDenXXEmV0,2748
 nkululeko/feats_audmodel_dim.py,sha256=kug4wKRiXjceAXyT4XA8WJwXKIFNP-hTy0g5HAELVcQ,2739
@@ -52,9 +52,9 @@ nkululeko/runmanager.py,sha256=No6l8422bAI-GmPchA41KnTIFMFe4J3kdcBlj2tuaiU,6753
 nkululeko/scaler.py,sha256=ryYFGxlBqlAVGM5eaiRQTO4YYfEk8fKpAHePsaz0odk,3013
 nkululeko/test.py,sha256=4u0W18KqfpFY6jHqmTyGTGbC3StkyIOP3mbwe7kFUxU,1340
 nkululeko/test_predictor.py,sha256=4XGFa9AsHNtOkGdY0X23RxPpESyAlICqoXqR-YidHXA,2315
-nkululeko/util.py,sha256=AjVH94iYD9pimBXmZlzCDSJq2ATDsDlFsxyRRlD8n28,8174
-nkululeko-0.45.0.dist-info/LICENSE,sha256=0zGP5B_W35yAcGfHPS18Q2B8UhvLRY3dQq1MhpsJU_U,1076
-nkululeko-0.45.0.dist-info/METADATA,sha256=8yAGOXZAz5bd_T07uWtOMlWgz64DEClInEhHJJGQBuA,17328
-nkululeko-0.45.0.dist-info/WHEEL,sha256=pkctZYzUS4AYVn6dJ-7367OJZivF2e8RA9b_ZBjif18,92
-nkululeko-0.45.0.dist-info/top_level.txt,sha256=DPFNNSHPjUeVKj44dVANAjuVGRCC3MusJ08lc2a8xFA,10
-nkululeko-0.45.0.dist-info/RECORD,,
+nkululeko/util.py,sha256=06iTrqxStMpr0CU1D0neywkfZd-N5SMswOvg0OsKfNY,8381
+nkululeko-0.45.2.dist-info/LICENSE,sha256=0zGP5B_W35yAcGfHPS18Q2B8UhvLRY3dQq1MhpsJU_U,1076
+nkululeko-0.45.2.dist-info/METADATA,sha256=mOe14oOubo5mE7xeZNyxdHQxOwxiNvbW9kNDJ76L4Ks,17334
+nkululeko-0.45.2.dist-info/WHEEL,sha256=pkctZYzUS4AYVn6dJ-7367OJZivF2e8RA9b_ZBjif18,92
+nkululeko-0.45.2.dist-info/top_level.txt,sha256=DPFNNSHPjUeVKj44dVANAjuVGRCC3MusJ08lc2a8xFA,10
+nkululeko-0.45.2.dist-info/RECORD,,

{nkululeko-0.45.0.dist-info → nkululeko-0.45.2.dist-info}/LICENSE RENAMED Viewed

File without changes

{nkululeko-0.45.0.dist-info → nkululeko-0.45.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{nkululeko-0.45.0.dist-info → nkululeko-0.45.2.dist-info}/top_level.txt RENAMED Viewed

File without changes

nkululeko 0.45.0__py3-none-any.whl → 0.45.2__py3-none-any.whl

nkululeko 0.45.0__py3-none-any.whl → 0.45.2__py3-none-any.whl