nkululeko 0.93.13__tar.gz → 0.93.14__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {nkululeko-0.93.13 → nkululeko-0.93.14}/CHANGELOG.md +4 -0
- {nkululeko-0.93.13/nkululeko.egg-info → nkululeko-0.93.14}/PKG-INFO +1 -1
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/constants.py +1 -1
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/data/dataset_csv.py +5 -4
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/plots.py +12 -3
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/utils/stats.py +11 -9
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/utils/util.py +15 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14/nkululeko.egg-info}/PKG-INFO +1 -1
- {nkululeko-0.93.13 → nkululeko-0.93.14}/LICENSE +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/README.md +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/aesdd/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/ased/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/asvp-esd/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/baved/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/cafe/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/clac/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/cmu-mosei/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/demos/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/ekorpus/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emns/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emofilm/convert_to_16k.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emofilm/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emorynlp/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emov-db/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emovo/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/emozionalmente/create.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/enterface/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/esd/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/gerparas/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/iemocap/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/jl/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/jtes/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/meld/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/mesd/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/mess/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/mlendsnd/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/msp-improv/process_database2.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/msp-podcast/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/oreau2/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/portuguese/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/ravdess/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/ravdess/process_database_speaker.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/savee/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/shemo/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/subesco/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/tess/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/thorsten-emotional/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/urdu/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/data/vivae/process_database.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/docs/source/conf.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/meta/demos/demo_best_model.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/meta/demos/my_experiment.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/meta/demos/my_experiment_local.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/meta/demos/plot_faster_anim.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/aug_train.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augment.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augmenting/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augmenting/augmenter.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augmenting/randomsplicer.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augmenting/randomsplicing.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/augmenting/resampler.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_age.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_arousal.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_dominance.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_gender.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_mos.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_pesq.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_sdr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_sid.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_snr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_stoi.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/ap_valence.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/autopredict/estimate_snr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/cacheddataset.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/data/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/data/dataset.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/demo-ft.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/demo.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/demo_feats.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/demo_predictor.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/ensemble.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/experiment.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/explore.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/export.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_agender.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_agender_agender.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_analyser.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_ast.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_auddim.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_audmodel.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_clap.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_hubert.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_import.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_mld.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_mos.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_opensmile.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_oxbow.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_praat.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_snr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_spectra.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_spkrec.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_squim.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_trill.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_wav2vec2.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_wavlm.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feats_whisper.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/featureset.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/feinberg_praat.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/transformer_feature_extractor.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feature_extractor.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/file_checker.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/filter_data.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/fixedsegment.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/glob_conf.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/losses/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/losses/loss_ccc.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/losses/loss_softf1loss.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/modelrunner.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_bayes.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_cnn.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_gmm.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_knn.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_knn_reg.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_lin_reg.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_mlp.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_mlp_regression.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_svm.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_svr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_tree.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_tree_reg.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_tuned.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_xgb.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/models/model_xgr.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/multidb.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/nkuluflag.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/nkululeko.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/predict.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/defines.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/latex_writer.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/report.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/report_item.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/reporter.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/reporting/result.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/resample.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/runmanager.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/scaler.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/segment.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/segmenting/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/segmenting/seg_inaspeechsegmenter.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/segmenting/seg_pyannote.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/segmenting/seg_silero.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/syllable_nuclei.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/test.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/test_predictor.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/test_pretrain.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/utils/__init__.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/utils/files.py +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko.egg-info/SOURCES.txt +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko.egg-info/dependency_links.txt +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko.egg-info/entry_points.txt +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko.egg-info/requires.txt +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko.egg-info/top_level.txt +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/pyproject.toml +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/setup.cfg +0 -0
- {nkululeko-0.93.13 → nkululeko-0.93.14}/setup.py +0 -0
@@ -1,2 +1,2 @@
|
|
1
|
-
VERSION="0.93.13"
|
1
|
+
VERSION="0.93.14"
|
2
2
|
SAMPLING_RATE = 16000
|
@@ -3,19 +3,20 @@ import ast
|
|
3
3
|
import os
|
4
4
|
import os.path
|
5
5
|
|
6
|
-
import audformat.utils
|
7
6
|
import pandas as pd
|
8
7
|
|
9
|
-
import
|
8
|
+
import audformat.utils
|
9
|
+
|
10
10
|
from nkululeko.data.dataset import Dataset
|
11
|
+
import nkululeko.glob_conf as glob_conf
|
11
12
|
from nkululeko.reporting.report_item import ReportItem
|
12
13
|
|
13
14
|
|
14
15
|
class Dataset_CSV(Dataset):
|
15
|
-
"""Class to represent datasets stored as a csv file"""
|
16
|
+
"""Class to represent datasets stored as a csv file."""
|
16
17
|
|
17
18
|
def load(self):
|
18
|
-
"""Load the dataframe with files, speakers and task labels"""
|
19
|
+
"""Load the dataframe with files, speakers and task labels."""
|
19
20
|
self.util.debug(f"loading {self.name}")
|
20
21
|
self.got_target, self.got_speaker, self.got_gender = False, False, False
|
21
22
|
data_file = self.util.config_val_data(self.name, "", "")
|
@@ -24,8 +24,10 @@ class Plots:
|
|
24
24
|
self.format = self.util.config_val("PLOT", "format", "png")
|
25
25
|
self.target = self.util.config_val("DATA", "target", "emotion")
|
26
26
|
self.with_ccc = eval(self.util.config_val("PLOT", "ccc", "False"))
|
27
|
+
self.type_s = "samples"
|
27
28
|
|
28
29
|
def plot_distributions_speaker(self, df):
|
30
|
+
self.type_s = "speaker"
|
29
31
|
df_speakers = pd.DataFrame()
|
30
32
|
pd.options.mode.chained_assignment = None # default='warn'
|
31
33
|
for s in df.speaker.unique():
|
@@ -301,11 +303,18 @@ class Plots:
|
|
301
303
|
plot_df = plot_df.rename(columns={cont_col: self.target})
|
302
304
|
cont_col = self.target
|
303
305
|
dist_type = self.util.config_val("EXPL", "dist_type", "kde")
|
304
|
-
|
306
|
+
max_cat, cat_str, effect_results = su.get_effect_size(
|
307
|
+
plot_df, cat_col, cont_col
|
308
|
+
)
|
309
|
+
self.util.debug(effect_results)
|
310
|
+
self.util.print_results_to_store(
|
311
|
+
f"cohens-d_{self.type_s}", str(effect_results) + "\n"
|
312
|
+
)
|
313
|
+
es = effect_results[max_cat]
|
305
314
|
model_type = self.util.get_model_type()
|
306
315
|
if dist_type == "hist" and model_type != "tree":
|
307
316
|
ax = sns.histplot(plot_df, x=cont_col, hue=cat_col, kde=True)
|
308
|
-
caption = f"{ylab} {plot_df.shape[0]}. {cat_str} ({
|
317
|
+
caption = f"{ylab} {plot_df.shape[0]}. {cat_str} ({max_cat}):" f" {es}"
|
309
318
|
ax.set_title(caption)
|
310
319
|
ax.set_xlabel(f"{cont_col}")
|
311
320
|
ax.set_ylabel(f"number of {ylab}")
|
@@ -319,7 +328,7 @@ class Plots:
|
|
319
328
|
warn_singular=False,
|
320
329
|
)
|
321
330
|
ax.set(xlabel=f"{cont_col}")
|
322
|
-
caption = f"{ylab} {plot_df.shape[0]}. {cat_str} ({
|
331
|
+
caption = f"{ylab} {plot_df.shape[0]}. {cat_str} ({max_cat}):" f" {es}"
|
323
332
|
ax.figure.suptitle(caption)
|
324
333
|
return ax, caption
|
325
334
|
|
@@ -1,7 +1,8 @@
|
|
1
|
-
import math
|
2
1
|
from itertools import combinations
|
2
|
+
import math
|
3
3
|
|
4
4
|
import numpy as np
|
5
|
+
import pandas as pd
|
5
6
|
|
6
7
|
|
7
8
|
def check_na(a):
|
@@ -14,9 +15,8 @@ def check_na(a):
|
|
14
15
|
return a
|
15
16
|
|
16
17
|
|
17
|
-
def cohen_d(d1, d2):
|
18
|
-
"""
|
19
|
-
Compute Cohen's d from two distributions of real valued arrays.
|
18
|
+
def cohen_d(d1: np.array, d2: np.array) -> float:
|
19
|
+
"""Compute Cohen's d from two distributions of real valued arrays.
|
20
20
|
|
21
21
|
Args:
|
22
22
|
d1: one array
|
@@ -50,7 +50,9 @@ def all_combinations(items_list):
|
|
50
50
|
return result
|
51
51
|
|
52
52
|
|
53
|
-
def get_effect_size(df, target, variable):
|
53
|
+
def get_effect_size(
|
54
|
+
df: pd.DataFrame, target: str, variable: str
|
55
|
+
) -> tuple[str, str, dict]:
|
54
56
|
"""Get the effect size as Cohen's D.
|
55
57
|
|
56
58
|
Effect size is computed from a real numbered variable on a categorical target.
|
@@ -68,10 +70,10 @@ def get_effect_size(df, target, variable):
|
|
68
70
|
for c in categories:
|
69
71
|
cats[c] = df[df[target] == c][variable].values
|
70
72
|
combos = all_combinations(categories)
|
71
|
-
results = {}
|
73
|
+
results = {categories[0]: 0}
|
72
74
|
if len(categories) == 1:
|
73
75
|
cat_s = cohens_D_to_string(0)
|
74
|
-
return categories[0], cat_s,
|
76
|
+
return categories[0], cat_s, results
|
75
77
|
else:
|
76
78
|
for combo in combos:
|
77
79
|
one = combo[0]
|
@@ -79,10 +81,10 @@ def get_effect_size(df, target, variable):
|
|
79
81
|
results[f"{one}-{other}"] = cohen_d(cats[one], cats[other])
|
80
82
|
max_cat = max(results, key=results.get)
|
81
83
|
cat_s = cohens_D_to_string(float(results[max_cat]))
|
82
|
-
return max_cat, cat_s, results
|
84
|
+
return max_cat, cat_s, results
|
83
85
|
|
84
86
|
|
85
|
-
def cohens_D_to_string(val):
|
87
|
+
def cohens_D_to_string(val: float) -> str:
|
86
88
|
if val < 0.2:
|
87
89
|
rval = "no effect"
|
88
90
|
elif val < 0.2:
|
@@ -160,6 +160,21 @@ class Util:
|
|
160
160
|
pred_name = self.get_model_description()
|
161
161
|
return f"{results_dir}/pred_{target}_{pred_name}.csv"
|
162
162
|
|
163
|
+
def print_results_to_store(self, name: str, contents: str) -> str:
|
164
|
+
"""Write contents to a result file.
|
165
|
+
|
166
|
+
Args:
|
167
|
+
name (str): the (sub) name of the file_
|
168
|
+
|
169
|
+
Returns:
|
170
|
+
str: The path to the file
|
171
|
+
"""
|
172
|
+
results_dir = self.get_path("res_dir")
|
173
|
+
pred_name = self.get_model_description()
|
174
|
+
path = os.path.join(results_dir, f"{name}_{pred_name}.txt")
|
175
|
+
with open(path, "a") as f:
|
176
|
+
f.write(contents)
|
177
|
+
|
163
178
|
def is_categorical(self, pd_series):
|
164
179
|
"""Check if a dataframe column is categorical."""
|
165
180
|
return pd_series.dtype.name == "object" or isinstance(
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{nkululeko-0.93.13 → nkululeko-0.93.14}/nkululeko/feat_extract/transformer_feature_extractor.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|