nkululeko-0.84.0-py3-none-any.whl → nkululeko-0.84.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- nkululeko/augmenting/resampler.py +9 -4
- nkululeko/constants.py +1 -1
- nkululeko/models/finetune_model.py +181 -0
- nkululeko/resample.py +76 -54
- nkululeko/test_pretrain.py +188 -11
- nkululeko/utils/util.py +53 -32
- {nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/METADATA +5 -1
- {nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/RECORD +11 -10
- {nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/LICENSE +0 -0
- {nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/WHEEL +0 -0
- {nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/top_level.txt +0 -0
nkululeko/augmenting/resampler.py
CHANGED

@@ -12,16 +12,19 @@ from nkululeko.utils.util import Util
 
 
 class Resampler:
-    def __init__(self, df, not_testing=True):
+    def __init__(self, df, replace, not_testing=True):
         self.SAMPLING_RATE = 16000
         self.df = df
         self.util = Util("resampler", has_config=not_testing)
         self.util.warn(f"all files might be resampled to {self.SAMPLING_RATE}")
         self.not_testing = not_testing
+        self.replace = eval(self.util.config_val(
+            "RESAMPLE", "replace", "False")) if not not_testing else replace
 
     def resample(self):
         files = self.df.index.get_level_values(0).values
-        replace = eval(self.util.config_val("RESAMPLE", "replace", "False"))
+        # replace = eval(self.util.config_val("RESAMPLE", "replace", "False"))
+        replace = self.replace
         if self.not_testing:
             store = self.util.get_path("store")
         else:

@@ -42,7 +45,8 @@ class Resampler:
                 continue
             if org_sr != self.SAMPLING_RATE:
                 self.util.debug(f"resampling {f} (sr = {org_sr})")
-                resampler = torchaudio.transforms.Resample(org_sr, self.SAMPLING_RATE)
+                resampler = torchaudio.transforms.Resample(
+                    org_sr, self.SAMPLING_RATE)
                 signal = resampler(signal)
             if replace:
                 torchaudio.save(

@@ -59,7 +63,8 @@ class Resampler:
             self.df = self.df.set_index(
                 self.df.index.set_levels(new_files, level="file")
             )
-            target_file = self.util.config_val("RESAMPLE", "target", "resampled.csv")
+            target_file = self.util.config_val(
+                "RESAMPLE", "target", "resampled.csv")
             # remove encoded labels
             target = self.util.config_val("DATA", "target", "emotion")
             if "class_label" in self.df.columns:
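Usage note: the constructor now takes the replace decision as an explicit argument instead of always reading it from the config. A minimal sketch of the new call, mirroring how the updated resample.py (below) builds a single-file DataFrame; "my_audio.wav" is a hypothetical file that must exist on disk:

    import pandas as pd
    import audformat
    from nkululeko.augmenting.resampler import Resampler

    # build a segmented audformat index for one (hypothetical) file
    files = pd.Series(["my_audio.wav"])
    df = pd.DataFrame(index=files)
    df.index = audformat.utils.to_segmented_index(df.index, allow_nat=False)

    # replace=True overwrites the original file with the 16 kHz version
    rs = Resampler(df, replace=True, not_testing=True)
    rs.resample()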
nkululeko/constants.py
CHANGED
@@ -1,2 +1,2 @@
-VERSION="0.84.0"
+VERSION="0.84.1"
 SAMPLING_RATE = 16000
nkululeko/models/finetune_model.py
ADDED

@@ -0,0 +1,181 @@
+import dataclasses
+import typing
+
+import torch
+import transformers
+from transformers.models.wav2vec2.modeling_wav2vec2 import (
+    Wav2Vec2PreTrainedModel,
+    Wav2Vec2Model,
+)
+
+
+class ConcordanceCorCoeff(torch.nn.Module):
+
+    def __init__(self):
+
+        super().__init__()
+
+        self.mean = torch.mean
+        self.var = torch.var
+        self.sum = torch.sum
+        self.sqrt = torch.sqrt
+        self.std = torch.std
+
+    def forward(self, prediction, ground_truth):
+
+        mean_gt = self.mean(ground_truth, 0)
+        mean_pred = self.mean(prediction, 0)
+        var_gt = self.var(ground_truth, 0)
+        var_pred = self.var(prediction, 0)
+        v_pred = prediction - mean_pred
+        v_gt = ground_truth - mean_gt
+        cor = self.sum(v_pred * v_gt) / (
+            self.sqrt(self.sum(v_pred**2)) * self.sqrt(self.sum(v_gt**2))
+        )
+        sd_gt = self.std(ground_truth)
+        sd_pred = self.std(prediction)
+        numerator = 2 * cor * sd_gt * sd_pred
+        denominator = var_gt + var_pred + (mean_gt - mean_pred) ** 2
+        ccc = numerator / denominator
+
+        return 1 - ccc
+
+
+@dataclasses.dataclass
+class ModelOutput(transformers.file_utils.ModelOutput):
+
+    logits_cat: torch.FloatTensor = None
+    hidden_states: typing.Tuple[torch.FloatTensor] = None
+    cnn_features: torch.FloatTensor = None
+
+
+class ModelHead(torch.nn.Module):
+
+    def __init__(self, config, num_labels):
+
+        super().__init__()
+
+        self.dense = torch.nn.Linear(config.hidden_size, config.hidden_size)
+        self.dropout = torch.nn.Dropout(config.final_dropout)
+        self.out_proj = torch.nn.Linear(config.hidden_size, num_labels)
+
+    def forward(self, features, **kwargs):
+
+        x = features
+        x = self.dropout(x)
+        x = self.dense(x)
+        x = torch.tanh(x)
+        x = self.dropout(x)
+        x = self.out_proj(x)
+
+        return x
+
+
+class Model(Wav2Vec2PreTrainedModel):
+
+    def __init__(self, config):
+
+        super().__init__(config)
+
+        self.wav2vec2 = Wav2Vec2Model(config)
+        self.cat = ModelHead(config, 2)
+        self.init_weights()
+
+    def freeze_feature_extractor(self):
+        self.wav2vec2.feature_extractor._freeze_parameters()
+
+    def pooling(
+        self,
+        hidden_states,
+        attention_mask,
+    ):
+
+        if attention_mask is None:  # For evaluation with batch_size==1
+            outputs = torch.mean(hidden_states, dim=1)
+        else:
+            attention_mask = self._get_feature_vector_attention_mask(
+                hidden_states.shape[1],
+                attention_mask,
+            )
+            hidden_states = hidden_states * torch.reshape(
+                attention_mask,
+                (-1, attention_mask.shape[-1], 1),
+            )
+            outputs = torch.sum(hidden_states, dim=1)
+            attention_sum = torch.sum(attention_mask, dim=1)
+            outputs = outputs / torch.reshape(attention_sum, (-1, 1))
+
+        return outputs
+
+    def forward(
+        self,
+        input_values,
+        attention_mask=None,
+        labels=None,
+        return_hidden=False,
+    ):
+
+        outputs = self.wav2vec2(
+            input_values,
+            attention_mask=attention_mask,
+        )
+
+        cnn_features = outputs.extract_features
+        hidden_states_framewise = outputs.last_hidden_state
+        hidden_states = self.pooling(
+            hidden_states_framewise,
+            attention_mask,
+        )
+        logits_cat = self.cat(hidden_states)
+
+        if not self.training:
+            logits_cat = torch.softmax(logits_cat, dim=1)
+
+        if return_hidden:
+
+            # make time last axis
+            cnn_features = torch.transpose(cnn_features, 1, 2)
+
+            return ModelOutput(
+                logits_cat=logits_cat,
+                hidden_states=hidden_states,
+                cnn_features=cnn_features,
+            )
+
+        else:
+
+            return ModelOutput(
+                logits_cat=logits_cat,
+            )
+
+
+class ModelWithPreProcessing(Model):
+
+    def __init__(self, config):
+        super().__init__(config)
+
+    def forward(
+        self,
+        input_values,
+    ):
+        # Wav2Vec2FeatureExtractor.zero_mean_unit_var_norm():
+        # normed_slice = (vector - vector[:length].mean()) / np.sqrt(vector[:length].var() + 1e-7)
+
+        mean = input_values.mean()
+
+        # var = input_values.var()
+        # raises: onnxruntime.capi.onnxruntime_pybind11_state.NotImplemented: [ONNXRuntimeError] : 9 : NOT_IMPLEMENTED : Could not find an implementation for the node ReduceProd_3:ReduceProd(11)
+
+        var = torch.square(input_values - mean).mean()
+        input_values = (input_values - mean) / torch.sqrt(var + 1e-7)
+
+        output = super().forward(
+            input_values,
+            return_hidden=True,
+        )
+
+        return (
+            output.hidden_states,
+            output.logits_cat,
+            output.cnn_features,
+        )
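The new Model class loads like any transformers checkpoint. A minimal sketch, assuming the wav2vec2 checkpoint used in test_pretrain.py is available; with attention_mask=None the forward pass mean-pools over time, and in eval mode logits_cat holds softmax scores from the two-unit head:

    import torch
    import transformers
    import nkululeko.models.finetune_model as fm

    model_path = "facebook/wav2vec2-large-robust-ft-swbd-300h"
    config = transformers.AutoConfig.from_pretrained(model_path)
    model = fm.Model.from_pretrained(model_path, config=config)
    model.eval()

    signal = torch.zeros(1, 16000)  # one second of silence at 16 kHz
    with torch.no_grad():
        out = model(signal)         # attention_mask=None -> mean pooling
    print(out.logits_cat.shape)     # torch.Size([1, 2])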
nkululeko/resample.py
CHANGED
@@ -1,78 +1,100 @@
 # resample.py
-# change the sampling rate for train
+# change the sampling rate for audio file or INI file (train, test, all)
 
 import argparse
 import configparser
 import os
-
 import pandas as pd
-
+import audformat
 from nkululeko.augmenting.resampler import Resampler
+from nkululeko.utils.util import Util
+
 from nkululeko.constants import VERSION
 from nkululeko.experiment import Experiment
-from nkululeko.utils.util import Util
 
 
 def main(src_dir):
     parser = argparse.ArgumentParser(
-        description="Call the nkululeko RESAMPLE
-    parser.add_argument("--config", default=
+        description="Call the nkululeko RESAMPLE framework.")
+    parser.add_argument("--config", default=None,
                         help="The base configuration")
+    parser.add_argument("--file", default=None,
+                        help="The input audio file to resample")
+    parser.add_argument("--replace", action="store_true",
+                        help="Replace the original audio file")
+
     args = parser.parse_args()
-    if args.config is not None:
-        config_file = args.config
-    else:
-        config_file = f"{src_dir}/exp.ini"
 
-    # test if the configuration file exists
-    if not os.path.isfile(config_file):
-        print(f"ERROR: no such file: {config_file}")
+    if args.file is None and args.config is None:
+        print("ERROR: Either --file or --config argument must be provided.")
         exit()
 
-    # load one configuration per experiment
-    config = configparser.ConfigParser()
-    config.read(config_file)
-    # create a new experiment
-    expr = Experiment(config)
-    module = "resample"
-    expr.set_module(module)
-    util = Util(module)
-    util.debug(
-        f"running {expr.name} from config {config_file}, nkululeko version"
-        f" {VERSION}"
-    )
-
-    if util.config_val("EXP", "no_warnings", False):
-        import warnings
-
-        warnings.filterwarnings("ignore")
-
-    # load the data
-    expr.load_datasets()
-
-    # split into train and test
-    expr.fill_train_and_tests()
-    util.debug(
-        f"train shape : {expr.df_train.shape}, test shape:{expr.df_test.shape}")
-
-    sample_selection = util.config_val("RESAMPLE", "sample_selection", "all")
-    if sample_selection == "all":
-        df = pd.concat([expr.df_train, expr.df_test])
-    elif sample_selection == "train":
-        df = expr.df_train
-    elif sample_selection == "test":
-        df = expr.df_test
+    if args.file is not None:
+        # Load the audio file into a DataFrame
+        files = pd.Series([args.file])
+        df_sample = pd.DataFrame(index=files)
+        df_sample.index = audformat.utils.to_segmented_index(
+            df_sample.index, allow_nat=False
+        )
+
+        # Resample the audio file
+        util = Util("resampler", has_config=False)
+        util.debug(f"Resampling audio file: {args.file}")
+        rs = Resampler(df_sample, not_testing=True, replace=args.replace)
+        rs.resample()
     else:
-        util.error(
-            f"unknown selection specifier {sample_selection}, should be [all |"
-            " train | test]"
+        # Existing code for handling INI file
+        config_file = args.config
+
+        # Test if the configuration file exists
+        if not os.path.isfile(config_file):
+            print(f"ERROR: no such file: {config_file}")
+            exit()
+
+        # Load one configuration per experiment
+        config = configparser.ConfigParser()
+        config.read(config_file)
+        # Create a new experiment
+        expr = Experiment(config)
+        module = "resample"
+        expr.set_module(module)
+        util = Util(module)
+        util.debug(
+            f"running {expr.name} from config {config_file}, nkululeko version"
+            f" {VERSION}"
         )
-
-    util.debug(f"resampling {sample_selection}: {df.shape[0]} samples")
-    rs = Resampler(df)
-    rs.resample()
+
+        if util.config_val("EXP", "no_warnings", False):
+            import warnings
+            warnings.filterwarnings("ignore")
+
+        # Load the data
+        expr.load_datasets()
+
+        # Split into train and test
+        expr.fill_train_and_tests()
+        util.debug(
+            f"train shape : {expr.df_train.shape}, test shape:{expr.df_test.shape}")
+
+        sample_selection = util.config_val(
+            "RESAMPLE", "sample_selection", "all")
+        if sample_selection == "all":
+            df = pd.concat([expr.df_train, expr.df_test])
+        elif sample_selection == "train":
+            df = expr.df_train
+        elif sample_selection == "test":
+            df = expr.df_test
+        else:
+            util.error(
+                f"unknown selection specifier {sample_selection}, should be [all |"
+                " train | test]"
+            )
+        util.debug(f"resampling {sample_selection}: {df.shape[0]} samples")
+        replace = util.config_val("RESAMPLE", "replace", "False")
+        rs = Resampler(df, replace=replace)
+        rs.resample()
 
 
 if __name__ == "__main__":
    cwd = os.path.dirname(os.path.abspath(__file__))
-    main(cwd)
+    main(cwd)
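The module can now be invoked in two ways; a sketch of both calls, where exp.ini and my_audio.wav are hypothetical paths:

    # resample all data of an experiment, as before
    python -m nkululeko.resample --config exp.ini

    # resample a single audio file, no configuration needed
    python -m nkululeko.resample --file my_audio.wav --replace

Without --replace, the resampler writes new files and stores the updated index (see target_file in the resampler diff above) rather than overwriting the originals.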
nkululeko/test_pretrain.py
CHANGED
@@ -11,11 +11,14 @@ import transformers
 
 import audeer
 import audiofile
+import audmetric
 
 from nkululeko.constants import VERSION
 import nkululeko.experiment as exp
+import nkululeko.models.finetune_model as fm
 import nkululeko.glob_conf as glob_conf
 from nkululeko.utils.util import Util
+import json
 
 
 def doit(config_file):

@@ -50,28 +53,42 @@ def doit(config_file):
     expr.fill_train_and_tests()
     util.debug(f"train shape : {expr.df_train.shape}, test shape:{expr.df_test.shape}")
 
+    log_root = audeer.mkdir("log")
+    model_root = audeer.mkdir("model")
+    torch_root = audeer.path(model_root, "torch")
+
+    metrics_gender = {
+        "UAR": audmetric.unweighted_average_recall,
+        "ACC": audmetric.accuracy,
+    }
+
     sampling_rate = 16000
     max_duration_sec = 8.0
 
     model_path = "facebook/wav2vec2-large-robust-ft-swbd-300h"
     num_layers = None
 
+    os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
+    os.environ["CUDA_VISIBLE_DEVICES"] = "3"
+
     batch_size = 16
     accumulation_steps = 4
-
     # create dataset
 
     dataset = {}
+    target_name = glob_conf.target
     data_sources = {
-        "train": pd.DataFrame(expr.df_train[
-        "dev": pd.DataFrame(expr.df_test[
+        "train": pd.DataFrame(expr.df_train[target_name]),
+        "dev": pd.DataFrame(expr.df_test[target_name]),
     }
 
     for split in ["train", "dev"]:
+        df = data_sources[split]
+        df[target_name] = df[target_name].astype("float")
 
         y = pd.Series(
-            data=
-            index=
+            data=df.itertuples(index=False, name=None),
+            index=df.index,
             dtype=object,
             name="labels",
         )

@@ -80,23 +97,183 @@ def doit(config_file):
         df = y.reset_index()
         df.start = df.start.dt.total_seconds()
         df.end = df.end.dt.total_seconds()
+
         print(f"{split}: {len(df)}")
+
         ds = datasets.Dataset.from_pandas(df)
         dataset[split] = ds
 
-
+    dataset = datasets.DatasetDict(dataset)
+
+    # load pre-trained model
+    le = glob_conf.label_encoder
+    mapping = dict(zip(le.classes_, range(len(le.classes_))))
+    target_mapping = {k: int(v) for k, v in mapping.items()}
+    target_mapping_reverse = {value: key for key, value in target_mapping.items()}
 
     config = transformers.AutoConfig.from_pretrained(
         model_path,
-        num_labels=len(
-        label2id=
-        id2label=
-        finetuning_task=
+        num_labels=len(target_mapping),
+        label2id=target_mapping,
+        id2label=target_mapping_reverse,
+        finetuning_task=target_name,
     )
     if num_layers is not None:
         config.num_hidden_layers = num_layers
     setattr(config, "sampling_rate", sampling_rate)
-    setattr(config, "data",
+    setattr(config, "data", util.get_data_name())
+
+    vocab_dict = {}
+    with open("vocab.json", "w") as vocab_file:
+        json.dump(vocab_dict, vocab_file)
+    tokenizer = transformers.Wav2Vec2CTCTokenizer("./vocab.json")
+    tokenizer.save_pretrained(".")
+
+    feature_extractor = transformers.Wav2Vec2FeatureExtractor(
+        feature_size=1,
+        sampling_rate=16000,
+        padding_value=0.0,
+        do_normalize=True,
+        return_attention_mask=True,
+    )
+    processor = transformers.Wav2Vec2Processor(
+        feature_extractor=feature_extractor,
+        tokenizer=tokenizer,
+    )
+    assert processor.feature_extractor.sampling_rate == sampling_rate
+
+    model = fm.Model.from_pretrained(
+        model_path,
+        config=config,
+    )
+    model.freeze_feature_extractor()
+    model.train()
+
+    # training
+
+    def data_collator(data):
+
+        files = [d["file"] for d in data]
+        starts = [d["start"] for d in data]
+        ends = [d["end"] for d in data]
+        targets = [d["targets"] for d in data]
+
+        signals = []
+        for file, start, end in zip(
+            files,
+            starts,
+            ends,
+        ):
+            offset = start
+            duration = end - offset
+            if max_duration_sec is not None:
+                duration = min(duration, max_duration_sec)
+            signal, _ = audiofile.read(
+                file,
+                offset=offset,
+                duration=duration,
+            )
+            signals.append(signal.squeeze())
+
+        input_values = processor(
+            signals,
+            sampling_rate=sampling_rate,
+            padding=True,
+        )
+        batch = processor.pad(
+            input_values,
+            padding=True,
+            return_tensors="pt",
+        )
+
+        batch["labels"] = torch.tensor(targets)
+
+        return batch
+
+    def compute_metrics(p: transformers.EvalPrediction):
+
+        truth_gender = p.label_ids[:, 0].astype(int)
+        preds = p.predictions
+        preds_gender = np.argmax(preds, axis=1)
+
+        scores = {}
+
+        for name, metric in metrics_gender.items():
+            scores[f"gender-{name}"] = metric(truth_gender, preds_gender)
+
+        scores["combined"] = scores["gender-UAR"]
+
+        return scores
+
+    targets = pd.DataFrame(dataset["train"]["targets"])
+    counts = targets[0].value_counts().sort_index()
+    train_weights = 1 / counts
+    train_weights /= train_weights.sum()
+
+    print(train_weights)
+
+    criterion_gender = torch.nn.CrossEntropyLoss(
+        weight=torch.Tensor(train_weights).to("cuda"),
+    )
+
+    class Trainer(transformers.Trainer):
+
+        def compute_loss(
+            self,
+            model,
+            inputs,
+            return_outputs=False,
+        ):
+
+            targets = inputs.pop("labels").squeeze()
+            targets_gender = targets.type(torch.long)
+
+            outputs = model(**inputs)
+            logits_gender = outputs[0].squeeze()
+
+            loss_gender = criterion_gender(logits_gender, targets_gender)
+
+            loss = loss_gender
+
+            return (loss, outputs) if return_outputs else loss
+
+    num_steps = len(dataset["train"]) // (batch_size * accumulation_steps) // 5
+    num_steps = max(1, num_steps)
+    print(num_steps)
+
+    training_args = transformers.TrainingArguments(
+        output_dir=model_root,
+        logging_dir=log_root,
+        per_device_train_batch_size=batch_size,
+        per_device_eval_batch_size=batch_size,
+        gradient_accumulation_steps=accumulation_steps,
+        evaluation_strategy="steps",
+        num_train_epochs=5.0,
+        fp16=True,
+        save_steps=num_steps,
+        eval_steps=num_steps,
+        logging_steps=num_steps,
+        learning_rate=1e-4,
+        save_total_limit=2,
+        metric_for_best_model="combined",
+        greater_is_better=True,
+        load_best_model_at_end=True,
+        remove_unused_columns=False,
+    )
+
+    trainer = Trainer(
+        model=model,
+        data_collator=data_collator,
+        args=training_args,
+        compute_metrics=compute_metrics,
+        train_dataset=dataset["train"],
+        eval_dataset=dataset["dev"],
+        tokenizer=processor.feature_extractor,
+        callbacks=[transformers.integrations.TensorBoardCallback()],
+    )
+
+    trainer.train()
+    trainer.save_model(torch_root)
 
     print("DONE")
 
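The inverse-frequency class weighting used above can be checked with made-up numbers (not from the diff): with 30 samples of class 0 and 10 of class 1, the rarer class gets three times the weight:

    import pandas as pd

    counts = pd.Series([30, 10])          # targets[0].value_counts().sort_index()
    train_weights = 1 / counts            # [0.0333..., 0.1]
    train_weights /= train_weights.sum()  # [0.25, 0.75], sums to 1
    print(train_weights.tolist())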
nkululeko/utils/util.py
CHANGED
@@ -33,43 +33,58 @@ class Util:
         else:
             self.caller = ""
         if has_config:
-            import nkululeko.glob_conf as glob_conf
-
-            self.config = glob_conf.config
-            self.got_data_roots = self.config_val("DATA", "root_folders", False)
-            if self.got_data_roots:
-                # if there is a global data rootfolder file, read from there
-                if not os.path.isfile(self.got_data_roots):
-                    self.error(f"no such file: {self.got_data_roots}")
-                self.data_roots = configparser.ConfigParser()
-                self.data_roots.read(self.got_data_roots)
+            try:
+                import nkululeko.glob_conf as glob_conf
+                self.config = glob_conf.config
+                self.got_data_roots = self.config_val(
+                    "DATA", "root_folders", False)
+                if self.got_data_roots:
+                    # if there is a global data rootfolder file, read from there
+                    if not os.path.isfile(self.got_data_roots):
+                        self.error(f"no such file: {self.got_data_roots}")
+                    self.data_roots = configparser.ConfigParser()
+                    self.data_roots.read(self.got_data_roots)
+            except (ModuleNotFoundError, AttributeError):
+                self.config = None
+                self.got_data_roots = False
 
     def get_path(self, entry):
         """
         This method allows the user to get the directory path for the given argument.
         """
-        root = os.path.join(self.config["EXP"]["root"], "")
-        name = self.config["EXP"]["name"]
-        try:
-            entryn = self.config["EXP"][entry]
-        except KeyError:
-            # some default values
+        if self.config is None:
+            # If no configuration file is provided, use default paths
             if entry == "fig_dir":
-                entryn = "./images/"
+                dir_name = "./images/"
             elif entry == "res_dir":
-                entryn = "./results/"
+                dir_name = "./results/"
             elif entry == "model_dir":
-                entryn = "./models/"
+                dir_name = "./models/"
             else:
-                entryn = "./store/"
-
-        # Expand image, model and result directories with run index
-        if entry == "fig_dir" or entry == "res_dir" or entry == "model_dir":
-            run = self.config_val("EXP", "run", 0)
-            entryn = entryn + f"run_{run}/"
+                dir_name = "./store/"
+        else:
+            root = os.path.join(self.config["EXP"]["root"], "")
+            name = self.config["EXP"]["name"]
+            try:
+                entryn = self.config["EXP"][entry]
+            except KeyError:
+                # some default values
+                if entry == "fig_dir":
+                    entryn = "./images/"
+                elif entry == "res_dir":
+                    entryn = "./results/"
+                elif entry == "model_dir":
+                    entryn = "./models/"
+                else:
+                    entryn = "./store/"
 
-        dir_name = f"{root}{name}/{entryn}"
+            # Expand image, model and result directories with run index
+            if entry == "fig_dir" or entry == "res_dir" or entry == "model_dir":
+                run = self.config_val("EXP", "run", 0)
+                entryn = entryn + f"run_{run}/"
+
+            dir_name = f"{root}{name}/{entryn}"
 
         audeer.mkdir(dir_name)
         return dir_name

@@ -101,7 +116,8 @@ class Util:
             )
             return default
         if not default in self.stopvals:
-            self.debug(f"value for {key} not found, using default: {default}")
+            self.debug(
+                f"value for {key} not found, using default: {default}")
         return default
 
     def set_config(self, config):

@@ -138,7 +154,8 @@ class Util:
         if len(df) == 0:
             return df
         if not isinstance(df.index, pd.MultiIndex):
-            df.index = audformat.utils.to_segmented_index(df.index, allow_nat=False)
+            df.index = audformat.utils.to_segmented_index(
+                df.index, allow_nat=False)
         return df
 
     def _get_value_descript(self, section, name):

@@ -243,11 +260,14 @@ class Util:
         print(df.head(1))
 
     def config_val(self, section, key, default):
+        if self.config is None:
+            return default
         try:
             return self.config[section][key]
         except KeyError:
-            if not default in self.stopvals:
-                self.debug(
+            if default not in self.stopvals:
+                self.debug(
+                    f"value for {key} not found, using default: {default}")
             return default
 
     def config_val_list(self, section, key, default):

@@ -255,7 +275,8 @@ class Util:
             return ast.literal_eval(self.config[section][key])
         except KeyError:
             if not default in self.stopvals:
-                self.debug(f"value for {key} not found, using default: {default}")
+                self.debug(
+                    f"value for {key} not found, using default: {default}")
             return default
 
     def continuous_to_categorical(self, series):
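A minimal sketch of the new fallback path: when no experiment configuration has been initialised, reading glob_conf.config raises AttributeError, self.config ends up None, and config_val simply returns the supplied default:

    from nkululeko.utils.util import Util

    util = Util("example")  # no nkululeko experiment configured
    print(util.config_val("RESAMPLE", "replace", "False"))  # prints "False"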
{nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/METADATA
CHANGED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: nkululeko
-Version: 0.84.0
+Version: 0.84.1
 Summary: Machine learning audio prediction experiments based on templates
 Home-page: https://github.com/felixbur/nkululeko
 Author: Felix Burkhardt

@@ -333,6 +333,10 @@ F. Burkhardt, Johannes Wagner, Hagen Wierstorf, Florian Eyben and Björn Schulle
 Changelog
 =========
 
+Version 0.84.1
+--------------
+* made resample independent of config file
+
 Version 0.84.0
 --------------
 * added SHAP analysis
{nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/RECORD
CHANGED

@@ -2,7 +2,7 @@ nkululeko/__init__.py,sha256=62f8HiEzJ8rG2QlTFJXUCMpvuH3fKI33DoJSj33mscc,63
 nkululeko/aug_train.py,sha256=YhuZnS_WVWnun9G-M6g5n6rbRxoVREz6Zh7k6qprFNQ,3194
 nkululeko/augment.py,sha256=4MG0apTAG5RgkuJrYEjGgDdbodZWi_HweSPNI1JJ5QA,3051
 nkululeko/cacheddataset.py,sha256=lIJ6hUo5LoxSrzXtWV8mzwO7wRtUETWnOQ4ws2XfL1E,969
-nkululeko/constants.py,sha256=
+nkululeko/constants.py,sha256=31GQXyAN-nrfQCNIt6_aSkBVeE_J3GO-PklTEy6EgBg,39
 nkululeko/demo.py,sha256=8bl15Kitoesnz8oa8yrs52T6YCSOhWbbq9PnZ8Hj6D0,3232
 nkululeko/demo_feats.py,sha256=sAeGFojhEj9WEDFtG3SzPBmyYJWLF2rkbpp65m8Ujo4,2025
 nkululeko/demo_predictor.py,sha256=es56xbT8ifkS_vnrlb5NTZT54gNmeUtNlA4zVA_gnN8,4757

@@ -19,19 +19,19 @@ nkululeko/nkuluflag.py,sha256=PGWSmZz-PiiHLgcZJAoGOI_Y-sZDVI1ksB8p5r7riWM,3725
 nkululeko/nkululeko.py,sha256=Kn3s2E3yyH8cJ7z6lkMxrnqtCxTu7-qfe9Zr_ONTD5g,1968
 nkululeko/plots.py,sha256=nd9tF_61DyAx7oGZF8gTrHXazkgFjFe4eClxu1nQ_XU,23276
 nkululeko/predict.py,sha256=sF091sSSLnEWcISx9ZcULLie3tY5XeFsQJd6b3vrxFg,2409
-nkululeko/resample.py,sha256=
+nkululeko/resample.py,sha256=IPtYqU0nhZ-CqO_O1jJN0EvpfjxHZdFRwdTpEJOVuaQ,3354
 nkululeko/runmanager.py,sha256=eTM1DNQKt1lxYhzt4vZyZluPXW9sWlIJHNQzex4lkJU,7624
 nkululeko/scaler.py,sha256=4nkIqoajkIkuTPK0Z02ifMN_awl6fP_i-GBYdoGYgGM,4101
 nkululeko/segment.py,sha256=YLKckX44tbvTb3LrdgYw9X4guzuF27sutl92z9DkpZU,4835
 nkululeko/syllable_nuclei.py,sha256=Sky-C__MeUDaxqHnDl2TGLLYOYvsahD35TUjWGeG31k,10047
 nkululeko/test.py,sha256=1w624vo5KTzmFC8BUStGlLDmIEAFuJUz7J0W-gp7AxI,1677
 nkululeko/test_predictor.py,sha256=_w5J8CxH6hmW3mLTKbdfmywl5QpdNAnW1Y8TE5GtlfE,3237
-nkululeko/test_pretrain.py,sha256=
+nkululeko/test_pretrain.py,sha256=4b_39l01dySei_e0ys2NKo9Gipf1Fukp1GvhQllFHt8,8131
 nkululeko/augmenting/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nkululeko/augmenting/augmenter.py,sha256=XAt0dpmlnKxqyysqCgV3rcz-pRIvOz7rU7dmGDCVAzs,2905
 nkululeko/augmenting/randomsplicer.py,sha256=Z5rxdKKUpuncLWuTS6xVfVKUeVbeiYU_dLRHQ5fcg4Y,2669
 nkululeko/augmenting/randomsplicing.py,sha256=ldym9vZNsZIU5BAAaJVaOmAgmVHNs4a5i5K3bW-WAQU,1791
-nkululeko/augmenting/resampler.py,sha256=
+nkululeko/augmenting/resampler.py,sha256=nOBsiQpX6p4jXsP7x6wak78F3B5YYYRmC_iHX8iuOXs,3542
 nkululeko/autopredict/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nkululeko/autopredict/ap_age.py,sha256=2Wn5E-Jd49sTn40WqaMcYtUEl4zEq3OY75XmjOpdxsA,1095
 nkululeko/autopredict/ap_arousal.py,sha256=ymt0diu4v1osw3VxJbSglsVKDAJYRzebQ2TTfFMKKxk,1024

@@ -75,6 +75,7 @@ nkululeko/losses/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nkululeko/losses/loss_ccc.py,sha256=NOK0y0fxKUnU161B5geap6Fmn8QzoPl2MqtPiV8IuJE,976
 nkululeko/losses/loss_softf1loss.py,sha256=5gW-PuiqeAZcRgfwjueIOQtMokOjZWgQnVIv59HKTCo,1309
 nkululeko/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+nkululeko/models/finetune_model.py,sha256=bx9NsFpEqf_mBohcrf-9lWjrC4AtOIJ7holNXwaFo2Y,4910
 nkululeko/models/model.py,sha256=fL6LB6I9Oqo_OWUIptqiu6abuxVYYv8bW2a3m4XSLqU,11601
 nkululeko/models/model_bayes.py,sha256=WJFZ8wFKwWATz6MhmjeZIi1Pal1viU549WL_PjXDSy8,406
 nkululeko/models/model_cnn.py,sha256=bJxqwe6FnVR2hFeqN6EXexYGgvKYFED1VOhBXVlLWaE,9954

@@ -103,9 +104,9 @@ nkululeko/segmenting/seg_silero.py,sha256=lLytS38KzARS17omwv8VBw-zz60RVSXGSvZ5Ev
 nkululeko/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nkululeko/utils/files.py,sha256=UiGAtZRWYjHSvlmPaTMtzyNNGE6qaLaxQkybctS7iRM,4021
 nkululeko/utils/stats.py,sha256=1yUq0FTOyqkU8TwUocJRYdJaqMU5SlOBBRUun9STo2M,2829
-nkululeko/utils/util.py,sha256=
-nkululeko-0.84.0.dist-info/LICENSE,sha256=0zGP5B_W35yAcGfHPS18Q2B8UhvLRY3dQq1MhpsJU_U,1076
-nkululeko-0.84.0.dist-info/METADATA,sha256=
-nkululeko-0.84.0.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
-nkululeko-0.84.0.dist-info/top_level.txt,sha256=DPFNNSHPjUeVKj44dVANAjuVGRCC3MusJ08lc2a8xFA,10
-nkululeko-0.84.0.dist-info/RECORD,,
+nkululeko/utils/util.py,sha256=b1IHFucRNuF9Iyv5IJeK4AEg0Rga0xKG80UM5GWWdHA,13816
+nkululeko-0.84.1.dist-info/LICENSE,sha256=0zGP5B_W35yAcGfHPS18Q2B8UhvLRY3dQq1MhpsJU_U,1076
+nkululeko-0.84.1.dist-info/METADATA,sha256=Y647w-vkRjPG7fssLTEF_Aa_pP74aN-WPCGv6r0_NcE,36420
+nkululeko-0.84.1.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
+nkululeko-0.84.1.dist-info/top_level.txt,sha256=DPFNNSHPjUeVKj44dVANAjuVGRCC3MusJ08lc2a8xFA,10
+nkululeko-0.84.1.dist-info/RECORD,,
{nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/LICENSE
File without changes
{nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/WHEEL
File without changes
{nkululeko-0.84.0.dist-info → nkululeko-0.84.1.dist-info}/top_level.txt
File without changes