flexynesis 0.2.2__tar.gz → 0.2.3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {flexynesis-0.2.2 → flexynesis-0.2.3}/PKG-INFO +1 -1
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/__main__.py +4 -1
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/config.py +4 -4
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/main.py +8 -5
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/PKG-INFO +1 -1
- {flexynesis-0.2.2 → flexynesis-0.2.3}/pyproject.toml +1 -1
- {flexynesis-0.2.2 → flexynesis-0.2.3}/LICENCE.md +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/README.md +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/__init__.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/cli.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/data.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/feature_selection.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/__init__.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/crossmodal_pred.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/direct_pred.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/gnn_early.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/direct_pred_cnn.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/direct_pred_gcnn.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/modules_on_ice.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/supervised_vae.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/triplet_encoder.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/modules.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/utils.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/SOURCES.txt +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/dependency_links.txt +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/entry_points.txt +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/requires.txt +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/top_level.txt +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/setup.cfg +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/__init__.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/unit/__init__.py +0 -0
- {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/unit/test_smoke.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: flexynesis
|
|
3
|
-
Version: 0.2.
|
|
3
|
+
Version: 0.2.3
|
|
4
4
|
Summary: A deep-learning based multi-omics bulk sequencing data integration suite with a focus on (pre-)clinical endpoint prediction.
|
|
5
5
|
Author-email: Bora Uyar <bora.uyar@mdc-berlin.de>, Taras Savchyn <Taras.Savchyn@mdc-berlin.de>, Ricardo Wurmus <Ricardo.Wurmus@mdc-berlin.de>, Ahmet Sarigun <Ahmet.Sariguen@mdc-berlin.de>
|
|
6
6
|
Project-URL: homepage, https://github.com/BIMSBbioinfo/flexynesis
|
|
@@ -46,6 +46,7 @@ def main():
|
|
|
46
46
|
--use_loss_weighting (str): Whether to apply loss-balancing using uncertainty weights method. Choices are ['True', 'False']. Default is 'True'.
|
|
47
47
|
--evaluate_baseline_performance (str): Whether to run Random Forest + SVMs to see the performance of off-the-shelf tools on the same dataset. Choices are ['True', 'False']. Default is 'True'.
|
|
48
48
|
--threads (int): How many threads to use when using CPU. Default is 4.
|
|
49
|
+
--num_workers (int): How many workers to use for model training. Default is 2
|
|
49
50
|
--use_gpu (bool): If set, the system will attempt to use CUDA/GPU if available.
|
|
50
51
|
--disable_marker_finding (bool): If set, marker discovery after model training is disabled.
|
|
51
52
|
--string_organism (int): STRING DB organism id. Default is 9606.
|
|
@@ -99,6 +100,7 @@ def main():
|
|
|
99
100
|
parser.add_argument("--use_loss_weighting", help="whether to apply loss-balancing using uncertainty weights method", type=str, choices=['True', 'False'], default = 'True')
|
|
100
101
|
parser.add_argument("--evaluate_baseline_performance", help="whether to run Random Forest + SVMs to see the performance of off-the-shelf tools on the same dataset", type=str, choices=['True', 'False'], default = 'True')
|
|
101
102
|
parser.add_argument("--threads", help="(Optional) How many threads to use when using CPU (default is 4)", type=int, default = 4)
|
|
103
|
+
parser.add_argument("--num_workers", help="(Optional) How many workers to use for model training (default is 2)", type=int, default = 2)
|
|
102
104
|
parser.add_argument("--use_gpu", action="store_true",
|
|
103
105
|
help="(Optional) If set, the system will attempt to use CUDA/GPU if available.")
|
|
104
106
|
parser.add_argument("--disable_marker_finding", action="store_true",
|
|
@@ -253,7 +255,8 @@ def main():
|
|
|
253
255
|
device_type = device_type,
|
|
254
256
|
gnn_conv_type = gnn_conv_type,
|
|
255
257
|
input_layers = input_layers,
|
|
256
|
-
output_layers = output_layers
|
|
258
|
+
output_layers = output_layers,
|
|
259
|
+
num_workers = args.num_workers)
|
|
257
260
|
|
|
258
261
|
# do a hyperparameter search training multiple models and get the best_configuration
|
|
259
262
|
model, best_params = tuner.perform_tuning(hpo_patience = args.hpo_patience)
|
|
@@ -6,28 +6,28 @@ epochs = [500]
|
|
|
6
6
|
search_spaces = {
|
|
7
7
|
'DirectPred': [
|
|
8
8
|
Integer(16, 128, name='latent_dim'),
|
|
9
|
-
Real(0.2,
|
|
9
|
+
Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
|
|
10
10
|
Real(0.0001, 0.01, prior='log-uniform', name='lr'),
|
|
11
11
|
Integer(8, 32, name='supervisor_hidden_dim'),
|
|
12
12
|
Categorical(epochs, name='epochs')
|
|
13
13
|
],
|
|
14
14
|
'supervised_vae': [
|
|
15
15
|
Integer(16, 128, name='latent_dim'),
|
|
16
|
-
Real(0.2,
|
|
16
|
+
Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
|
|
17
17
|
Integer(8, 32, name='supervisor_hidden_dim'),
|
|
18
18
|
Real(0.0001, 0.01, prior='log-uniform', name='lr'),
|
|
19
19
|
Categorical(epochs, name='epochs')
|
|
20
20
|
],
|
|
21
21
|
'CrossModalPred': [
|
|
22
22
|
Integer(16, 128, name='latent_dim'),
|
|
23
|
-
Real(0.2,
|
|
23
|
+
Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
|
|
24
24
|
Integer(8, 32, name='supervisor_hidden_dim'),
|
|
25
25
|
Real(0.0001, 0.01, prior='log-uniform', name='lr'),
|
|
26
26
|
Categorical(epochs, name='epochs')
|
|
27
27
|
],
|
|
28
28
|
'MultiTripletNetwork': [
|
|
29
29
|
Integer(16, 128, name='latent_dim'),
|
|
30
|
-
Real(0.2,
|
|
30
|
+
Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
|
|
31
31
|
Integer(8, 32, name='supervisor_hidden_dim'),
|
|
32
32
|
Real(0.0001, 0.01, prior='log-uniform', name='lr'),
|
|
33
33
|
Categorical(epochs, name='epochs')
|
|
@@ -56,7 +56,7 @@ class HyperparameterTuning:
|
|
|
56
56
|
cv_splits=5, use_loss_weighting=True, early_stop_patience=-1, device_type=None, gnn_conv_type=None,
|
|
57
57
|
input_layers=None, output_layers=None): Initializes the hyperparameter tuner with specific settings.
|
|
58
58
|
|
|
59
|
-
get_batch_space(min_size=16, max_size=
|
|
59
|
+
get_batch_space(min_size=16, max_size=128): Determines the batch size search space based on the dataset size.
|
|
60
60
|
|
|
61
61
|
setup_trainer(params, current_step, total_steps, full_train=False): Sets up the trainer with appropriate callbacks
|
|
62
62
|
and configurations for either full training or validation based training.
|
|
@@ -80,7 +80,7 @@ class HyperparameterTuning:
|
|
|
80
80
|
val_size = 0.2, use_cv = False, cv_splits = 5,
|
|
81
81
|
use_loss_weighting = True, early_stop_patience = -1,
|
|
82
82
|
device_type = None, gnn_conv_type = None,
|
|
83
|
-
input_layers = None, output_layers = None):
|
|
83
|
+
input_layers = None, output_layers = None, num_workers = 2):
|
|
84
84
|
self.dataset = dataset # dataset for model initiation
|
|
85
85
|
self.loader_dataset = dataset # dataset for defining data loaders (this can be model specific)
|
|
86
86
|
self.model_class = model_class
|
|
@@ -107,6 +107,7 @@ class HyperparameterTuning:
|
|
|
107
107
|
self.gnn_conv_type = gnn_conv_type
|
|
108
108
|
self.input_layers = input_layers
|
|
109
109
|
self.output_layers = output_layers
|
|
110
|
+
self.num_workers = num_workers
|
|
110
111
|
|
|
111
112
|
self.DataLoader = torch.utils.data.DataLoader # use torch data loader by default
|
|
112
113
|
|
|
@@ -128,7 +129,7 @@ class HyperparameterTuning:
|
|
|
128
129
|
else:
|
|
129
130
|
raise ValueError(f"'{self.config_name}' not found in the default config.")
|
|
130
131
|
|
|
131
|
-
def get_batch_space(self, min_size = 32, max_size =
|
|
132
|
+
def get_batch_space(self, min_size = 32, max_size = 128):
|
|
132
133
|
m = int(np.log2(len(self.dataset) * 0.8))
|
|
133
134
|
st = int(np.log2(min_size))
|
|
134
135
|
end = int(np.log2(max_size))
|
|
@@ -214,9 +215,11 @@ class HyperparameterTuning:
|
|
|
214
215
|
train_subset = torch.utils.data.Subset(self.loader_dataset, train_index)
|
|
215
216
|
val_subset = torch.utils.data.Subset(self.loader_dataset, val_index)
|
|
216
217
|
train_loader = self.DataLoader(train_subset, batch_size=int(params['batch_size']),
|
|
217
|
-
pin_memory=True, shuffle=True, drop_last=True, num_workers =
|
|
218
|
+
pin_memory=True, shuffle=True, drop_last=True, num_workers = self.num_workers, prefetch_factor = None,
|
|
219
|
+
persistent_workers = self.num_workers > 0)
|
|
218
220
|
val_loader = self.DataLoader(val_subset, batch_size=int(params['batch_size']),
|
|
219
|
-
pin_memory=True, shuffle=False, num_workers =
|
|
221
|
+
pin_memory=True, shuffle=False, num_workers = self.num_workers, prefetch_factor = None,
|
|
222
|
+
persistent_workers = self.num_workers > 0)
|
|
220
223
|
|
|
221
224
|
model = self.model_class(**model_args)
|
|
222
225
|
trainer, early_stop_callback = self.setup_trainer(params, current_step, total_steps)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: flexynesis
|
|
3
|
-
Version: 0.2.
|
|
3
|
+
Version: 0.2.3
|
|
4
4
|
Summary: A deep-learning based multi-omics bulk sequencing data integration suite with a focus on (pre-)clinical endpoint prediction.
|
|
5
5
|
Author-email: Bora Uyar <bora.uyar@mdc-berlin.de>, Taras Savchyn <Taras.Savchyn@mdc-berlin.de>, Ricardo Wurmus <Ricardo.Wurmus@mdc-berlin.de>, Ahmet Sarigun <Ahmet.Sariguen@mdc-berlin.de>
|
|
6
6
|
Project-URL: homepage, https://github.com/BIMSBbioinfo/flexynesis
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|