flexynesis 0.2.2__tar.gz → 0.2.3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32) hide show
  1. {flexynesis-0.2.2 → flexynesis-0.2.3}/PKG-INFO +1 -1
  2. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/__main__.py +4 -1
  3. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/config.py +4 -4
  4. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/main.py +8 -5
  5. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/PKG-INFO +1 -1
  6. {flexynesis-0.2.2 → flexynesis-0.2.3}/pyproject.toml +1 -1
  7. {flexynesis-0.2.2 → flexynesis-0.2.3}/LICENCE.md +0 -0
  8. {flexynesis-0.2.2 → flexynesis-0.2.3}/README.md +0 -0
  9. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/__init__.py +0 -0
  10. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/cli.py +0 -0
  11. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/data.py +0 -0
  12. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/feature_selection.py +0 -0
  13. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/__init__.py +0 -0
  14. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/crossmodal_pred.py +0 -0
  15. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/direct_pred.py +0 -0
  16. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/gnn_early.py +0 -0
  17. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/direct_pred_cnn.py +0 -0
  18. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/direct_pred_gcnn.py +0 -0
  19. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/on_ice/modules_on_ice.py +0 -0
  20. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/supervised_vae.py +0 -0
  21. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/models/triplet_encoder.py +0 -0
  22. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/modules.py +0 -0
  23. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis/utils.py +0 -0
  24. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/SOURCES.txt +0 -0
  25. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/dependency_links.txt +0 -0
  26. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/entry_points.txt +0 -0
  27. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/requires.txt +0 -0
  28. {flexynesis-0.2.2 → flexynesis-0.2.3}/flexynesis.egg-info/top_level.txt +0 -0
  29. {flexynesis-0.2.2 → flexynesis-0.2.3}/setup.cfg +0 -0
  30. {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/__init__.py +0 -0
  31. {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/unit/__init__.py +0 -0
  32. {flexynesis-0.2.2 → flexynesis-0.2.3}/tests/unit/test_smoke.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: flexynesis
3
- Version: 0.2.2
3
+ Version: 0.2.3
4
4
  Summary: A deep-learning based multi-omics bulk sequencing data integration suite with a focus on (pre-)clinical endpoint prediction.
5
5
  Author-email: Bora Uyar <bora.uyar@mdc-berlin.de>, Taras Savchyn <Taras.Savchyn@mdc-berlin.de>, Ricardo Wurmus <Ricardo.Wurmus@mdc-berlin.de>, Ahmet Sarigun <Ahmet.Sariguen@mdc-berlin.de>
6
6
  Project-URL: homepage, https://github.com/BIMSBbioinfo/flexynesis
@@ -46,6 +46,7 @@ def main():
46
46
  --use_loss_weighting (str): Whether to apply loss-balancing using uncertainty weights method. Choices are ['True', 'False']. Default is 'True'.
47
47
  --evaluate_baseline_performance (str): Whether to run Random Forest + SVMs to see the performance of off-the-shelf tools on the same dataset. Choices are ['True', 'False']. Default is 'True'.
48
48
  --threads (int): How many threads to use when using CPU. Default is 4.
49
+ --num_workers (int): How many workers to use for model training. Default is 2
49
50
  --use_gpu (bool): If set, the system will attempt to use CUDA/GPU if available.
50
51
  --disable_marker_finding (bool): If set, marker discovery after model training is disabled.
51
52
  --string_organism (int): STRING DB organism id. Default is 9606.
@@ -99,6 +100,7 @@ def main():
99
100
  parser.add_argument("--use_loss_weighting", help="whether to apply loss-balancing using uncertainty weights method", type=str, choices=['True', 'False'], default = 'True')
100
101
  parser.add_argument("--evaluate_baseline_performance", help="whether to run Random Forest + SVMs to see the performance of off-the-shelf tools on the same dataset", type=str, choices=['True', 'False'], default = 'True')
101
102
  parser.add_argument("--threads", help="(Optional) How many threads to use when using CPU (default is 4)", type=int, default = 4)
103
+ parser.add_argument("--num_workers", help="(Optional) How many workers to use for model training (default is 2)", type=int, default = 2)
102
104
  parser.add_argument("--use_gpu", action="store_true",
103
105
  help="(Optional) If set, the system will attempt to use CUDA/GPU if available.")
104
106
  parser.add_argument("--disable_marker_finding", action="store_true",
@@ -253,7 +255,8 @@ def main():
253
255
  device_type = device_type,
254
256
  gnn_conv_type = gnn_conv_type,
255
257
  input_layers = input_layers,
256
- output_layers = output_layers)
258
+ output_layers = output_layers,
259
+ num_workers = args.num_workers)
257
260
 
258
261
  # do a hyperparameter search training multiple models and get the best_configuration
259
262
  model, best_params = tuner.perform_tuning(hpo_patience = args.hpo_patience)
@@ -6,28 +6,28 @@ epochs = [500]
6
6
  search_spaces = {
7
7
  'DirectPred': [
8
8
  Integer(16, 128, name='latent_dim'),
9
- Real(0.2, 1, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
9
+ Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
10
10
  Real(0.0001, 0.01, prior='log-uniform', name='lr'),
11
11
  Integer(8, 32, name='supervisor_hidden_dim'),
12
12
  Categorical(epochs, name='epochs')
13
13
  ],
14
14
  'supervised_vae': [
15
15
  Integer(16, 128, name='latent_dim'),
16
- Real(0.2, 1, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
16
+ Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
17
17
  Integer(8, 32, name='supervisor_hidden_dim'),
18
18
  Real(0.0001, 0.01, prior='log-uniform', name='lr'),
19
19
  Categorical(epochs, name='epochs')
20
20
  ],
21
21
  'CrossModalPred': [
22
22
  Integer(16, 128, name='latent_dim'),
23
- Real(0.2, 1, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
23
+ Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
24
24
  Integer(8, 32, name='supervisor_hidden_dim'),
25
25
  Real(0.0001, 0.01, prior='log-uniform', name='lr'),
26
26
  Categorical(epochs, name='epochs')
27
27
  ],
28
28
  'MultiTripletNetwork': [
29
29
  Integer(16, 128, name='latent_dim'),
30
- Real(0.2, 1, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
30
+ Real(0.2, 0.5, name='hidden_dim_factor'), # relative size of the hidden_dim w.r.t input_dim
31
31
  Integer(8, 32, name='supervisor_hidden_dim'),
32
32
  Real(0.0001, 0.01, prior='log-uniform', name='lr'),
33
33
  Categorical(epochs, name='epochs')
@@ -56,7 +56,7 @@ class HyperparameterTuning:
56
56
  cv_splits=5, use_loss_weighting=True, early_stop_patience=-1, device_type=None, gnn_conv_type=None,
57
57
  input_layers=None, output_layers=None): Initializes the hyperparameter tuner with specific settings.
58
58
 
59
- get_batch_space(min_size=16, max_size=256): Determines the batch size search space based on the dataset size.
59
+ get_batch_space(min_size=16, max_size=128): Determines the batch size search space based on the dataset size.
60
60
 
61
61
  setup_trainer(params, current_step, total_steps, full_train=False): Sets up the trainer with appropriate callbacks
62
62
  and configurations for either full training or validation based training.
@@ -80,7 +80,7 @@ class HyperparameterTuning:
80
80
  val_size = 0.2, use_cv = False, cv_splits = 5,
81
81
  use_loss_weighting = True, early_stop_patience = -1,
82
82
  device_type = None, gnn_conv_type = None,
83
- input_layers = None, output_layers = None):
83
+ input_layers = None, output_layers = None, num_workers = 2):
84
84
  self.dataset = dataset # dataset for model initiation
85
85
  self.loader_dataset = dataset # dataset for defining data loaders (this can be model specific)
86
86
  self.model_class = model_class
@@ -107,6 +107,7 @@ class HyperparameterTuning:
107
107
  self.gnn_conv_type = gnn_conv_type
108
108
  self.input_layers = input_layers
109
109
  self.output_layers = output_layers
110
+ self.num_workers = num_workers
110
111
 
111
112
  self.DataLoader = torch.utils.data.DataLoader # use torch data loader by default
112
113
 
@@ -128,7 +129,7 @@ class HyperparameterTuning:
128
129
  else:
129
130
  raise ValueError(f"'{self.config_name}' not found in the default config.")
130
131
 
131
- def get_batch_space(self, min_size = 32, max_size = 256):
132
+ def get_batch_space(self, min_size = 32, max_size = 128):
132
133
  m = int(np.log2(len(self.dataset) * 0.8))
133
134
  st = int(np.log2(min_size))
134
135
  end = int(np.log2(max_size))
@@ -214,9 +215,11 @@ class HyperparameterTuning:
214
215
  train_subset = torch.utils.data.Subset(self.loader_dataset, train_index)
215
216
  val_subset = torch.utils.data.Subset(self.loader_dataset, val_index)
216
217
  train_loader = self.DataLoader(train_subset, batch_size=int(params['batch_size']),
217
- pin_memory=True, shuffle=True, drop_last=True, num_workers = 4, prefetch_factor = None, persistent_workers = True)
218
+ pin_memory=True, shuffle=True, drop_last=True, num_workers = self.num_workers, prefetch_factor = None,
219
+ persistent_workers = self.num_workers > 0)
218
220
  val_loader = self.DataLoader(val_subset, batch_size=int(params['batch_size']),
219
- pin_memory=True, shuffle=False, num_workers = 4, prefetch_factor = None, persistent_workers = True)
221
+ pin_memory=True, shuffle=False, num_workers = self.num_workers, prefetch_factor = None,
222
+ persistent_workers = self.num_workers > 0)
220
223
 
221
224
  model = self.model_class(**model_args)
222
225
  trainer, early_stop_callback = self.setup_trainer(params, current_step, total_steps)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: flexynesis
3
- Version: 0.2.2
3
+ Version: 0.2.3
4
4
  Summary: A deep-learning based multi-omics bulk sequencing data integration suite with a focus on (pre-)clinical endpoint prediction.
5
5
  Author-email: Bora Uyar <bora.uyar@mdc-berlin.de>, Taras Savchyn <Taras.Savchyn@mdc-berlin.de>, Ricardo Wurmus <Ricardo.Wurmus@mdc-berlin.de>, Ahmet Sarigun <Ahmet.Sariguen@mdc-berlin.de>
6
6
  Project-URL: homepage, https://github.com/BIMSBbioinfo/flexynesis
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "flexynesis"
7
- version = "0.2.2"
7
+ version = "0.2.3"
8
8
  authors = [
9
9
  {name = "Bora Uyar", email = "bora.uyar@mdc-berlin.de"},
10
10
  {name = "Taras Savchyn", email = "Taras.Savchyn@mdc-berlin.de"},
File without changes
File without changes
File without changes
File without changes
File without changes