cesnet-datazoo 0.1.14__py3-none-any.whl → 0.1.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cesnet_datazoo/config.py CHANGED
@@ -166,7 +166,8 @@ class DatasetConfig():
166
166
  val_workers: Number of workers for loading validation data. `0` means that the data will be loaded in the main process. `Default: 1`
167
167
  batch_size: Number of samples per batch. `Default: 192`
168
168
  test_batch_size: Number of samples per batch for loading validation and test data. `Default: 2048`
169
- preload_val: Whether to dump the validation set with `numpy.savez_compressed` and preload it in future runs. Useful when running a lot of experiments with the same dataset configuration. `Default: False`
169
+ preload_train: Whether to dump the train set with `numpy.savez_compressed` and preload it in future runs. Useful when running a lot of experiments with the same dataset configuration. `Default: False`
170
+ preload_val: Whether to dump the validation set with `numpy.savez_compressed` and preload it in future runs. `Default: False`
170
171
  preload_test: Whether to dump the test set with `numpy.savez_compressed` and preload it in future runs. `Default: False`
171
172
  train_size: Size of the train set. See [instructions][config.DatasetConfig--how-to-configure-train-validation-and-test-sets]. `Default: all`
172
173
  val_known_size: Size of the validation set. See [instructions][config.DatasetConfig--how-to-configure-train-validation-and-test-sets]. `Default: all`
@@ -244,6 +245,7 @@ class DatasetConfig():
244
245
  val_workers: int = 1
245
246
  batch_size: int = 192
246
247
  test_batch_size: int = 2048
248
+ preload_train: bool = False
247
249
  preload_val: bool = False
248
250
  preload_test: bool = False
249
251
  train_size: int | Literal["all"] = "all"
@@ -642,7 +642,9 @@ class CesnetDataset():
642
642
  flowstats_transform=dataset_config.flowstats_transform,
643
643
  flowstats_phist_transform=dataset_config.flowstats_phist_transform,
644
644
  target_transform=label_encoder_fn,
645
- return_tensors=dataset_config.return_tensors,)
645
+ return_tensors=dataset_config.return_tensors,
646
+ preload=dataset_config.preload_train,
647
+ preload_blob=os.path.join(dataset_config._get_train_data_path(), "preload", f"train_dataset-{dataset_config.train_size}.npz"),)
646
648
  if dataset_config.need_val_set:
647
649
  assert val_data_path is not None
648
650
  val_dataset = PyTablesDataset(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: cesnet-datazoo
3
- Version: 0.1.14
3
+ Version: 0.1.15
4
4
  Summary: A toolkit for large network traffic datasets
5
5
  Author-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
6
6
  Maintainer-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
@@ -1,8 +1,8 @@
1
1
  cesnet_datazoo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
- cesnet_datazoo/config.py,sha256=AoYMX_drWqb6K6MhdTQRyvUPf_6kZeL3ie04hUgJzgE,38768
2
+ cesnet_datazoo/config.py,sha256=OEVdJQP9p7RYIgHxbXnwKsLZ85xJzlsA1CCoJ8SO4Ps,38933
3
3
  cesnet_datazoo/constants.py,sha256=6GhcIyjVnWYrVnxRgTlGuiWRtvwZL1KqyzMJS26ge2E,1481
4
4
  cesnet_datazoo/datasets/__init__.py,sha256=8ziQ3EUzUh5fMfWWXwk0cqYk0lOUNU7zbi0Gom3bLnI,443
5
- cesnet_datazoo/datasets/cesnet_dataset.py,sha256=AgxdiEwtJrOug9F8LJcMwttc7NMrligkq7cy4lRmLAs,47817
5
+ cesnet_datazoo/datasets/cesnet_dataset.py,sha256=zP97SwDHHvpRsFVP8kdOntV9tNkXYX_YpYpy1qLt8Zc,48016
6
6
  cesnet_datazoo/datasets/datasets.py,sha256=Bn4SU1k5og6AsUlnPapFPeu4uGlpRH-IaOSafz0ZT2k,3617
7
7
  cesnet_datazoo/datasets/datasets_constants.py,sha256=1P54Ns8wCQMemdKNe8OH7cVUfkxs3vL29ugSmOLXceI,29154
8
8
  cesnet_datazoo/datasets/loaders.py,sha256=9KgRY-Y8CcgtXbgqWpAaG7gyOAsSf278w7b1eHwTSyE,1854
@@ -23,8 +23,8 @@ cesnet_datazoo/utils/class_info.py,sha256=H5UgyRqXIepBJmkLQ1gAIXV4owKSoIllguRiqF
23
23
  cesnet_datazoo/utils/download.py,sha256=hG5V1ZYZGtqCzlVV76NMgOZkSKOywdOFiq9Lagkgego,1441
24
24
  cesnet_datazoo/utils/fileutils.py,sha256=XA_VWDuTiCXnoOgHPUzsmbnLFgrlxOo5cvUY_OBJUR8,642
25
25
  cesnet_datazoo/utils/random.py,sha256=Dqgm_T25ljbew-OJozK90PsiXKnd4Kw6lcUexxF6vIc,575
26
- cesnet_datazoo-0.1.14.dist-info/licenses/LICENCE,sha256=69Wc69APiM1YKrFOIipG7jjU2lk89WQuO_U0AXKU8KE,1541
27
- cesnet_datazoo-0.1.14.dist-info/METADATA,sha256=yp-ld51MKd-oTx-z86x0BwbJEvdY2zlc1fIbfYIDKWY,12574
28
- cesnet_datazoo-0.1.14.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
29
- cesnet_datazoo-0.1.14.dist-info/top_level.txt,sha256=bu1Z8zaI_1Id_ZaYyvJnxIBa87OSrdlZ8J2OBMggK5o,15
30
- cesnet_datazoo-0.1.14.dist-info/RECORD,,
26
+ cesnet_datazoo-0.1.15.dist-info/licenses/LICENCE,sha256=69Wc69APiM1YKrFOIipG7jjU2lk89WQuO_U0AXKU8KE,1541
27
+ cesnet_datazoo-0.1.15.dist-info/METADATA,sha256=iVq2zImXujDGrI8Jca4cVpUY0LqWrBv7oGKVOVTJZ8k,12574
28
+ cesnet_datazoo-0.1.15.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
29
+ cesnet_datazoo-0.1.15.dist-info/top_level.txt,sha256=bu1Z8zaI_1Id_ZaYyvJnxIBa87OSrdlZ8J2OBMggK5o,15
30
+ cesnet_datazoo-0.1.15.dist-info/RECORD,,