cesnet-datazoo 0.1.14__py3-none-any.whl → 0.1.15__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cesnet_datazoo/config.py +3 -1
- cesnet_datazoo/datasets/cesnet_dataset.py +3 -1
- {cesnet_datazoo-0.1.14.dist-info → cesnet_datazoo-0.1.15.dist-info}/METADATA +1 -1
- {cesnet_datazoo-0.1.14.dist-info → cesnet_datazoo-0.1.15.dist-info}/RECORD +7 -7
- {cesnet_datazoo-0.1.14.dist-info → cesnet_datazoo-0.1.15.dist-info}/WHEEL +0 -0
- {cesnet_datazoo-0.1.14.dist-info → cesnet_datazoo-0.1.15.dist-info}/licenses/LICENCE +0 -0
- {cesnet_datazoo-0.1.14.dist-info → cesnet_datazoo-0.1.15.dist-info}/top_level.txt +0 -0
cesnet_datazoo/config.py
CHANGED
@@ -166,7 +166,8 @@ class DatasetConfig():
|
|
166
166
|
val_workers: Number of workers for loading validation data. `0` means that the data will be loaded in the main process. `Default: 1`
|
167
167
|
batch_size: Number of samples per batch. `Default: 192`
|
168
168
|
test_batch_size: Number of samples per batch for loading validation and test data. `Default: 2048`
|
169
|
-
|
169
|
+
preload_train: Whether to dump the train set with `numpy.savez_compressed` and preload it in future runs. Useful when running a lot of experiments with the same dataset configuration. `Default: False`
|
170
|
+
preload_val: Whether to dump the validation set with `numpy.savez_compressed` and preload it in future runs. `Default: False`
|
170
171
|
preload_test: Whether to dump the test set with `numpy.savez_compressed` and preload it in future runs. `Default: False`
|
171
172
|
train_size: Size of the train set. See [instructions][config.DatasetConfig--how-to-configure-train-validation-and-test-sets]. `Default: all`
|
172
173
|
val_known_size: Size of the validation set. See [instructions][config.DatasetConfig--how-to-configure-train-validation-and-test-sets]. `Default: all`
|
@@ -244,6 +245,7 @@ class DatasetConfig():
|
|
244
245
|
val_workers: int = 1
|
245
246
|
batch_size: int = 192
|
246
247
|
test_batch_size: int = 2048
|
248
|
+
preload_train: bool = False
|
247
249
|
preload_val: bool = False
|
248
250
|
preload_test: bool = False
|
249
251
|
train_size: int | Literal["all"] = "all"
|
cesnet_datazoo/datasets/cesnet_dataset.py
CHANGED
@@ -642,7 +642,9 @@ class CesnetDataset():
|
|
642
642
|
flowstats_transform=dataset_config.flowstats_transform,
|
643
643
|
flowstats_phist_transform=dataset_config.flowstats_phist_transform,
|
644
644
|
target_transform=label_encoder_fn,
|
645
|
-
return_tensors=dataset_config.return_tensors,)
|
645
|
+
return_tensors=dataset_config.return_tensors,
|
646
|
+
preload=dataset_config.preload_train,
|
647
|
+
preload_blob=os.path.join(dataset_config._get_train_data_path(), "preload", f"train_dataset-{dataset_config.train_size}.npz"),)
|
646
648
|
if dataset_config.need_val_set:
|
647
649
|
assert val_data_path is not None
|
648
650
|
val_dataset = PyTablesDataset(
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: cesnet-datazoo
|
3
|
-
Version: 0.1.14
|
3
|
+
Version: 0.1.15
|
4
4
|
Summary: A toolkit for large network traffic datasets
|
5
5
|
Author-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
|
6
6
|
Maintainer-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
|
@@ -1,8 +1,8 @@
|
|
1
1
|
cesnet_datazoo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
cesnet_datazoo/config.py,sha256=
|
2
|
+
cesnet_datazoo/config.py,sha256=OEVdJQP9p7RYIgHxbXnwKsLZ85xJzlsA1CCoJ8SO4Ps,38933
|
3
3
|
cesnet_datazoo/constants.py,sha256=6GhcIyjVnWYrVnxRgTlGuiWRtvwZL1KqyzMJS26ge2E,1481
|
4
4
|
cesnet_datazoo/datasets/__init__.py,sha256=8ziQ3EUzUh5fMfWWXwk0cqYk0lOUNU7zbi0Gom3bLnI,443
|
5
|
-
cesnet_datazoo/datasets/cesnet_dataset.py,sha256=
|
5
|
+
cesnet_datazoo/datasets/cesnet_dataset.py,sha256=zP97SwDHHvpRsFVP8kdOntV9tNkXYX_YpYpy1qLt8Zc,48016
|
6
6
|
cesnet_datazoo/datasets/datasets.py,sha256=Bn4SU1k5og6AsUlnPapFPeu4uGlpRH-IaOSafz0ZT2k,3617
|
7
7
|
cesnet_datazoo/datasets/datasets_constants.py,sha256=1P54Ns8wCQMemdKNe8OH7cVUfkxs3vL29ugSmOLXceI,29154
|
8
8
|
cesnet_datazoo/datasets/loaders.py,sha256=9KgRY-Y8CcgtXbgqWpAaG7gyOAsSf278w7b1eHwTSyE,1854
|
@@ -23,8 +23,8 @@ cesnet_datazoo/utils/class_info.py,sha256=H5UgyRqXIepBJmkLQ1gAIXV4owKSoIllguRiqF
|
|
23
23
|
cesnet_datazoo/utils/download.py,sha256=hG5V1ZYZGtqCzlVV76NMgOZkSKOywdOFiq9Lagkgego,1441
|
24
24
|
cesnet_datazoo/utils/fileutils.py,sha256=XA_VWDuTiCXnoOgHPUzsmbnLFgrlxOo5cvUY_OBJUR8,642
|
25
25
|
cesnet_datazoo/utils/random.py,sha256=Dqgm_T25ljbew-OJozK90PsiXKnd4Kw6lcUexxF6vIc,575
|
26
|
-
cesnet_datazoo-0.1.
|
27
|
-
cesnet_datazoo-0.1.
|
28
|
-
cesnet_datazoo-0.1.
|
29
|
-
cesnet_datazoo-0.1.
|
30
|
-
cesnet_datazoo-0.1.
|
26
|
+
cesnet_datazoo-0.1.15.dist-info/licenses/LICENCE,sha256=69Wc69APiM1YKrFOIipG7jjU2lk89WQuO_U0AXKU8KE,1541
|
27
|
+
cesnet_datazoo-0.1.15.dist-info/METADATA,sha256=iVq2zImXujDGrI8Jca4cVpUY0LqWrBv7oGKVOVTJZ8k,12574
|
28
|
+
cesnet_datazoo-0.1.15.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
29
|
+
cesnet_datazoo-0.1.15.dist-info/top_level.txt,sha256=bu1Z8zaI_1Id_ZaYyvJnxIBa87OSrdlZ8J2OBMggK5o,15
|
30
|
+
cesnet_datazoo-0.1.15.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|