cesnet-datazoo 0.1.9__tar.gz → 0.1.10__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (35)
  1. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/PKG-INFO +1 -1
  2. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/cesnet_dataset.py +6 -1
  3. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo.egg-info/PKG-INFO +1 -1
  4. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/pyproject.toml +1 -1
  5. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/LICENCE +0 -0
  6. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/README.md +0 -0
  7. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/__init__.py +0 -0
  8. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/config.py +0 -0
  9. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/constants.py +0 -0
  10. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/__init__.py +0 -0
  11. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/datasets.py +0 -0
  12. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/datasets_constants.py +0 -0
  13. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/loaders.py +0 -0
  14. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/metadata/__init__.py +0 -0
  15. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/metadata/dataset_metadata.py +0 -0
  16. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/metadata/metadata.csv +0 -0
  17. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/datasets/statistics.py +0 -0
  18. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/metrics/__init__.py +0 -0
  19. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/metrics/classification_report.py +0 -0
  20. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/metrics/provider_metrics.py +0 -0
  21. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/pytables_data/__init__.py +0 -0
  22. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/pytables_data/apps_split.py +0 -0
  23. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/pytables_data/data_scalers.py +0 -0
  24. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/pytables_data/indices_setup.py +0 -0
  25. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/pytables_data/pytables_dataset.py +0 -0
  26. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/utils/__init__.py +0 -0
  27. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/utils/class_info.py +0 -0
  28. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/utils/download.py +0 -0
  29. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/utils/fileutils.py +0 -0
  30. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo/utils/random.py +0 -0
  31. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo.egg-info/SOURCES.txt +0 -0
  32. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo.egg-info/dependency_links.txt +0 -0
  33. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo.egg-info/requires.txt +0 -0
  34. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/cesnet_datazoo.egg-info/top_level.txt +0 -0
  35. {cesnet_datazoo-0.1.9 → cesnet_datazoo-0.1.10}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cesnet-datazoo
3
- Version: 0.1.9
3
+ Version: 0.1.10
4
4
  Summary: A toolkit for large network traffic datasets
5
5
  Author-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
6
6
  Maintainer-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
@@ -176,7 +176,7 @@ class CesnetDataset():
176
176
  raise ValueError(f"Found {len(available_applications)} applications in the servicemap (omitting background traffic classes), but expected {self.metadata.application_count}. Please report this issue.")
177
177
  self.available_classes = available_applications + self.metadata.background_traffic_classes
178
178
 
179
- def set_dataset_config_and_initialize(self, dataset_config: DatasetConfig, disable_indices_cache: bool = False) -> None:
179
+ def set_dataset_config_and_initialize(self, dataset_config: DatasetConfig, disable_indices_cache: bool = False, silent_warning: bool = False) -> None:
180
180
  """
181
181
  Initialize train, validation, and test sets. Data cannot be accessed before calling this method.
182
182
 
@@ -184,6 +184,11 @@ class CesnetDataset():
184
184
  dataset_config: Desired configuration of the dataset.
185
185
  disable_indices_cache: Whether to disable caching of the dataset indices. This is useful when the dataset is used in many different configurations and you want to save disk space.
186
186
  """
187
+ if self.name.startswith("CESNET-TLS-Year22") and not silent_warning:
188
+ warnings.warn("The CESNET-TLS-Year22 dataset contains traffic from the entire year of 2022. During the dataset collection, in week 10 (7.3.2022 - 13.3.2022), " + \
189
+ "the used flow exporter was updated with new features resulting in a change in the distribution of packet sequence data. " + \
190
+ "This can lead to a decrease in model performance when a model is trained on traffic before week 10 and tested on traffic after week 10. " + \
191
+ "More details can be found in the paper at https://doi.org/10.1038/s41597-024-03927-4. To disable this warning set silent_warning=True.")
187
192
  self.dataset_config = dataset_config
188
193
  self._clear()
189
194
  self._initialize_train_val_test(disable_indices_cache=disable_indices_cache)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: cesnet-datazoo
3
- Version: 0.1.9
3
+ Version: 0.1.10
4
4
  Summary: A toolkit for large network traffic datasets
5
5
  Author-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
6
6
  Maintainer-email: Jan Luxemburk <luxemburk@cesnet.cz>, Karel Hynek <hynekkar@cesnet.cz>
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "cesnet-datazoo"
7
- version = "0.1.9"
7
+ version = "0.1.10"
8
8
  authors = [
9
9
  {name = "Jan Luxemburk", email = "luxemburk@cesnet.cz"},
10
10
  {name = "Karel Hynek", email = "hynekkar@cesnet.cz"},
File without changes