stouputils 1.14.0__py3-none-any.whl → 1.14.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108) hide show
  1. stouputils/__init__.pyi +15 -0
  2. stouputils/_deprecated.pyi +12 -0
  3. stouputils/all_doctests.pyi +46 -0
  4. stouputils/applications/__init__.pyi +2 -0
  5. stouputils/applications/automatic_docs.py +3 -0
  6. stouputils/applications/automatic_docs.pyi +106 -0
  7. stouputils/applications/upscaler/__init__.pyi +3 -0
  8. stouputils/applications/upscaler/config.pyi +18 -0
  9. stouputils/applications/upscaler/image.pyi +109 -0
  10. stouputils/applications/upscaler/video.pyi +60 -0
  11. stouputils/archive.pyi +67 -0
  12. stouputils/backup.pyi +109 -0
  13. stouputils/collections.pyi +86 -0
  14. stouputils/continuous_delivery/__init__.pyi +5 -0
  15. stouputils/continuous_delivery/cd_utils.pyi +129 -0
  16. stouputils/continuous_delivery/github.pyi +162 -0
  17. stouputils/continuous_delivery/pypi.pyi +52 -0
  18. stouputils/continuous_delivery/pyproject.pyi +67 -0
  19. stouputils/continuous_delivery/stubs.pyi +39 -0
  20. stouputils/ctx.pyi +211 -0
  21. stouputils/data_science/config/get.py +51 -51
  22. stouputils/data_science/data_processing/image/__init__.py +66 -66
  23. stouputils/data_science/data_processing/image/auto_contrast.py +79 -79
  24. stouputils/data_science/data_processing/image/axis_flip.py +58 -58
  25. stouputils/data_science/data_processing/image/bias_field_correction.py +74 -74
  26. stouputils/data_science/data_processing/image/binary_threshold.py +73 -73
  27. stouputils/data_science/data_processing/image/blur.py +59 -59
  28. stouputils/data_science/data_processing/image/brightness.py +54 -54
  29. stouputils/data_science/data_processing/image/canny.py +110 -110
  30. stouputils/data_science/data_processing/image/clahe.py +92 -92
  31. stouputils/data_science/data_processing/image/common.py +30 -30
  32. stouputils/data_science/data_processing/image/contrast.py +53 -53
  33. stouputils/data_science/data_processing/image/curvature_flow_filter.py +74 -74
  34. stouputils/data_science/data_processing/image/denoise.py +378 -378
  35. stouputils/data_science/data_processing/image/histogram_equalization.py +123 -123
  36. stouputils/data_science/data_processing/image/invert.py +64 -64
  37. stouputils/data_science/data_processing/image/laplacian.py +60 -60
  38. stouputils/data_science/data_processing/image/median_blur.py +52 -52
  39. stouputils/data_science/data_processing/image/noise.py +59 -59
  40. stouputils/data_science/data_processing/image/normalize.py +65 -65
  41. stouputils/data_science/data_processing/image/random_erase.py +66 -66
  42. stouputils/data_science/data_processing/image/resize.py +69 -69
  43. stouputils/data_science/data_processing/image/rotation.py +80 -80
  44. stouputils/data_science/data_processing/image/salt_pepper.py +68 -68
  45. stouputils/data_science/data_processing/image/sharpening.py +55 -55
  46. stouputils/data_science/data_processing/image/shearing.py +64 -64
  47. stouputils/data_science/data_processing/image/threshold.py +64 -64
  48. stouputils/data_science/data_processing/image/translation.py +71 -71
  49. stouputils/data_science/data_processing/image/zoom.py +83 -83
  50. stouputils/data_science/data_processing/image_augmentation.py +118 -118
  51. stouputils/data_science/data_processing/image_preprocess.py +183 -183
  52. stouputils/data_science/data_processing/prosthesis_detection.py +359 -359
  53. stouputils/data_science/data_processing/technique.py +481 -481
  54. stouputils/data_science/dataset/__init__.py +45 -45
  55. stouputils/data_science/dataset/dataset.py +292 -292
  56. stouputils/data_science/dataset/dataset_loader.py +135 -135
  57. stouputils/data_science/dataset/grouping_strategy.py +296 -296
  58. stouputils/data_science/dataset/image_loader.py +100 -100
  59. stouputils/data_science/dataset/xy_tuple.py +696 -696
  60. stouputils/data_science/metric_dictionnary.py +106 -106
  61. stouputils/data_science/mlflow_utils.py +206 -206
  62. stouputils/data_science/models/abstract_model.py +149 -149
  63. stouputils/data_science/models/all.py +85 -85
  64. stouputils/data_science/models/keras/all.py +38 -38
  65. stouputils/data_science/models/keras/convnext.py +62 -62
  66. stouputils/data_science/models/keras/densenet.py +50 -50
  67. stouputils/data_science/models/keras/efficientnet.py +60 -60
  68. stouputils/data_science/models/keras/mobilenet.py +56 -56
  69. stouputils/data_science/models/keras/resnet.py +52 -52
  70. stouputils/data_science/models/keras/squeezenet.py +233 -233
  71. stouputils/data_science/models/keras/vgg.py +42 -42
  72. stouputils/data_science/models/keras/xception.py +38 -38
  73. stouputils/data_science/models/keras_utils/callbacks/__init__.py +20 -20
  74. stouputils/data_science/models/keras_utils/callbacks/colored_progress_bar.py +219 -219
  75. stouputils/data_science/models/keras_utils/callbacks/learning_rate_finder.py +148 -148
  76. stouputils/data_science/models/keras_utils/callbacks/model_checkpoint_v2.py +31 -31
  77. stouputils/data_science/models/keras_utils/callbacks/progressive_unfreezing.py +249 -249
  78. stouputils/data_science/models/keras_utils/callbacks/warmup_scheduler.py +66 -66
  79. stouputils/data_science/models/keras_utils/losses/__init__.py +12 -12
  80. stouputils/data_science/models/keras_utils/losses/next_generation_loss.py +56 -56
  81. stouputils/data_science/models/keras_utils/visualizations.py +416 -416
  82. stouputils/data_science/models/sandbox.py +116 -116
  83. stouputils/data_science/range_tuple.py +234 -234
  84. stouputils/data_science/utils.py +285 -285
  85. stouputils/decorators.pyi +242 -0
  86. stouputils/image.pyi +172 -0
  87. stouputils/installer/__init__.py +18 -18
  88. stouputils/installer/__init__.pyi +5 -0
  89. stouputils/installer/common.pyi +39 -0
  90. stouputils/installer/downloader.pyi +24 -0
  91. stouputils/installer/linux.py +144 -144
  92. stouputils/installer/linux.pyi +39 -0
  93. stouputils/installer/main.py +223 -223
  94. stouputils/installer/main.pyi +57 -0
  95. stouputils/installer/windows.py +136 -136
  96. stouputils/installer/windows.pyi +31 -0
  97. stouputils/io.pyi +213 -0
  98. stouputils/parallel.py +12 -10
  99. stouputils/parallel.pyi +211 -0
  100. stouputils/print.pyi +136 -0
  101. stouputils/py.typed +1 -1
  102. stouputils/stouputils/parallel.pyi +4 -4
  103. stouputils/version_pkg.pyi +15 -0
  104. {stouputils-1.14.0.dist-info → stouputils-1.14.2.dist-info}/METADATA +1 -1
  105. stouputils-1.14.2.dist-info/RECORD +171 -0
  106. stouputils-1.14.0.dist-info/RECORD +0 -140
  107. {stouputils-1.14.0.dist-info → stouputils-1.14.2.dist-info}/WHEEL +0 -0
  108. {stouputils-1.14.0.dist-info → stouputils-1.14.2.dist-info}/entry_points.txt +0 -0

# Imports
from .common import Any, NDArray, check_image, cv2, np


# Functions
def translate_image(image: NDArray[Any], x: float, y: float, padding: int = 0, ignore_dtype: bool = False) -> NDArray[Any]:
    """ Translate an image

    Args:
        image        (NDArray[Any]): Image to translate
        x            (float):        Translation along the x axis (between -1 and 1)
        y            (float):        Translation along the y axis (between -1 and 1)
        padding      (int):          Padding that has been added to the image before calling this function
        ignore_dtype (bool):         Ignore the dtype check
    Returns:
        NDArray[Any]: Translated image

    >>> ## Basic tests
    >>> image = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]]).astype(np.uint8)
    >>> translate_image(image, 0.5, 0.5).tolist()
    [[0, 0, 0], [0, 1, 2], [0, 4, 5]]

    >>> translate_image(image, 0, -2/3).tolist()
    [[7, 8, 9], [0, 0, 0], [0, 0, 0]]

    >>> ## Test invalid inputs
    >>> translate_image(image, 2, 0)
    Traceback (most recent call last):
        ...
    AssertionError: x must be between -1 and 1, got 2

    >>> translate_image(image, 0, 2)
    Traceback (most recent call last):
        ...
    AssertionError: y must be between -1 and 1, got 2

    >>> translate_image("not an image", 0, 0)
    Traceback (most recent call last):
        ...
    AssertionError: Image must be a numpy array

    >>> translate_image(image, 0, 0, padding=-1)
    Traceback (most recent call last):
        ...
    AssertionError: padding must be positive, got -1
    """
    # Validate every input before touching the pixels
    check_image(image, ignore_dtype=ignore_dtype)
    assert isinstance(x, float | int), f"x must be a number, got {type(x)}"
    assert isinstance(y, float | int), f"y must be a number, got {type(y)}"
    assert -1 <= x <= 1, f"x must be between -1 and 1, got {x}"
    assert -1 <= y <= 1, f"y must be between -1 and 1, got {y}"
    assert isinstance(padding, int), f"padding must be an integer, got {type(padding)}"
    assert padding >= 0, f"padding must be positive, got {padding}"

    # Dimensions of the padded image, and of the unpadded content it wraps
    height, width = image.shape[:2]
    content_width: int = width - 2 * padding
    content_height: int = height - 2 * padding

    # The relative offsets are fractions of the unpadded content size,
    # so a padded image still shifts by the same number of content pixels.
    shift_x: int = int(x * content_width)
    shift_y: int = int(y * content_height)

    # A pure translation is the affine map [[1, 0, tx], [0, 1, ty]]
    matrix: NDArray[Any] = np.array([[1, 0, shift_x], [0, 1, shift_y]], dtype=np.float32)

    # Warp keeps the canvas size, filling the uncovered area with zeros
    return cv2.warpAffine(image, matrix, (width, height))


# pyright: reportUnusedImport=false
# ruff: noqa: F401

# Imports
from .common import Any, NDArray, check_image, cv2, np


# Functions
def zoom_image(image: NDArray[Any], zoom_factor: float, ignore_dtype: bool = False) -> NDArray[Any]:
    """ Zoom into an image.

    The output always has the same height and width as the input: zooming in
    crops the center of the enlarged image, zooming out pads the shrunk image
    with black borders.

    Args:
        image        (NDArray[Any]): Image to zoom
        zoom_factor  (float):        Zoom factor (greater than 1 for zoom in, less than 1 for zoom out)
        ignore_dtype (bool):         Ignore the dtype check
    Returns:
        NDArray[Any]: Zoomed image

    >>> ## Basic tests
    >>> image = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]])
    >>> zoomed = zoom_image(image.astype(np.uint8), 1.5)
    >>> zoomed.shape == image.shape
    True

    >>> img = np.eye(4, dtype=np.uint8) * 255
    >>> zoomed_in = zoom_image(img, 2.0)
    >>> zoomed_in.shape == img.shape # Should preserve size
    True

    >>> zoomed_out = zoom_image(img, 0.5)
    >>> zoomed_out.shape == img.shape # Should preserve size
    True

    >>> odd = np.zeros((5, 5), dtype=np.uint8)
    >>> zoom_image(odd, 0.5).shape == (5, 5) # Odd size difference is also preserved
    True

    >>> rgb = np.full((4,4,3), 128, dtype=np.uint8)
    >>> zoomed_rgb = zoom_image(rgb, 1.5)
    >>> zoomed_rgb.shape == (4,4,3)
    True

    >>> ## Test invalid inputs
    >>> zoom_image("not an image", 1.5)
    Traceback (most recent call last):
        ...
    AssertionError: Image must be a numpy array

    >>> zoom_image(image.astype(np.uint8), "1.5")
    Traceback (most recent call last):
        ...
    AssertionError: zoom_factor must be a number, got <class 'str'>

    >>> zoom_image(image.astype(np.uint8), -1)
    Traceback (most recent call last):
        ...
    AssertionError: zoom_factor must be greater than 0, got -1
    """
    # Check input data
    check_image(image, ignore_dtype=ignore_dtype)
    assert isinstance(zoom_factor, float | int), f"zoom_factor must be a number, got {type(zoom_factor)}"
    assert zoom_factor > 0, f"zoom_factor must be greater than 0, got {zoom_factor}"

    # Get image dimensions
    height, width = image.shape[:2]

    # Calculate new dimensions
    new_height, new_width = int(height * zoom_factor), int(width * zoom_factor)

    # Resize image
    zoomed_image: NDArray[Any] = cv2.resize(image, (new_width, new_height))

    # Crop or pad to original size
    if zoom_factor > 1:
        # Crop the center region back to the original size
        start_x: int = (new_width - width) // 2
        start_y: int = (new_height - height) // 2
        return zoomed_image[start_y:start_y + height, start_x:start_x + width] # pyright: ignore [reportUnknownVariableType]
    else:
        # Pad back to the original size. Borders are split asymmetrically so
        # that odd size differences still restore the exact original shape
        # (a symmetric `pad // 2` on both sides would fall one pixel short).
        pad_left: int = (width - new_width) // 2
        pad_right: int = width - new_width - pad_left
        pad_top: int = (height - new_height) // 2
        pad_bottom: int = height - new_height - pad_top
        # Channel count: shape[-1] of a 2D grayscale image is its width, so
        # only read the channel axis when it actually exists (max 4 for OpenCV)
        channels: int = image.shape[2] if image.ndim == 3 else 1
        value: list[int] = [0] * min(channels, 4)
        return cv2.copyMakeBorder(zoomed_image, pad_top, pad_bottom, pad_left, pad_right, cv2.BORDER_CONSTANT, value=value)


# Imports
import os
import random

from ...decorators import handle_error
from ..config.get import DataScienceConfig
from .image_preprocess import ImageDatasetPreprocess
from .technique import ProcessingTechnique


# Image dataset augmentation class
class ImageDatasetAugmentation(ImageDatasetPreprocess):
    """ Image dataset augmentation class. Check the class constructor for more information. """

    # Class constructor (configuration)
    def __init__(self, final_dataset_size: int, techniques: list[ProcessingTechnique] | None = None) -> None:
        """ Initialize the image dataset augmentation class with the given parameters.

        Args:
            final_dataset_size (int): Size of the final dataset
            techniques (list[ProcessingTechnique]): List of processing techniques to apply.
        """
        super().__init__(techniques=[] if techniques is None else techniques)
        self.final_dataset_size: int = final_dataset_size

    # Class methods
    def _add_suffix(self, path: str, used_destinations: set[str]) -> str:
        """ Add a count suffix to the path in order to avoid overwriting the same file

        Args:
            path (str): Path to the file (example: "path/to/file.jpg")
            used_destinations (set[str]): Destinations already handed out in this run
        Returns:
            str: Path with the suffix (example: "path/to/file_1.jpg")
        """
        # Split the path into base path and extension (e.g. "path/to/file.jpg" -> "path/to/file", ".jpg")
        base, extension = os.path.splitext(path)
        suffix: str = DataScienceConfig.AUGMENTED_FILE_SUFFIX

        # Increment the counter until the candidate neither was handed out
        # earlier in this run nor already exists on disk
        count: int = 1
        candidate: str = f"{base}{suffix}{count}{extension}"
        while candidate in used_destinations or os.path.isfile(candidate):
            count += 1
            candidate = f"{base}{suffix}{count}{extension}"
        return candidate

    @handle_error(message="Error while getting queue of files to process")
    def get_queue(
        self,
        dataset_path: str,
        destination_path: str,
        images_per_class_dict: dict[str, int] | None = None
    ) -> list[tuple[str, str, list[ProcessingTechnique]]]:
        """ Get the queue of images to process with their techniques.

        Args:
            dataset_path (str): Path to the dataset
            destination_path (str): Path to the destination dataset
            images_per_class_dict (dict[str, int]): Dictionary mapping class names to desired number of images
                (optional, defaults to empty dictionary)
        Returns:
            list[tuple[str, str, list[ProcessingTechnique]]]: Queue of (source_path, dest_path, techniques) tuples
        """
        # Initializations
        if images_per_class_dict is None:
            images_per_class_dict = {}
        queue: list[tuple[str, str, list[ProcessingTechnique]]] = []
        used_destinations: set[str] = set()

        # Every sub-folder of the dataset is a class; split the target size evenly between them
        classes: tuple[str, ...] = tuple(f for f in os.listdir(dataset_path) if os.path.isdir(f"{dataset_path}/{f}"))
        default_images_per_class: int = self.final_dataset_size // len(classes)

        # Build the queue class by class
        for class_name in classes:
            class_path: str = f"{dataset_path}/{class_name}"
            images: list[str] = os.listdir(class_path)

            # How many extra (augmented) images this class still needs
            target_images: int = images_per_class_dict.get(class_name, default_images_per_class)
            remaining_images: int = target_images - len(images)

            # Original images are copied as-is (empty technique list)
            for img in images:
                files: dict[str, str] = self.get_files_recursively(f"{class_path}/{img}", f"{destination_path}/{class_name}/{img}")
                for path, dest in files.items():
                    queue.append((path, dest, []))

            # Keep sampling source images until the class reaches its target size
            while remaining_images > 0:
                chosen_images: list[str] = random.sample(images, k=min(remaining_images, len(images)))

                # Each sampled image gets a unique destination and its own frozen techniques
                for img in chosen_images:
                    img_destination: str = self._add_suffix(f"{destination_path}/{class_name}/{img}", used_destinations)
                    used_destinations.add(img_destination)
                    img_path: str = f"{class_path}/{img}"

                    # Freeze the random parameters of every technique for this image
                    techniques: list[ProcessingTechnique] = [x.deterministic(use_default=False) for x in self.techniques]

                    # Enqueue every file found under the sampled image path
                    for path, dest in self.get_files_recursively(img_path, img_destination).items():
                        queue.append((path, dest, techniques))

                # Update the remaining images
                remaining_images -= len(chosen_images)

        return queue
