RadGEEToolbox 1.6.7__py3-none-any.whl → 1.6.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -236,60 +236,91 @@ class Sentinel1Collection:
236
236
 
237
237
  @staticmethod
238
238
  def PixelAreaSum(
239
- image, band_name, geometry, threshold=-1, scale=30, maxPixels=1e12
239
+ image, band_name, geometry, threshold=-1, scale=10, maxPixels=1e12
240
240
  ):
241
241
  """
242
- Function to calculate the summation of area for pixels of interest (above a specific threshold) in a geometry
243
- and store the value as image property (matching name of chosen band).
242
+ Calculates the summation of area for pixels of interest (above a specific threshold) in a geometry
243
+ and stores the value as an image property (matching name of chosen band). If multiple band names are provided in a list,
244
+ the function will calculate area for each band in the list and store each as a separate property.
245
+
246
+ NOTE: The resulting value has units of square meters.
244
247
 
245
248
  Args:
246
249
  image (ee.Image): input ee.Image
247
- band_name (string): name of band (string) for calculating area
250
+ band_name (string or list of strings): name of band(s) (string) for calculating area. If providing multiple band names, pass as a list of strings.
248
251
  geometry (ee.Geometry): ee.Geometry object denoting area to clip to for area calculation
249
- threshold (float): integer threshold to specify masking of pixels below threshold (defaults to -1)
250
- scale (int): integer scale of image resolution (meters) (defaults to 30)
252
+ threshold (float): numeric threshold to specify masking of pixels below threshold (defaults to -1). If providing multiple band names, the same threshold will be applied to all bands. Best practice in this case is to mask the bands prior to passing to this function and leave threshold at default of -1.
253
+ scale (int): integer scale of image resolution (meters) (defaults to 10)
251
254
  maxPixels (int): integer denoting maximum number of pixels for calculations
252
255
 
253
256
  Returns:
254
- ee.Image: ee.Image with area calculation stored as property matching name of band
257
+ ee.Image: ee.Image with area calculation in square meters stored as property matching name of band
255
258
  """
259
+ # Ensure band_name is a server-side ee.List for consistent processing. Wrap band_name in a list if it's a single string.
260
+ bands = ee.List(band_name) if isinstance(band_name, list) else ee.List([band_name])
261
+ # Create an image representing the area of each pixel in square meters
256
262
  area_image = ee.Image.pixelArea()
257
- mask = image.select(band_name).gte(threshold)
258
- final = image.addBands(area_image)
259
- stats = (
260
- final.select("area")
261
- .updateMask(mask)
262
- .rename(band_name)
263
- .reduceRegion(
264
- reducer=ee.Reducer.sum(),
265
- geometry=geometry,
266
- scale=scale,
267
- maxPixels=maxPixels,
263
+
264
+ # Function to iterate over each band and calculate area, storing the result as a property on the image
265
+ def calculate_and_set_area(band, img_accumulator):
266
+ # Explicitly cast inputs to expected types
267
+ img_accumulator = ee.Image(img_accumulator)
268
+ band = ee.String(band)
269
+
270
+ # Create a mask from the input image for the current band
271
+ mask = img_accumulator.select(band).gte(threshold)
272
+ # Combine the original image with the area image
273
+ final = img_accumulator.addBands(area_image)
274
+
275
+ # Calculation of area for a given band, utilizing other inputs
276
+ stats = (
277
+ final.select("area").updateMask(mask)
278
+ .rename(band) # renames 'area' to band name like 'ndwi'
279
+ .reduceRegion(
280
+ reducer=ee.Reducer.sum(),
281
+ geometry=geometry,
282
+ scale=scale,
283
+ maxPixels=maxPixels,
284
+ )
268
285
  )
269
- )
270
- return image.set(band_name, stats.get(band_name))
286
+ # Retrieving the area value from the stats dictionary with stats.get(band), as the band name is now the key
287
+ reduced_area = stats.get(band)
288
+ # Checking whether the calculated area is valid and replaces with 0 if not. This avoids breaking the loop for erroneous images.
289
+ area_value = ee.Algorithms.If(reduced_area, reduced_area, 0)
290
+
291
+ # Set the property on the image, named after the band
292
+ return img_accumulator.set(band, area_value)
293
+
294
+ # Call to iterate the calculate_and_set_area function over the list of bands, starting with the original image
295
+ final_image = ee.Image(bands.iterate(calculate_and_set_area, image))
296
+ return final_image
271
297
 
272
298
  def PixelAreaSumCollection(
273
- self, band_name, geometry, threshold=-1, scale=30, maxPixels=1e12
299
+ self, band_name, geometry, threshold=-1, scale=10, maxPixels=1e12, output_type='ImageCollection', area_data_export_path=None
274
300
  ):
275
301
  """
276
- Function to calculate the summation of area for pixels of interest (above a specific threshold)
277
- within a geometry and store the value as image property (matching name of chosen band) for an entire
278
- image collection.
279
- The resulting value has units of square meters.
302
+ Calculates the geodesic summation of area for pixels of interest (above a specific threshold)
303
+ within a geometry and stores the value as an image property (matching name of chosen band) for an entire
304
+ image collection. Optionally exports the area data to a CSV file.
305
+
306
+ NOTE: The resulting value has units of square meters.
280
307
 
281
308
  Args:
282
- band_name (str): name of band (string) for calculating area.
283
- geometry (ee.Geometry): ee.Geometry object denoting area to clip to for area calculation.
284
- threshold (int): integer threshold to specify masking of pixels below threshold (defaults to -1).
285
- scale (int): integer scale of image resolution (meters) (defaults to 30).
286
- maxPixels (int): integer denoting maximum number of pixels for calculations.
309
+ band_name (string or list of strings): name of band(s) (string) for calculating area. If providing multiple band names, pass as a list of strings.
310
+ geometry (ee.Geometry): ee.Geometry object denoting area to clip to for area calculation
311
+ threshold (float): numeric threshold to specify masking of pixels below threshold (defaults to -1). If providing multiple band names, the same threshold will be applied to all bands. Best practice in this case is to mask the bands prior to passing to this function and leave threshold at default of -1.
312
+ scale (int): integer scale of image resolution (meters) (defaults to 10)
313
+ maxPixels (int): integer denoting maximum number of pixels for calculations
314
+ output_type (str): 'ImageCollection' to return an ee.ImageCollection, 'Sentinel1Collection' to return a Sentinel1Collection object (defaults to 'ImageCollection')
315
+ area_data_export_path (str, optional): If provided, the function will save the resulting area data to a CSV file at the specified path.
287
316
 
288
317
  Returns:
289
- ee.Image: Image with area calculation stored as property matching name of band.
318
+ ee.ImageCollection or Sentinel1Collection: Image collection of images with area calculation (square meters) stored as property matching name of band. Type of output depends on output_type argument.
290
319
  """
320
+ # If the area calculation has not been computed for this Sentinel1Collection instance, the area will be calculated for the provided bands
291
321
  if self._PixelAreaSumCollection is None:
292
322
  collection = self.collection
323
+ # Area calculation for each image in the collection, using the PixelAreaSum function
293
324
  AreaCollection = collection.map(
294
325
  lambda image: Sentinel1Collection.PixelAreaSum(
295
326
  image,
@@ -300,8 +331,38 @@ class Sentinel1Collection:
300
331
  maxPixels=maxPixels,
301
332
  )
302
333
  )
334
+ # Storing the result in the instance variable to avoid redundant calculations
303
335
  self._PixelAreaSumCollection = AreaCollection
304
- return self._PixelAreaSumCollection
336
+
337
+ # If an export path is provided, the area data will be exported to a CSV file
338
+ if area_data_export_path:
339
+ Sentinel1Collection(collection=self._PixelAreaSumCollection).ExportProperties(property_names=band_name, file_path=area_data_export_path+'.csv')
340
+
341
+ # Returning the result in the desired format based on output_type argument or raising an error for invalid input
342
+ if output_type == 'ImageCollection':
343
+ return self._PixelAreaSumCollection
344
+ elif output_type == 'Sentinel1Collection':
345
+ return Sentinel1Collection(collection=self._PixelAreaSumCollection)
346
+ else:
347
+ raise ValueError("output_type must be 'ImageCollection' or 'Sentinel1Collection'")
348
+
349
+ def merge(self, other):
350
+ """
351
+ Merges the current Sentinel1Collection with another Sentinel1Collection, where images/bands with the same date are combined into a single multiband image.
352
+
353
+ Args:
354
+ other (Sentinel1Collection): Another Sentinel1Collection to merge with current collection.
355
+
356
+ Returns:
357
+ Sentinel1Collection: A new Sentinel1Collection containing images from both collections.
358
+ """
359
+ # Checking if 'other' is an instance of Sentinel1Collection
360
+ if not isinstance(other, Sentinel1Collection):
361
+ raise ValueError("The 'other' parameter must be an instance of Sentinel1Collection.")
362
+
363
+ # Merging the collections using the .combine() method
364
+ merged_collection = self.collection.combine(other.collection)
365
+ return Sentinel1Collection(collection=merged_collection)
305
366
 
306
367
  @staticmethod
307
368
  def multilook_fn(image, looks):
@@ -620,6 +681,60 @@ class Sentinel1Collection:
620
681
  dates = self._dates_list.getInfo()
621
682
  self._dates = dates
622
683
  return self._dates
684
+
685
+ def ExportProperties(self, property_names, file_path=None):
686
+ """
687
+ Fetches specified properties from each image in the collection, returns them as a pandas DataFrame, and optionally saves the results to a CSV file.
688
+
689
+ Args:
690
+ property_names (list or str): A property name or list of property names to retrieve. The 'Date_Filter' property is always included to provide temporal context.
691
+ file_path (str, optional): If provided, the function will save the resulting DataFrame to a CSV file at this path. Defaults to None.
692
+
693
+ Returns:
694
+ pd.DataFrame: A pandas DataFrame containing the requested properties for each image, sorted chronologically by 'Date_Filter'.
695
+ """
696
+ # Ensure property_names is a list for consistent processing
697
+ if isinstance(property_names, str):
698
+ property_names = [property_names]
699
+
700
+ # Ensure properties are included without duplication, including 'Date_Filter'
701
+ all_properties_to_fetch = list(set(['Date_Filter'] + property_names))
702
+
703
+ # Defining the helper function to create features with specified properties
704
+ def create_feature_with_properties(image):
705
+ """A function to map over the collection and store the image properties as an ee.Feature.
706
+ Args:
707
+ image (ee.Image): An image from the collection.
708
+ Returns:
709
+ ee.Feature: A feature containing the specified properties from the image.
710
+ """
711
+ properties = image.toDictionary(all_properties_to_fetch)
712
+ return ee.Feature(None, properties)
713
+
714
+ # Map the feature creation function over the server-side collection.
715
+ # The result is an ee.FeatureCollection where each feature holds the properties of one image.
716
+ mapped_collection = self.collection.map(create_feature_with_properties)
717
+ # Explicitly cast to ee.FeatureCollection for clarity
718
+ feature_collection = ee.FeatureCollection(mapped_collection)
719
+
720
+ # Use the existing ee_to_df static method. This performs the single .getInfo() call
721
+ # and converts the structured result directly to a pandas DataFrame.
722
+ df = Sentinel1Collection.ee_to_df(feature_collection, columns=all_properties_to_fetch)
723
+
724
+ # Sort by date for a clean, chronological output.
725
+ if 'Date_Filter' in df.columns:
726
+ df = df.sort_values(by='Date_Filter').reset_index(drop=True)
727
+
728
+ # Check condition for saving to CSV
729
+ if file_path:
730
+ # Check whether file_path ends with .csv, if not, append it
731
+ if not file_path.lower().endswith('.csv'):
732
+ file_path += '.csv'
733
+ # Save DataFrame to CSV
734
+ df.to_csv(file_path, index=True)
735
+ print(f"Properties saved to {file_path}")
736
+
737
+ return df
623
738
 
624
739
  def get_filtered_collection(self):
625
740
  """
@@ -759,6 +874,37 @@ class Sentinel1Collection:
759
874
  self._min = col
760
875
  return self._min
761
876
 
877
+ def binary_mask(self, threshold=None, band_name=None):
878
+ """
879
+ Creates a binary mask (value of 1 for pixels above set threshold and value of 0 for all other pixels) of the Sentinel1Collection image collection based on a specified band.
880
+ If a singleband image is provided, the band name is automatically determined.
881
+ If multiple bands are available, the user must specify the band name to use for masking.
882
+
883
+ Args:
884
+ band_name (str, optional): The name of the band to use for masking. Defaults to None.
885
+
886
+ Returns:
887
+ Sentinel1Collection: Sentinel1Collection singleband image collection with binary masks applied.
888
+ """
889
+ if self.collection.size().eq(0).getInfo():
890
+ raise ValueError("The collection is empty. Cannot create a binary mask.")
891
+ if band_name is None:
892
+ first_image = self.collection.first()
893
+ band_names = first_image.bandNames()
894
+ if band_names.size().getInfo() == 0:
895
+ raise ValueError("No bands available in the collection.")
896
+ if band_names.size().getInfo() > 1:
897
+ raise ValueError("Multiple bands available, please specify a band name.")
898
+ else:
899
+ band_name = band_names.get(0).getInfo()
900
+ if threshold is None:
901
+ raise ValueError("Threshold must be specified for binary masking.")
902
+
903
+ col = self.collection.map(
904
+ lambda image: image.select(band_name).gte(threshold).rename(band_name)
905
+ )
906
+ return Sentinel1Collection(collection=col)
907
+
762
908
  def mask_to_polygon(self, polygon):
763
909
  """
764
910
  Function to mask Sentinel1Collection image collection by a polygon (ee.Geometry), where pixels outside the polygon are masked out.
@@ -1046,7 +1192,8 @@ class Sentinel1Collection:
1046
1192
  to_pandas=False,
1047
1193
  **kwargs,
1048
1194
  ):
1049
- """Extracts transect from an image. Adapted from the geemap package (https://geemap.org/common/#geemap.common.extract_transect). Exists as an alternative to RadGEEToolbox 'transect' function.
1195
+ """
1196
+ Extracts transect from an image. Adapted from the geemap package (https://geemap.org/common/#geemap.common.extract_transect).
1050
1197
 
1051
1198
  Args:
1052
1199
  image (ee.Image): The image to extract transect from.
@@ -1120,7 +1267,8 @@ class Sentinel1Collection:
1120
1267
  dist_interval=10,
1121
1268
  to_pandas=True,
1122
1269
  ):
1123
- """Computes and stores the values along a transect for each line in a list of lines. Builds off of the extract_transect function from the geemap package
1270
+ """
1271
+ Computes and stores the values along a transect for each line in a list of lines. Builds off of the extract_transect function from the geemap package
1124
1272
 where checks are run to ensure that the reducer column is present in the transect data. If the reducer column is not present, a column of NaNs is created.
1125
1273
  An ee reducer is used to aggregate the values along the transect, depending on the number of segments or distance interval specified. Defaults to 'mean' reducer.
1126
1274
 
@@ -1195,52 +1343,201 @@ class Sentinel1Collection:
1195
1343
  self,
1196
1344
  lines,
1197
1345
  line_names,
1198
- save_folder_path,
1199
1346
  reducer="mean",
1347
+ dist_interval= 10,
1200
1348
  n_segments=None,
1201
- dist_interval=10,
1202
- to_pandas=True,
1349
+ scale=10,
1350
+ processing_mode='aggregated',
1351
+ save_folder_path=None,
1352
+ sampling_method='line',
1353
+ point_buffer_radius=5
1203
1354
  ):
1204
- """Computes and stores the values along a transect for each line in a list of lines for each image in a Sentinel1Collection image collection, then saves the data for each image to a csv file. Builds off of the extract_transect function from the geemap package
1205
- where checks are ran to ensure that the reducer column is present in the transect data. If the reducer column is not present, a column of NaNs is created.
1206
- An ee reducer is used to aggregate the values along the transect, depending on the number of segments or distance interval specified. Defaults to 'mean' reducer.
1207
- Naming conventions for the csv files follows as: "image-date_line-name.csv"
1355
+ """
1356
+ Computes and returns pixel values along transects for each image in a collection.
1208
1357
 
1209
- Args:
1210
- lines (list): List of ee.Geometry.LineString objects.
1211
- line_names (list of strings): List of line string names.
1212
- save_folder_path (str): The path to the folder where the csv files will be saved.
1213
- reducer (str): The ee reducer to use. Defaults to 'mean'.
1214
- n_segments (int): The number of segments that the LineString will be split into. Defaults to None.
1215
- dist_interval (float): The distance interval used for splitting the LineString. If specified, the n_segments parameter will be ignored. Defaults to 10.
1216
- to_pandas (bool): Whether to convert the result to a pandas dataframe. Defaults to True.
1358
+ This iterative function generates time-series data along one or more lines, and
1359
+ supports two different geometric sampling methods ('line' and 'buffered_point')
1360
+ for maximum flexibility and performance.
1217
1361
 
1218
- Raises:
1219
- Exception: If the program fails to compute.
1362
+ There are two processing modes available, aggregated and iterative:
1363
+ - 'aggregated' (default; suggested): Fast, server-side processing. Fetches all results
1364
+ in a single request. Highly recommended. Returns a dictionary of pandas DataFrames.
1365
+ - 'iterative': Slower, client-side loop that processes one image at a time.
1366
+ Kept for backward compatibility (effectively deprecated). Returns None and saves individual CSVs.
1367
+ This method is not recommended unless absolutely necessary, as it is less efficient and may be subject to client-side timeouts.
1368
+
1369
+ Args:
1370
+ lines (list): A list of one or more ee.Geometry.LineString objects that
1371
+ define the transects.
1372
+ line_names (list): A list of string names for each transect. The length
1373
+ of this list must match the length of the `lines` list.
1374
+ reducer (str, optional): The name of the ee.Reducer to apply at each
1375
+ transect point (e.g., 'mean', 'median', 'first'). Defaults to 'mean'.
1376
+ dist_interval (float, optional): The distance interval in meters for
1377
+ sampling points along each transect. Will be overridden if `n_segments` is provided.
1378
+ Defaults to 10. Recommended to increase this value when using the
1379
+ 'line' processing method, or else you may get blank rows.
1380
+ n_segments (int, optional): The number of equal-length segments to split
1381
+ each transect line into for sampling. This parameter overrides `dist_interval`.
1382
+ Defaults to None.
1383
+ scale (int, optional): The nominal scale in meters for the reduction,
1384
+ which should typically match the pixel resolution of the imagery.
1385
+ Defaults to 10.
1386
+ processing_mode (str, optional): The method for processing the collection.
1387
+ - 'aggregated' (default): Fast, server-side processing. Fetches all
1388
+ results in a single request. Highly recommended. Returns a dictionary
1389
+ of pandas DataFrames.
1390
+ - 'iterative': Slower, client-side loop that processes one image at a
1391
+ time. Kept for backward compatibility. Returns None and saves
1392
+ individual CSVs.
1393
+ save_folder_path (str, optional): If provided, the function will save the
1394
+ resulting transect data to CSV files. The behavior depends on the
1395
+ `processing_mode`:
1396
+ - In 'aggregated' mode, one CSV is saved for each transect,
1397
+ containing all dates. (e.g., 'MyTransect_transects.csv').
1398
+ - In 'iterative' mode, one CSV is saved for each date,
1399
+ containing all transects. (e.g., '2022-06-15_transects.csv').
1400
+ sampling_method (str, optional): The geometric method used for sampling.
1401
+ - 'line' (default): Reduces all pixels intersecting each small line
1402
+ segment. This can be unreliable and produce blank rows if
1403
+ `dist_interval` is too small relative to the `scale`.
1404
+ - 'buffered_point': Reduces all pixels within a buffer around the
1405
+ midpoint of each line segment. This method is more robust and
1406
+ reliably avoids blank rows, but may not reduce all pixels along a line segment.
1407
+ point_buffer_radius (int, optional): The radius in meters for the buffer
1408
+ when `sampling_method` is 'buffered_point'. Defaults to 5.
1220
1409
 
1221
1410
  Returns:
1222
- csv file: file for each image with an organized list of values along the transect(s)
1411
+ dict or None:
1412
+ - If `processing_mode` is 'aggregated', returns a dictionary where each
1413
+ key is a transect name and each value is a pandas DataFrame. In the
1414
+ DataFrame, the index is the distance along the transect and each
1415
+ column represents an image date. Optionally saves CSV files if
1416
+ `save_folder_path` is provided.
1417
+ - If `processing_mode` is 'iterative', returns None as it saves
1418
+ files directly.
1419
+
1420
+ Raises:
1421
+ ValueError: If `lines` and `line_names` have different lengths, or if
1422
+ an unknown reducer or processing mode is specified.
1223
1423
  """
1224
- image_collection = self
1225
- image_collection_dates = self.dates
1226
- for i, date in enumerate(image_collection_dates):
1424
+ # Validating inputs
1425
+ if len(lines) != len(line_names):
1426
+ raise ValueError("'lines' and 'line_names' must have the same number of elements.")
1427
+ ### Current, server-side processing method ###
1428
+ if processing_mode == 'aggregated':
1429
+ # Validating reducer type
1227
1430
  try:
1228
- print(f"Processing image {i+1}/{len(image_collection_dates)}: {date}")
1229
- image = image_collection.image_grab(i)
1230
- transects_df = Sentinel1Collection.transect(
1231
- image,
1232
- lines,
1233
- line_names,
1234
- reducer=reducer,
1235
- n_segments=n_segments,
1236
- dist_interval=dist_interval,
1237
- to_pandas=to_pandas,
1238
- )
1239
- image_id = date
1240
- transects_df.to_csv(f"{save_folder_path}{image_id}_transects.csv")
1241
- print(f"{image_id}_transects saved to csv")
1242
- except Exception as e:
1243
- print(f"An error occurred while processing image {i+1}: {e}")
1431
+ ee_reducer = getattr(ee.Reducer, reducer)()
1432
+ except AttributeError:
1433
+ raise ValueError(f"Unknown reducer: '{reducer}'.")
1434
+ ### Function to extract transects for a single image
1435
+ def get_transects_for_image(image):
1436
+ image_date = image.get('Date_Filter')
1437
+ # Initialize an empty list to hold all transect FeatureCollections
1438
+ all_transects_for_image = ee.List([])
1439
+ # Looping through each line and processing
1440
+ for i, line in enumerate(lines):
1441
+ # Index line and name
1442
+ line_name = line_names[i]
1443
+ # Determine maxError based on image projection, used for geometry operations
1444
+ maxError = image.projection().nominalScale().divide(5)
1445
+ # Calculate effective distance interval
1446
+ length = line.length(maxError) # using maxError here ensures consistency with cutLines
1447
+ # Determine effective distance interval based on n_segments or dist_interval
1448
+ effective_dist_interval = ee.Algorithms.If(
1449
+ n_segments,
1450
+ length.divide(n_segments),
1451
+ dist_interval or 30 # Defaults to 30 if both are None
1452
+ )
1453
+ # Generate distances along the line(s) for segmentation
1454
+ distances = ee.List.sequence(0, length, effective_dist_interval)
1455
+ # Segmenting the line into smaller lines at the specified distances
1456
+ cut_lines_geoms = line.cutLines(distances, maxError).geometries()
1457
+ # Function to create features with distance attributes
1458
+ # Adjusted to ensure consistent return types
1459
+ def set_dist_attr(l):
1460
+ # l is a list: [geometry, distance]
1461
+ # Extracting geometry portion of line
1462
+ geom_segment = ee.Geometry(ee.List(l).get(0))
1463
+ # Extracting distance value for attribute
1464
+ distance = ee.Number(ee.List(l).get(1))
1465
+ ### Determine final geometry based on sampling method
1466
+ # If the sampling method is 'buffered_point',
1467
+ # create a buffered point feature at the centroid of each segment,
1468
+ # otherwise create a line feature
1469
+ final_feature = ee.Algorithms.If(
1470
+ ee.String(sampling_method).equals('buffered_point'),
1471
+ # True Case: Create the buffered point feature
1472
+ ee.Feature(
1473
+ geom_segment.centroid(maxError).buffer(point_buffer_radius),
1474
+ {'distance': distance}
1475
+ ),
1476
+ # False Case: Create the line segment feature
1477
+ ee.Feature(geom_segment, {'distance': distance})
1478
+ )
1479
+ # Return either the line segment feature or the buffered point feature
1480
+ return final_feature
1481
+ # Creating a FeatureCollection of the cut lines with distance attributes
1482
+ # Using map to apply the set_dist_attr function to each cut line geometry
1483
+ line_features = ee.FeatureCollection(cut_lines_geoms.zip(distances).map(set_dist_attr))
1484
+ # Reducing the image over the line features to get transect values
1485
+ transect_fc = image.reduceRegions(
1486
+ collection=line_features, reducer=ee_reducer, scale=scale
1487
+ )
1488
+ # Adding image date and line name properties to each feature
1489
+ def set_props(feature):
1490
+ return feature.set({'image_date': image_date, 'transect_name': line_name})
1491
+ # Append to the list of all transects for this image
1492
+ all_transects_for_image = all_transects_for_image.add(transect_fc.map(set_props))
1493
+ # Combine all transect FeatureCollections into a single FeatureCollection and flatten
1494
+ # Flatten is used to merge the list of FeatureCollections into one
1495
+ return ee.FeatureCollection(all_transects_for_image).flatten()
1496
+ # Map the function over the entire image collection and flatten the results
1497
+ results_fc = ee.FeatureCollection(self.collection.map(get_transects_for_image)).flatten()
1498
+ # Convert the results to a pandas DataFrame
1499
+ df = Sentinel1Collection.ee_to_df(results_fc, remove_geom=True)
1500
+ # Check if the DataFrame is empty
1501
+ if df.empty:
1502
+ print("Warning: No transect data was generated.")
1503
+ return {}
1504
+ # Initialize dictionary to hold output DataFrames for each transect
1505
+ output_dfs = {}
1506
+ # Loop through each unique transect name and create a pivot table
1507
+ for name in sorted(df['transect_name'].unique()):
1508
+ transect_df = df[df['transect_name'] == name]
1509
+ pivot_df = transect_df.pivot(index='distance', columns='image_date', values=reducer)
1510
+ pivot_df.columns.name = 'Date'
1511
+ output_dfs[name] = pivot_df
1512
+ # Optionally save each transect DataFrame to CSV
1513
+ if save_folder_path:
1514
+ for transect_name, transect_df in output_dfs.items():
1515
+ safe_filename = "".join(x for x in transect_name if x.isalnum() or x in "._-")
1516
+ file_path = f"{save_folder_path}{safe_filename}_transects.csv"
1517
+ transect_df.to_csv(file_path)
1518
+ print(f"Saved transect data to {file_path}")
1519
+
1520
+ return output_dfs
1521
+
1522
+ ### old, deprecated iterative client-side processing method ###
1523
+ elif processing_mode == 'iterative':
1524
+ if not save_folder_path:
1525
+ raise ValueError("`save_folder_path` is required for 'iterative' processing mode.")
1526
+
1527
+ image_collection_dates = self.dates
1528
+ for i, date in enumerate(image_collection_dates):
1529
+ try:
1530
+ print(f"Processing image {i+1}/{len(image_collection_dates)}: {date}")
1531
+ image = self.image_grab(i)
1532
+ transects_df = Sentinel1Collection.transect(
1533
+ image, lines, line_names, reducer, n_segments, dist_interval, to_pandas=True
1534
+ )
1535
+ transects_df.to_csv(f"{save_folder_path}{date}_transects.csv")
1536
+ print(f"{date}_transects saved to csv")
1537
+ except Exception as e:
1538
+ print(f"An error occurred while processing image {i+1}: {e}")
1539
+ else:
1540
+ raise ValueError("`processing_mode` must be 'iterative' or 'aggregated'.")
1244
1541
 
1245
1542
  @staticmethod
1246
1543
  def extract_zonal_stats_from_buffer(
@@ -1248,42 +1545,40 @@ class Sentinel1Collection:
1248
1545
  coordinates,
1249
1546
  buffer_size=1,
1250
1547
  reducer_type="mean",
1251
- scale=40,
1548
+ scale=10,
1252
1549
  tileScale=1,
1253
1550
  coordinate_names=None,
1254
1551
  ):
1255
1552
  """
1256
- Function to extract spatial statistics from an image for a list of coordinates, providing individual statistics for each location.
1553
+ Function to extract spatial statistics from an image for a list or single set of (long, lat) coordinates, providing individual statistics for each location.
1257
1554
  A radial buffer is applied around each coordinate to extract the statistics, which defaults to 1 meter.
1258
1555
  The function returns a pandas DataFrame with the statistics for each coordinate.
1259
1556
 
1557
+ NOTE: Be sure the coordinates are provided as longitude, latitude (x, y) tuples!
1558
+
1260
1559
  Args:
1261
- image (ee.Image): The image from which to extract the statistics. Must be a singleband image or else resulting values will all be zero!
1262
- coordinates (list): Single tuple or list of tuples with the decimal degrees coordinates in the format of (longitude, latitude) for which to extract the statistics. NOTE the format needs to be [(x1, y1), (x2, y2), ...].
1263
- buffer_size (int, optional): The radial buffer size around the coordinates in meters. Defaults to 1.
1264
- reducer_type (str, optional): The reducer type to use. Defaults to 'mean'. Options are 'mean', 'median', 'min', and 'max'.
1265
- scale (int, optional): The scale (pixel size) to use in meters. Defaults to 40.
1266
- tileScale (int, optional): The tile scale to use. Defaults to 1.
1267
- coordinate_names (list, optional): A list of strings with the names of the coordinates. Defaults to None.
1560
+ image (ee.Image): The image from which to extract statistics. Should be single-band.
1561
+ coordinates (list or tuple): A single (lon, lat) tuple or a list of (lon, lat) tuples.
1562
+ buffer_size (int, optional): The radial buffer size in meters. Defaults to 1.
1563
+ reducer_type (str, optional): The ee.Reducer to use ('mean', 'median', 'min', etc.). Defaults to 'mean'.
1564
+ scale (int, optional): The scale in meters for the reduction. Defaults to 10.
1565
+ tileScale (int, optional): The tile scale factor. Defaults to 1.
1566
+ coordinate_names (list, optional): A list of names for the coordinates.
1268
1567
 
1269
1568
  Returns:
1270
- pd.DataFrame: A pandas DataFrame with the statistics for each coordinate, each column name corresponds to the name of the coordinate feature (which may be blank if no names are supplied).
1569
+ pd.DataFrame: A pandas DataFrame with the image's 'Date_Filter' as the index and a
1570
+ column for each coordinate location.
1271
1571
  """
1272
-
1273
- # Check if coordinates is a single tuple and convert it to a list of tuples if necessary
1274
1572
  if isinstance(coordinates, tuple) and len(coordinates) == 2:
1275
1573
  coordinates = [coordinates]
1276
1574
  elif not (
1277
1575
  isinstance(coordinates, list)
1278
- and all(
1279
- isinstance(coord, tuple) and len(coord) == 2 for coord in coordinates
1280
- )
1576
+ and all(isinstance(coord, tuple) and len(coord) == 2 for coord in coordinates)
1281
1577
  ):
1282
1578
  raise ValueError(
1283
- "Coordinates must be a list of tuples with two elements each (latitude, longitude)."
1579
+ "Coordinates must be a list of tuples with two elements each (longitude, latitude)."
1284
1580
  )
1285
1581
 
1286
- # Check if coordinate_names is a list of strings
1287
1582
  if coordinate_names is not None:
1288
1583
  if not isinstance(coordinate_names, list) or not all(
1289
1584
  isinstance(name, str) for name in coordinate_names
@@ -1296,146 +1591,184 @@ class Sentinel1Collection:
1296
1591
  else:
1297
1592
  coordinate_names = [f"Location {i+1}" for i in range(len(coordinates))]
1298
1593
 
1299
- # Check if the image is a singleband image
1300
- def check_singleband(image):
1301
- band_count = image.bandNames().size()
1302
- return ee.Algorithms.If(band_count.eq(1), image, ee.Image.constant(0))
1594
+ image_date = image.get('Date_Filter')
1303
1595
 
1304
- # Check if the image is a singleband image
1305
- image = ee.Image(check_singleband(image))
1306
-
1307
- # Convert coordinates to ee.Geometry.Point, buffer them, and add label/name to feature
1308
1596
  points = [
1309
1597
  ee.Feature(
1310
- ee.Geometry.Point([coord[0], coord[1]]).buffer(buffer_size),
1311
- {"name": str(coordinate_names[i])},
1598
+ ee.Geometry.Point(coord).buffer(buffer_size),
1599
+ {"location_name": str(name)},
1312
1600
  )
1313
- for i, coord in enumerate(coordinates)
1601
+ for coord, name in zip(coordinates, coordinate_names)
1314
1602
  ]
1315
- # Create a feature collection from the buffered points
1316
1603
  features = ee.FeatureCollection(points)
1317
- # Reduce the image to the buffered points - handle different reducer types
1318
- if reducer_type == "mean":
1319
- img_stats = image.reduceRegions(
1320
- collection=features,
1321
- reducer=ee.Reducer.mean(),
1322
- scale=scale,
1323
- tileScale=tileScale,
1324
- )
1325
- mean_values = img_stats.getInfo()
1326
- means = []
1327
- names = []
1328
- for feature in mean_values["features"]:
1329
- names.append(feature["properties"]["name"])
1330
- means.append(feature["properties"]["mean"])
1331
- organized_values = pd.DataFrame([means], columns=names)
1332
- elif reducer_type == "median":
1333
- img_stats = image.reduceRegions(
1334
- collection=features,
1335
- reducer=ee.Reducer.median(),
1336
- scale=scale,
1337
- tileScale=tileScale,
1338
- )
1339
- median_values = img_stats.getInfo()
1340
- medians = []
1341
- names = []
1342
- for feature in median_values["features"]:
1343
- names.append(feature["properties"]["name"])
1344
- medians.append(feature["properties"]["median"])
1345
- organized_values = pd.DataFrame([medians], columns=names)
1346
- elif reducer_type == "min":
1347
- img_stats = image.reduceRegions(
1348
- collection=features,
1349
- reducer=ee.Reducer.min(),
1350
- scale=scale,
1351
- tileScale=tileScale,
1352
- )
1353
- min_values = img_stats.getInfo()
1354
- mins = []
1355
- names = []
1356
- for feature in min_values["features"]:
1357
- names.append(feature["properties"]["name"])
1358
- mins.append(feature["properties"]["min"])
1359
- organized_values = pd.DataFrame([mins], columns=names)
1360
- elif reducer_type == "max":
1361
- img_stats = image.reduceRegions(
1362
- collection=features,
1363
- reducer=ee.Reducer.max(),
1364
- scale=scale,
1365
- tileScale=tileScale,
1366
- )
1367
- max_values = img_stats.getInfo()
1368
- maxs = []
1369
- names = []
1370
- for feature in max_values["features"]:
1371
- names.append(feature["properties"]["name"])
1372
- maxs.append(feature["properties"]["max"])
1373
- organized_values = pd.DataFrame([maxs], columns=names)
1374
- else:
1375
- raise ValueError(
1376
- "reducer_type must be one of 'mean', 'median', 'min', or 'max'."
1377
- )
1378
- return organized_values
1604
+
1605
+ try:
1606
+ reducer = getattr(ee.Reducer, reducer_type)()
1607
+ except AttributeError:
1608
+ raise ValueError(f"Unknown reducer_type: '{reducer_type}'.")
1609
+
1610
+ stats_fc = image.reduceRegions(
1611
+ collection=features,
1612
+ reducer=reducer,
1613
+ scale=scale,
1614
+ tileScale=tileScale,
1615
+ )
1616
+
1617
+ df = Sentinel1Collection.ee_to_df(stats_fc, remove_geom=True)
1618
+
1619
+ if df.empty:
1620
+ print("Warning: No results returned. The points may not intersect the image.")
1621
+ empty_df = pd.DataFrame(columns=coordinate_names)
1622
+ empty_df.index.name = 'Date'
1623
+ return empty_df
1624
+
1625
+ if reducer_type not in df.columns:
1626
+ print(f"Warning: Reducer type '{reducer_type}' not found in results. Returning raw data.")
1627
+ return df
1628
+
1629
+ pivot_df = df.pivot(columns='location_name', values=reducer_type)
1630
+ pivot_df['Date'] = image_date.getInfo() # .getInfo() is needed here as it's a server object
1631
+ pivot_df = pivot_df.set_index('Date')
1632
+ return pivot_df
1379
1633
 
1380
1634
  def iterate_zonal_stats(
1381
1635
  self,
1382
- coordinates,
1383
- buffer_size=1,
1636
+ geometries,
1384
1637
  reducer_type="mean",
1385
- scale=40,
1638
+ scale=10,
1639
+ geometry_names=None,
1640
+ buffer_size=1,
1386
1641
  tileScale=1,
1387
- coordinate_names=None,
1388
- file_path=None,
1389
1642
  dates=None,
1643
+ file_path=None
1390
1644
  ):
1391
1645
  """
1392
- Function to iterate over a collection of images and extract spatial statistics for a list of coordinates (defaults to mean). Individual statistics are provided for each location.
1393
- A radial buffer is applied around each coordinate to extract the statistics, which defaults to 1 meter.
1646
+ Iterates over a collection of images and extracts spatial statistics (defaults to mean) for a given list of geometries or coordinates. Individual statistics are calculated for each geometry or coordinate provided.
1647
+ When coordinates are provided, a radial buffer is applied around each coordinate to extract the statistics, where the size of the buffer is determined by the buffer_size argument (defaults to 1 meter).
1394
1648
  The function returns a pandas DataFrame with the statistics for each coordinate and date, or optionally exports the data to a table in .csv format.
1395
1649
 
1396
- NOTE: The input RadGEEToolbox class object but be a collection of singleband images or else resulting values will all be zero!
1397
-
1398
1650
  Args:
1399
- coordinates (list): Single tuple or a list of tuples with the coordinates as decimal degrees in the format of (longitude, latitude) for which to extract the statistics. NOTE the format needs to be [(x1, y1), (x2, y2), ...].
1400
- buffer_size (int, optional): The radial buffer size in meters around the coordinates. Defaults to 1.
1401
- reducer_type (str, optional): The reducer type to use. Defaults to 'mean'. Options are 'mean', 'median', 'min', and 'max'.
1402
- scale (int, optional): The scale (pixel size) to use in meters. Defaults to 40.
1403
- tileScale (int, optional): The tile scale to use. Defaults to 1.
1404
- coordinate_names (list, optional): A list of strings with the names of the coordinates. Defaults to None.
1405
- file_path (str, optional): The file path to export the data to. Defaults to None. Ensure ".csv" is NOT included in the file name path.
1406
- dates (list, optional): A list of dates for which to extract the statistics. Defaults to None.
1651
+ geometries (ee.Geometry, ee.Feature, ee.FeatureCollection, list, or tuple): Input geometries for which to extract statistics. Can be a single ee.Geometry, an ee.Feature, an ee.FeatureCollection, a list of (lon, lat) tuples, or a list of ee.Geometry objects. Be careful to NOT provide coordinates as (lat, lon)!
1652
+ reducer_type (str, optional): The ee.Reducer to use, e.g., 'mean', 'median', 'max', 'sum'. Defaults to 'mean'. Any ee.Reducer method can be used.
1653
+ scale (int, optional): Pixel scale in meters for the reduction. Defaults to 10.
1654
+ geometry_names (list, optional): A list of string names for the geometries. If provided, must match the number of geometries. Defaults to None.
1655
+ buffer_size (int, optional): Radial buffer in meters around coordinates. Defaults to 1.
1656
+ tileScale (int, optional): A scaling factor to reduce aggregation tile size. Defaults to 1.
1657
+ dates (list, optional): A list of date strings ('YYYY-MM-DD') for filtering the collection, such that only images from these dates are included for zonal statistic retrieval. Defaults to None, which uses all dates in the collection.
1658
+ file_path (str, optional): File path to save the output CSV.
1407
1659
 
1408
1660
  Returns:
1409
- pd.DataFrame: A pandas DataFrame with the statistics for each coordinate and date, each row corresponds to a date and each column to a coordinate.
1410
- .csv file: Optionally exports the data to a table in .csv format. If file_path is None, the function returns the DataFrame - otherwise the function will only export the csv file.
1411
- """
1412
- img_collection = self
1413
- # Create empty DataFrame to accumulate results
1414
- accumulated_df = pd.DataFrame()
1415
- # Check if dates is None, if not use the dates provided
1416
- if dates is None:
1417
- dates = img_collection.dates
1418
- else:
1419
- dates = dates
1420
- # Iterate over the dates and extract the zonal statistics for each date
1421
- for date in dates:
1422
- image = img_collection.collection.filter(
1423
- ee.Filter.eq("Date_Filter", date)
1424
- ).first()
1425
- single_df = Sentinel1Collection.extract_zonal_stats_from_buffer(
1426
- image,
1427
- coordinates,
1428
- buffer_size=buffer_size,
1429
- reducer_type=reducer_type,
1430
- scale=scale,
1431
- tileScale=tileScale,
1432
- coordinate_names=coordinate_names,
1661
+ pd.DataFrame or None: A pandas DataFrame with dates as the index and coordinate names
1662
+ as columns. Returns None if using 'iterative' mode with file_path.
1663
+
1664
+ Raises:
1665
+ ValueError: If input parameters are invalid.
1666
+ TypeError: If geometries input type is unsupported.
1667
+ """
1668
+ img_collection_obj = self
1669
+ # Filter collection by dates if provided
1670
+ if dates:
1671
+ img_collection_obj = Sentinel1Collection(
1672
+ collection=self.collection.filter(ee.Filter.inList('Date_Filter', dates))
1433
1673
  )
1434
- single_df["Date"] = date
1435
- single_df.set_index("Date", inplace=True)
1436
- accumulated_df = pd.concat([accumulated_df, single_df])
1437
- # Return the DataFrame or export the data to a .csv file
1438
- if file_path is None:
1439
- return accumulated_df
1674
+
1675
+ # Initialize variables
1676
+ features = None
1677
+ validated_coordinates = []
1678
+
1679
+ # Function to standardize feature names if no names are provided
1680
+ def set_standard_name(feature):
1681
+ has_geo_name = feature.get('geo_name')
1682
+ has_name = feature.get('name')
1683
+ has_index = feature.get('system:index')
1684
+ new_name = ee.Algorithms.If(
1685
+ has_geo_name, has_geo_name,
1686
+ ee.Algorithms.If(has_name, has_name,
1687
+ ee.Algorithms.If(has_index, has_index, 'unnamed_geometry')))
1688
+ return feature.set({'geo_name': new_name})
1689
+
1690
+ if isinstance(geometries, (ee.FeatureCollection, ee.Feature)):
1691
+ features = ee.FeatureCollection(geometries)
1692
+ if geometry_names:
1693
+ print("Warning: 'geometry_names' are ignored when the input is an ee.Feature or ee.FeatureCollection.")
1694
+
1695
+ elif isinstance(geometries, ee.Geometry):
1696
+ name = geometry_names[0] if (geometry_names and geometry_names[0]) else 'unnamed_geometry'
1697
+ features = ee.FeatureCollection([ee.Feature(geometries).set('geo_name', name)])
1698
+
1699
+ elif isinstance(geometries, list):
1700
+ if not geometries: # Handle empty list case
1701
+ raise ValueError("'geometries' list cannot be empty.")
1702
+
1703
+ # Case: List of coordinates
1704
+ if all(isinstance(i, tuple) for i in geometries):
1705
+ validated_coordinates = geometries
1706
+ if geometry_names is None:
1707
+ geometry_names = [f"Location_{i+1}" for i in range(len(validated_coordinates))]
1708
+ elif len(geometry_names) != len(validated_coordinates):
1709
+ raise ValueError("geometry_names must have the same length as the coordinates list.")
1710
+ points = [
1711
+ ee.Feature(ee.Geometry.Point(coord).buffer(buffer_size), {'geo_name': str(name)})
1712
+ for coord, name in zip(validated_coordinates, geometry_names)
1713
+ ]
1714
+ features = ee.FeatureCollection(points)
1715
+
1716
+ # Case: List of Geometries
1717
+ elif all(isinstance(i, ee.Geometry) for i in geometries):
1718
+ if geometry_names is None:
1719
+ geometry_names = [f"Geometry_{i+1}" for i in range(len(geometries))]
1720
+ elif len(geometry_names) != len(geometries):
1721
+ raise ValueError("geometry_names must have the same length as the geometries list.")
1722
+ geom_features = [
1723
+ ee.Feature(geom).set({'geo_name': str(name)})
1724
+ for geom, name in zip(geometries, geometry_names)
1725
+ ]
1726
+ features = ee.FeatureCollection(geom_features)
1727
+
1728
+ else:
1729
+ raise TypeError("Input list must be a list of (lon, lat) tuples OR a list of ee.Geometry objects.")
1730
+
1731
+ elif isinstance(geometries, tuple) and len(geometries) == 2:
1732
+ name = geometry_names[0] if geometry_names else 'Location_1'
1733
+ features = ee.FeatureCollection([
1734
+ ee.Feature(ee.Geometry.Point(geometries).buffer(buffer_size), {'geo_name': name})
1735
+ ])
1440
1736
  else:
1441
- return accumulated_df.to_csv(f"{file_path}.csv")
1737
+ raise TypeError("Unsupported type for 'geometries'.")
1738
+
1739
+ features = features.map(set_standard_name)
1740
+
1741
+ try:
1742
+ reducer = getattr(ee.Reducer, reducer_type)()
1743
+ except AttributeError:
1744
+ raise ValueError(f"Unknown reducer_type: '{reducer_type}'.")
1745
+
1746
+ def calculate_stats_for_image(image):
1747
+ image_date = image.get('Date_Filter')
1748
+ stats_fc = image.reduceRegions(
1749
+ collection=features, reducer=reducer, scale=scale, tileScale=tileScale
1750
+ )
1751
+ return stats_fc.map(lambda f: f.set('image_date', image_date))
1752
+
1753
+ results_fc = ee.FeatureCollection(img_collection_obj.collection.map(calculate_stats_for_image)).flatten()
1754
+ df = Sentinel1Collection.ee_to_df(results_fc, remove_geom=True)
1755
+
1756
+ # Checking for issues
1757
+ if df.empty:
1758
+ print("No results found for the given parameters. Check if the geometries intersect with the images, if the dates filter is too restrictive, or if the provided bands are empty.")
1759
+ return df
1760
+ if reducer_type not in df.columns:
1761
+ print(f"Warning: Reducer '{reducer_type}' not found in results.")
1762
+ return df
1763
+
1764
+ # Reshape DataFrame to have dates as index and geometry names as columns
1765
+ pivot_df = df.pivot(index='image_date', columns='geo_name', values=reducer_type)
1766
+ pivot_df.index.name = 'Date'
1767
+ if file_path:
1768
+ # Check if file_path ends with .csv and remove it if so for consistency
1769
+ if file_path.endswith('.csv'):
1770
+ file_path = file_path[:-4]
1771
+ pivot_df.to_csv(f"{file_path}.csv")
1772
+ print(f"Zonal stats saved to {file_path}.csv")
1773
+ return
1774
+ return pivot_df