rslearn-0.0.1-py3-none-any.whl → rslearn-0.0.3-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (117)
  1. rslearn/config/__init__.py +2 -2
  2. rslearn/config/dataset.py +164 -98
  3. rslearn/const.py +9 -15
  4. rslearn/data_sources/__init__.py +8 -0
  5. rslearn/data_sources/aws_landsat.py +235 -80
  6. rslearn/data_sources/aws_open_data.py +103 -118
  7. rslearn/data_sources/aws_sentinel1.py +142 -0
  8. rslearn/data_sources/climate_data_store.py +303 -0
  9. rslearn/data_sources/copernicus.py +943 -12
  10. rslearn/data_sources/data_source.py +17 -12
  11. rslearn/data_sources/earthdaily.py +489 -0
  12. rslearn/data_sources/earthdata_srtm.py +300 -0
  13. rslearn/data_sources/gcp_public_data.py +556 -203
  14. rslearn/data_sources/geotiff.py +1 -0
  15. rslearn/data_sources/google_earth_engine.py +454 -115
  16. rslearn/data_sources/local_files.py +153 -103
  17. rslearn/data_sources/openstreetmap.py +33 -39
  18. rslearn/data_sources/planet.py +17 -35
  19. rslearn/data_sources/planet_basemap.py +296 -0
  20. rslearn/data_sources/planetary_computer.py +764 -0
  21. rslearn/data_sources/raster_source.py +11 -297
  22. rslearn/data_sources/usda_cdl.py +206 -0
  23. rslearn/data_sources/usgs_landsat.py +130 -73
  24. rslearn/data_sources/utils.py +256 -61
  25. rslearn/data_sources/vector_source.py +1 -0
  26. rslearn/data_sources/worldcereal.py +456 -0
  27. rslearn/data_sources/worldcover.py +142 -0
  28. rslearn/data_sources/worldpop.py +156 -0
  29. rslearn/data_sources/xyz_tiles.py +141 -79
  30. rslearn/dataset/__init__.py +8 -2
  31. rslearn/dataset/add_windows.py +1 -1
  32. rslearn/dataset/dataset.py +43 -7
  33. rslearn/dataset/index.py +173 -0
  34. rslearn/dataset/manage.py +137 -49
  35. rslearn/dataset/materialize.py +436 -95
  36. rslearn/dataset/window.py +225 -34
  37. rslearn/log_utils.py +24 -0
  38. rslearn/main.py +351 -130
  39. rslearn/models/clip.py +62 -0
  40. rslearn/models/conv.py +56 -0
  41. rslearn/models/croma.py +270 -0
  42. rslearn/models/detr/__init__.py +5 -0
  43. rslearn/models/detr/box_ops.py +103 -0
  44. rslearn/models/detr/detr.py +493 -0
  45. rslearn/models/detr/matcher.py +107 -0
  46. rslearn/models/detr/position_encoding.py +114 -0
  47. rslearn/models/detr/transformer.py +429 -0
  48. rslearn/models/detr/util.py +24 -0
  49. rslearn/models/faster_rcnn.py +10 -19
  50. rslearn/models/fpn.py +1 -1
  51. rslearn/models/module_wrapper.py +91 -0
  52. rslearn/models/moe/distributed.py +262 -0
  53. rslearn/models/moe/soft.py +676 -0
  54. rslearn/models/molmo.py +65 -0
  55. rslearn/models/multitask.py +351 -24
  56. rslearn/models/pick_features.py +15 -2
  57. rslearn/models/pooling_decoder.py +4 -2
  58. rslearn/models/satlaspretrain.py +4 -7
  59. rslearn/models/simple_time_series.py +75 -59
  60. rslearn/models/singletask.py +8 -4
  61. rslearn/models/ssl4eo_s12.py +10 -10
  62. rslearn/models/swin.py +22 -21
  63. rslearn/models/task_embedding.py +250 -0
  64. rslearn/models/terramind.py +219 -0
  65. rslearn/models/trunk.py +280 -0
  66. rslearn/models/unet.py +21 -5
  67. rslearn/models/upsample.py +35 -0
  68. rslearn/models/use_croma.py +508 -0
  69. rslearn/py.typed +0 -0
  70. rslearn/tile_stores/__init__.py +52 -18
  71. rslearn/tile_stores/default.py +382 -0
  72. rslearn/tile_stores/tile_store.py +236 -132
  73. rslearn/train/callbacks/freeze_unfreeze.py +32 -20
  74. rslearn/train/callbacks/gradients.py +109 -0
  75. rslearn/train/callbacks/peft.py +116 -0
  76. rslearn/train/data_module.py +407 -14
  77. rslearn/train/dataset.py +746 -200
  78. rslearn/train/lightning_module.py +164 -54
  79. rslearn/train/optimizer.py +31 -0
  80. rslearn/train/prediction_writer.py +235 -78
  81. rslearn/train/scheduler.py +62 -0
  82. rslearn/train/tasks/classification.py +13 -12
  83. rslearn/train/tasks/detection.py +101 -39
  84. rslearn/train/tasks/multi_task.py +24 -9
  85. rslearn/train/tasks/regression.py +113 -21
  86. rslearn/train/tasks/segmentation.py +353 -35
  87. rslearn/train/tasks/task.py +2 -2
  88. rslearn/train/transforms/__init__.py +1 -1
  89. rslearn/train/transforms/concatenate.py +9 -5
  90. rslearn/train/transforms/crop.py +8 -4
  91. rslearn/train/transforms/flip.py +5 -1
  92. rslearn/train/transforms/normalize.py +34 -10
  93. rslearn/train/transforms/pad.py +1 -1
  94. rslearn/train/transforms/transform.py +75 -73
  95. rslearn/utils/__init__.py +2 -6
  96. rslearn/utils/array.py +2 -2
  97. rslearn/utils/feature.py +2 -2
  98. rslearn/utils/fsspec.py +70 -1
  99. rslearn/utils/geometry.py +214 -7
  100. rslearn/utils/get_utm_ups_crs.py +2 -3
  101. rslearn/utils/grid_index.py +5 -5
  102. rslearn/utils/jsonargparse.py +33 -0
  103. rslearn/utils/mp.py +4 -3
  104. rslearn/utils/raster_format.py +211 -96
  105. rslearn/utils/rtree_index.py +64 -17
  106. rslearn/utils/sqlite_index.py +7 -1
  107. rslearn/utils/vector_format.py +235 -77
  108. {rslearn-0.0.1.dist-info → rslearn-0.0.3.dist-info}/METADATA +366 -284
  109. rslearn-0.0.3.dist-info/RECORD +123 -0
  110. {rslearn-0.0.1.dist-info → rslearn-0.0.3.dist-info}/WHEEL +1 -1
  111. rslearn/tile_stores/file.py +0 -242
  112. rslearn/utils/mgrs.py +0 -24
  113. rslearn/utils/utils.py +0 -22
  114. rslearn-0.0.1.dist-info/RECORD +0 -88
  115. {rslearn-0.0.1.dist-info → rslearn-0.0.3.dist-info}/entry_points.txt +0 -0
  116. {rslearn-0.0.1.dist-info → rslearn-0.0.3.dist-info/licenses}/LICENSE +0 -0
  117. {rslearn-0.0.1.dist-info → rslearn-0.0.3.dist-info}/top_level.txt +0 -0
rslearn/train/tasks/segmentation.py
@@ -12,22 +12,23 @@ from rslearn.utils import Feature
 
 from .task import BasicTask
 
+# TODO: This is duplicated code fix it
 DEFAULT_COLORS = [
-    [255, 0, 0],
-    [0, 255, 0],
-    [0, 0, 255],
-    [255, 255, 0],
-    [0, 255, 255],
-    [255, 0, 255],
-    [0, 128, 0],
-    [255, 160, 122],
-    [139, 69, 19],
-    [128, 128, 128],
-    [255, 255, 255],
-    [143, 188, 143],
-    [95, 158, 160],
-    [255, 200, 0],
-    [128, 0, 0],
+    (255, 0, 0),
+    (0, 255, 0),
+    (0, 0, 255),
+    (255, 255, 0),
+    (0, 255, 255),
+    (255, 0, 255),
+    (0, 128, 0),
+    (255, 160, 122),
+    (139, 69, 19),
+    (128, 128, 128),
+    (255, 255, 255),
+    (143, 188, 143),
+    (95, 158, 160),
+    (255, 200, 0),
+    (128, 0, 0),
 ]
 
 
@@ -39,28 +40,58 @@ class SegmentationTask(BasicTask):
         num_classes: int,
         colors: list[tuple[int, int, int]] = DEFAULT_COLORS,
         zero_is_invalid: bool = False,
+        enable_accuracy_metric: bool = True,
+        enable_miou_metric: bool = False,
+        enable_f1_metric: bool = False,
+        f1_metric_thresholds: list[list[float]] = [[0.5]],
         metric_kwargs: dict[str, Any] = {},
-        **kwargs,
-    ):
+        miou_metric_kwargs: dict[str, Any] = {},
+        prob_scales: list[float] | None = None,
+        other_metrics: dict[str, Metric] = {},
+        **kwargs: Any,
+    ) -> None:
         """Initialize a new SegmentationTask.
 
         Args:
             num_classes: the number of classes to predict
             colors: optional colors for each class
             zero_is_invalid: whether pixels labeled class 0 should be marked invalid
+            enable_accuracy_metric: whether to enable the accuracy metric (default
+                true).
+            enable_f1_metric: whether to enable the F1 metric (default false).
+            enable_miou_metric: whether to enable the mean IoU metric (default false).
+            f1_metric_thresholds: list of list of thresholds to apply for F1 metric.
+                Each inner list is used to initialize a separate F1 metric where the
+                best F1 across the thresholds within the inner list is computed. If
+                there are multiple inner lists, then multiple F1 scores will be
+                reported.
             metric_kwargs: additional arguments to pass to underlying metric, see
                 torchmetrics.classification.MulticlassAccuracy.
+            miou_metric_kwargs: additional arguments to pass to MeanIoUMetric, if
+                enable_miou_metric is passed.
+            prob_scales: during inference, scale the output probabilities by this much
+                before computing the argmax. There is one scale per class. Note that
+                this is only applied during prediction, not when computing val or test
+                metrics.
+            other_metrics: additional metrics to configure on this task.
             kwargs: additional arguments to pass to BasicTask
         """
         super().__init__(**kwargs)
         self.num_classes = num_classes
         self.colors = colors
         self.zero_is_invalid = zero_is_invalid
+        self.enable_accuracy_metric = enable_accuracy_metric
+        self.enable_f1_metric = enable_f1_metric
+        self.enable_miou_metric = enable_miou_metric
+        self.f1_metric_thresholds = f1_metric_thresholds
         self.metric_kwargs = metric_kwargs
+        self.miou_metric_kwargs = miou_metric_kwargs
+        self.prob_scales = prob_scales
+        self.other_metrics = other_metrics
 
     def process_inputs(
         self,
-        raw_inputs: dict[str, torch.Tensor | list[Feature]],
+        raw_inputs: dict[str, torch.Tensor],
         metadata: dict[str, Any],
         load_targets: bool = True,
     ) -> tuple[dict[str, Any], dict[str, Any]]:
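For orientation, a minimal configuration sketch using the expanded signature. The module path follows the file list above; the flag values are illustrative, not defaults from this diff:

    from rslearn.train.tasks.segmentation import SegmentationTask

    # Enable mean IoU and best-threshold F1 alongside the default accuracy metric.
    task = SegmentationTask(
        num_classes=3,
        zero_is_invalid=True,
        enable_miou_metric=True,
        enable_f1_metric=True,
        # One F1 metric that reports the best score across three thresholds.
        f1_metric_thresholds=[[0.3, 0.5, 0.7]],
    )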
@@ -78,6 +109,7 @@ class SegmentationTask(BasicTask):
         if not load_targets:
             return {}, {}
 
+        # TODO: List[Feature] is currently not supported
         assert raw_inputs["targets"].shape[0] == 1
         labels = raw_inputs["targets"][0, :, :].long()
 
@@ -103,7 +135,11 @@ class SegmentationTask(BasicTask):
         Returns:
             either raster or vector data.
         """
-        classes = raw_output.cpu().numpy().argmax(axis=0).astype(np.uint8)
+        raw_output_np = raw_output.cpu().numpy()
+        if self.prob_scales is not None:
+            # Scale the channel dimension by the provided scales.
+            raw_output_np = raw_output_np * np.array(self.prob_scales)[:, None, None]
+        classes = raw_output_np.argmax(axis=0).astype(np.uint8)
         return classes[None, :, :]
 
     def visualize(
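The effect of prob_scales is easiest to see on a toy array; a quick sketch of the same arithmetic in plain NumPy, outside rslearn:

    import numpy as np

    # (C=2, H=1, W=1) softmax output: class 0 wins the unscaled argmax.
    probs = np.array([0.6, 0.4]).reshape(2, 1, 1)
    scales = np.array([1.0, 2.0])  # per-class scales, as in prob_scales
    scaled = probs * scales[:, None, None]  # class 1 becomes 0.8 and now wins
    assert probs.argmax(axis=0)[0, 0] == 0
    assert scaled.argmax(axis=0)[0, 0] == 1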
@@ -123,6 +159,8 @@ class SegmentationTask(BasicTask):
             a dictionary mapping image name to visualization image
         """
         image = super().visualize(input_dict, target_dict, output)["image"]
+        if target_dict is None:
+            raise ValueError("target_dict is required for visualization")
         gt_classes = target_dict["classes"].cpu().numpy()
         pred_classes = output.cpu().numpy().argmax(axis=0)
         gt_vis = np.zeros((gt_classes.shape[0], gt_classes.shape[1], 3), dtype=np.uint8)
@@ -143,11 +181,53 @@ class SegmentationTask(BasicTask):
     def get_metrics(self) -> MetricCollection:
         """Get the metrics for this task."""
         metrics = {}
-        metric_kwargs = dict(num_classes=self.num_classes)
-        metric_kwargs.update(self.metric_kwargs)
-        metrics["accuracy"] = SegmentationMetric(
-            torchmetrics.classification.MulticlassAccuracy(**metric_kwargs)
-        )
+
+        if self.enable_accuracy_metric:
+            accuracy_metric_kwargs = dict(num_classes=self.num_classes)
+            accuracy_metric_kwargs.update(self.metric_kwargs)
+            metrics["accuracy"] = SegmentationMetric(
+                torchmetrics.classification.MulticlassAccuracy(**accuracy_metric_kwargs)
+            )
+
+        if self.enable_f1_metric:
+            for thresholds in self.f1_metric_thresholds:
+                if len(self.f1_metric_thresholds) == 1:
+                    suffix = ""
+                else:
+                    # Metric name can't contain "." so change to ",".
+                    suffix = "_" + str(thresholds[0]).replace(".", ",")
+
+                metrics["F1" + suffix] = SegmentationMetric(
+                    F1Metric(num_classes=self.num_classes, score_thresholds=thresholds)
+                )
+                metrics["precision" + suffix] = SegmentationMetric(
+                    F1Metric(
+                        num_classes=self.num_classes,
+                        score_thresholds=thresholds,
+                        metric_mode="precision",
+                    )
+                )
+                metrics["recall" + suffix] = SegmentationMetric(
+                    F1Metric(
+                        num_classes=self.num_classes,
+                        score_thresholds=thresholds,
+                        metric_mode="recall",
+                    )
+                )
+
+        if self.enable_miou_metric:
+            miou_metric_kwargs: dict[str, Any] = dict(num_classes=self.num_classes)
+            if self.zero_is_invalid:
+                miou_metric_kwargs["zero_is_invalid"] = True
+            miou_metric_kwargs.update(self.miou_metric_kwargs)
+            metrics["mean_iou"] = SegmentationMetric(
+                MeanIoUMetric(**miou_metric_kwargs),
+                pass_probabilities=False,
+            )
+
+        if self.other_metrics:
+            metrics.update(self.other_metrics)
+
         return MetricCollection(metrics)
 
 
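Note that when several threshold lists are configured, each metric name is suffixed with the first threshold of its inner list, with "." changed to "," since metric names cannot contain dots. A quick sketch of the naming rule, mirroring the loop above:

    # With f1_metric_thresholds=[[0.25, 0.5], [0.75]], get_metrics() produces
    # keys "F1_0,25" and "F1_0,75" (plus matching precision_* / recall_* entries).
    for thresholds in [[0.25, 0.5], [0.75]]:
        suffix = "_" + str(thresholds[0]).replace(".", ",")
        print("F1" + suffix)  # F1_0,25 then F1_0,75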
@@ -159,7 +239,7 @@ class SegmentationHead(torch.nn.Module):
         logits: torch.Tensor,
         inputs: list[dict[str, Any]],
         targets: list[dict[str, Any]] | None = None,
-    ):
+    ) -> tuple[torch.Tensor, dict[str, Any]]:
         """Compute the segmentation outputs from logits and targets.
 
         Args:
@@ -172,28 +252,51 @@ class SegmentationHead(torch.nn.Module):
         """
         outputs = torch.nn.functional.softmax(logits, dim=1)
 
-        loss = None
+        losses = {}
         if targets:
             labels = torch.stack([target["classes"] for target in targets], dim=0)
             mask = torch.stack([target["valid"] for target in targets], dim=0)
-            loss = (
-                torch.nn.functional.cross_entropy(logits, labels, reduction="none")
-                * mask
+            per_pixel_loss = torch.nn.functional.cross_entropy(
+                logits, labels, reduction="none"
             )
-            loss = torch.mean(loss)
+            mask_sum = torch.sum(mask)
+            if mask_sum > 0:
+                # Compute average loss over valid pixels.
+                losses["cls"] = torch.sum(per_pixel_loss * mask) / torch.sum(mask)
+            else:
+                # If there are no valid pixels, we avoid dividing by zero and just let
+                # the summed mask loss be zero.
+                losses["cls"] = torch.sum(per_pixel_loss * mask)
 
-        return outputs, {"cls": loss}
+        return outputs, losses
 
 
 class SegmentationMetric(Metric):
     """Metric for segmentation task."""
 
-    def __init__(self, metric: Metric):
-        """Initialize a new SegmentationMetric."""
+    def __init__(
+        self,
+        metric: Metric,
+        pass_probabilities: bool = True,
+        class_idx: int | None = None,
+    ):
+        """Initialize a new SegmentationMetric.
+
+        Args:
+            metric: the metric to wrap. This wrapping class will handle selecting the
+                classes from the targets and masking out invalid pixels.
+            pass_probabilities: whether to pass predicted probabilities to the metric.
+                If False, argmax is applied to pass the predicted classes instead.
+            class_idx: if metric returns value for multiple classes, select this class.
+        """
         super().__init__()
         self.metric = metric
+        self.pass_probablities = pass_probabilities
+        self.class_idx = class_idx
 
-    def update(self, preds: list[Any], targets: list[dict[str, Any]]) -> None:
+    def update(
+        self, preds: list[Any] | torch.Tensor, targets: list[dict[str, Any]]
+    ) -> None:
         """Update metric.
 
         Args:
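The loss change above replaces a plain mean over all pixels (which diluted the loss by however many pixels the mask zeroed out) with an average over valid pixels only, plus a guard for an all-invalid batch. A self-contained sketch of the same computation, with illustrative shapes:

    import torch

    logits = torch.randn(2, 3, 4, 4)         # (N, C, H, W)
    labels = torch.randint(0, 3, (2, 4, 4))  # (N, H, W)
    mask = torch.zeros(2, 4, 4)
    mask[0] = 1.0                            # only the first example has valid pixels

    per_pixel = torch.nn.functional.cross_entropy(logits, labels, reduction="none")
    mask_sum = torch.sum(mask)
    if mask_sum > 0:
        loss = torch.sum(per_pixel * mask) / mask_sum  # mean over valid pixels only
    else:
        loss = torch.sum(per_pixel * mask)             # all-invalid batch: loss is zero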
@@ -213,11 +316,17 @@ class SegmentationMetric(Metric):
         if len(preds) == 0:
             return
 
+        if not self.pass_probablities:
+            preds = preds.argmax(dim=1)
+
         self.metric.update(preds, labels)
 
     def compute(self) -> Any:
         """Returns the computed metric."""
-        return self.metric.compute()
+        result = self.metric.compute()
+        if self.class_idx is not None:
+            result = result[self.class_idx]
+        return result
 
     def reset(self) -> None:
         """Reset metric."""
@@ -227,3 +336,212 @@ class SegmentationMetric(Metric):
     def plot(self, *args: list[Any], **kwargs: dict[str, Any]) -> Any:
         """Returns a plot of the metric."""
         return self.metric.plot(*args, **kwargs)
+
+
+class F1Metric(Metric):
+    """F1 score for segmentation.
+
+    It treats each class as a separate prediction task, and computes the maximum F1
+    score under the different configured thresholds per-class.
+    """
+
+    def __init__(
+        self,
+        num_classes: int,
+        score_thresholds: list[float],
+        metric_mode: str = "f1",
+    ):
+        """Create a new F1Metric.
+
+        Args:
+            num_classes: number of classes.
+            score_thresholds: list of score thresholds to check F1 score for. The final
+                metric is the best F1 across score thresholds.
+            metric_mode: set to "precision" or "recall" to return that instead of F1
+                (default "f1")
+        """
+        super().__init__()
+        self.num_classes = num_classes
+        self.score_thresholds = score_thresholds
+        self.metric_mode = metric_mode
+
+        assert self.metric_mode in ["f1", "precision", "recall"]
+
+        for cls_idx in range(self.num_classes):
+            for thr_idx in range(len(self.score_thresholds)):
+                cur_prefix = self._get_state_prefix(cls_idx, thr_idx)
+                self.add_state(
+                    cur_prefix + "tp", default=torch.tensor(0), dist_reduce_fx="sum"
+                )
+                self.add_state(
+                    cur_prefix + "fp", default=torch.tensor(0), dist_reduce_fx="sum"
+                )
+                self.add_state(
+                    cur_prefix + "fn", default=torch.tensor(0), dist_reduce_fx="sum"
+                )
+
+    def _get_state_prefix(self, cls_idx: int, thr_idx: int) -> str:
+        return f"{cls_idx}_{thr_idx}_"
+
+    def update(self, preds: torch.Tensor, labels: torch.Tensor) -> None:
+        """Update metric.
+
+        Args:
+            preds: the predictions, NxC.
+            labels: the targets, N, with values from 0 to C-1.
+        """
+        for cls_idx in range(self.num_classes):
+            for thr_idx, score_threshold in enumerate(self.score_thresholds):
+                pred_bin = preds[:, cls_idx] > score_threshold
+                gt_bin = labels == cls_idx
+
+                tp = torch.count_nonzero(pred_bin & gt_bin).item()
+                fp = torch.count_nonzero(pred_bin & torch.logical_not(gt_bin)).item()
+                fn = torch.count_nonzero(torch.logical_not(pred_bin) & gt_bin).item()
+
+                cur_prefix = self._get_state_prefix(cls_idx, thr_idx)
+                setattr(self, cur_prefix + "tp", getattr(self, cur_prefix + "tp") + tp)
+                setattr(self, cur_prefix + "fp", getattr(self, cur_prefix + "fp") + fp)
+                setattr(self, cur_prefix + "fn", getattr(self, cur_prefix + "fn") + fn)
+
+    def compute(self) -> Any:
+        """Compute metric.
+
+        Returns:
+            the best F1 score across score thresholds and classes.
+        """
+        best_scores = []
+
+        for cls_idx in range(self.num_classes):
+            best_score = None
+
+            for thr_idx in range(len(self.score_thresholds)):
+                cur_prefix = self._get_state_prefix(cls_idx, thr_idx)
+                tp = getattr(self, cur_prefix + "tp")
+                fp = getattr(self, cur_prefix + "fp")
+                fn = getattr(self, cur_prefix + "fn")
+                device = tp.device
+
+                if tp + fp == 0:
+                    precision = torch.tensor(0, dtype=torch.float32, device=device)
+                else:
+                    precision = tp / (tp + fp)
+
+                if tp + fn == 0:
+                    recall = torch.tensor(0, dtype=torch.float32, device=device)
+                else:
+                    recall = tp / (tp + fn)
+
+                if precision + recall < 0.001:
+                    f1 = torch.tensor(0, dtype=torch.float32, device=device)
+                else:
+                    f1 = 2 * precision * recall / (precision + recall)
+
+                if self.metric_mode == "f1":
+                    score = f1
+                elif self.metric_mode == "precision":
+                    score = precision
+                elif self.metric_mode == "recall":
+                    score = recall
+
+                if best_score is None or score > best_score:
+                    best_score = score
+
+            best_scores.append(best_score)
+
+        return torch.mean(torch.stack(best_scores))
+
+
+class MeanIoUMetric(Metric):
+    """Mean IoU for segmentation.
+
+    This is the mean of the per-class intersection-over-union scores. The per-class
+    intersection is the number of pixels across all examples where the predicted label
+    and ground truth label are both that class, and the per-class union is defined
+    similarly.
+
+    This differs from torchmetrics.segmentation.MeanIoU, where the mean IoU is computed
+    per-image, and averaged across images.
+    """
+
+    def __init__(
+        self,
+        num_classes: int,
+        zero_is_invalid: bool = False,
+        ignore_missing_classes: bool = False,
+        class_idx: int | None = None,
+    ):
+        """Create a new MeanIoUMetric.
+
+        Args:
+            num_classes: the number of classes for the task.
+            zero_is_invalid: whether to ignore class 0 in computing mean IoU.
+            ignore_missing_classes: whether to ignore classes that don't appear in
+                either the predictions or the ground truth. If false, the IoU for a
+                missing class will be 0.
+            class_idx: only compute and return the IoU for this class. This option is
+                provided so the user can get per-class IoU results, since Lightning
+                only supports scalar return values from metrics.
+        """
+        super().__init__()
+        self.num_classes = num_classes
+        self.zero_is_invalid = zero_is_invalid
+        self.ignore_missing_classes = ignore_missing_classes
+        self.class_idx = class_idx
+
+        self.add_state(
+            "intersections", default=torch.zeros(self.num_classes), dist_reduce_fx="sum"
+        )
+        self.add_state(
+            "unions", default=torch.zeros(self.num_classes), dist_reduce_fx="sum"
+        )
+
+    def update(self, preds: torch.Tensor, labels: torch.Tensor) -> None:
+        """Update metric.
+
+        Like torchmetrics.segmentation.MeanIoU with input_format="index", we expect
+        predictions and labels to both be class integers. This is achieved by passing
+        pass_probabilities=False to the SegmentationMetric wrapper.
+
+        Args:
+            preds: the predictions, (N,), with values from 0 to C-1.
+            labels: the targets, (N,), with values from 0 to C-1.
+        """
+        if preds.min() < 0 or preds.max() >= self.num_classes:
+            raise ValueError("predicted class outside of expected range")
+        if labels.min() < 0 or labels.max() >= self.num_classes:
+            raise ValueError("label class outside of expected range")
+
+        new_intersections = torch.zeros(
+            self.num_classes, device=self.intersections.device
+        )
+        new_unions = torch.zeros(self.num_classes, device=self.unions.device)
+        for cls_idx in range(self.num_classes):
+            new_intersections[cls_idx] = (
+                (preds == cls_idx) & (labels == cls_idx)
+            ).sum()
+            new_unions[cls_idx] = ((preds == cls_idx) | (labels == cls_idx)).sum()
+        self.intersections += new_intersections
+        self.unions += new_unions
+
+    def compute(self) -> Any:
+        """Compute metric.
+
+        Returns:
+            the mean IoU across classes.
+        """
+        per_class_scores = []
+
+        for cls_idx in range(self.num_classes):
+            if cls_idx == 0 and self.zero_is_invalid:
+                continue
+
+            intersection = self.intersections[cls_idx]
+            union = self.unions[cls_idx]
+
+            if union == 0 and self.ignore_missing_classes:
+                continue
+
+            per_class_scores.append(intersection / union)
+
+        return torch.mean(torch.stack(per_class_scores))
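To make the dataset-level pooling concrete, a small worked example; the counts below follow the update()/compute() logic above, and the import path is inferred from the file list:

    import torch

    from rslearn.train.tasks.segmentation import MeanIoUMetric

    preds = torch.tensor([0, 0, 1, 1])
    labels = torch.tensor([0, 1, 1, 1])
    # class 0: intersection 1 (pixel 0), union 2 (pixels 0, 1) -> IoU 0.5
    # class 1: intersection 2 (pixels 2, 3), union 3 (pixels 1, 2, 3) -> IoU 2/3
    metric = MeanIoUMetric(num_classes=2)
    metric.update(preds, labels)
    print(metric.compute())  # tensor(0.5833)

Because intersections and unions keep accumulating across update() calls before the division, this is a dataset-level IoU rather than the per-image average computed by torchmetrics.segmentation.MeanIoU.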
rslearn/train/tasks/task.py
@@ -39,7 +39,7 @@ class Task:
 
     def process_output(
         self, raw_output: Any, metadata: dict[str, Any]
-    ) -> npt.NDArray[Any] | list[Feature]:
+    ) -> npt.NDArray[Any] | list[Feature] | dict[str, Any]:
         """Processes an output into raster or vector data.
 
         Args:
@@ -47,7 +47,7 @@ class Task:
             metadata: metadata about the patch being read
 
         Returns:
-            either raster or vector data.
+            raster data, vector data, or multi-task dictionary output.
         """
         raise NotImplementedError
 
rslearn/train/transforms/transform.py
@@ -12,7 +12,7 @@ class Sequential(torch.nn.Module):
     tuple.
     """
 
-    def __init__(self, *args):
+    def __init__(self, *args: Any) -> None:
         """Initialize a new Sequential from a list of transforms."""
         super().__init__()
         self.transforms = torch.nn.ModuleList(args)
rslearn/train/transforms/concatenate.py
@@ -1,8 +1,10 @@
-"""Normalization transforms."""
+"""Concatenate bands across multiple image inputs."""
+
+from typing import Any
 
 import torch
 
-from .transform import Transform
+from .transform import Transform, read_selector, write_selector
 
 
 class Concatenate(Transform):
@@ -24,7 +26,9 @@ class Concatenate(Transform):
         self.selections = selections
         self.output_selector = output_selector
 
-    def forward(self, input_dict, target_dict):
+    def forward(
+        self, input_dict: dict[str, Any], target_dict: dict[str, Any]
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Apply concatenation over the inputs and targets.
 
         Args:
@@ -36,10 +40,10 @@ class Concatenate(Transform):
         """
         images = []
         for selector, wanted_bands in self.selections.items():
-            image = self.read_selector(input_dict, target_dict, selector)
+            image = read_selector(input_dict, target_dict, selector)
             if wanted_bands:
                 image = image[wanted_bands, :, :]
            images.append(image)
         result = torch.concatenate(images, dim=0)
-        self.write_selector(input_dict, target_dict, self.output_selector, result)
+        write_selector(input_dict, target_dict, self.output_selector, result)
         return input_dict, target_dict
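A usage sketch for the transform as it now stands. The input keys and band indices are hypothetical, and the snippet assumes read_selector and write_selector treat plain keys as input_dict entries; an empty band list keeps every band of that input:

    import torch

    from rslearn.train.transforms.concatenate import Concatenate

    input_dict = {
        "sentinel2": torch.randn(13, 64, 64),  # hypothetical 13-band input
        "sentinel1": torch.randn(2, 64, 64),   # hypothetical 2-band input
    }
    target_dict: dict = {}

    concat = Concatenate(
        selections={
            "sentinel2": [2, 1, 0],  # pick three bands, in this order
            "sentinel1": [],         # empty list: keep every band
        },
        output_selector="image",
    )
    input_dict, target_dict = concat(input_dict, target_dict)
    # input_dict["image"] is now a (5, 64, 64) tensor.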
rslearn/train/transforms/crop.py
@@ -5,7 +5,7 @@ from typing import Any
 import torch
 import torchvision
 
-from .transform import Transform
+from .transform import Transform, read_selector
 
 
 class Crop(Transform):
@@ -69,7 +69,7 @@ class Crop(Transform):
             "remove_from_top": remove_from_top,
         }
 
-    def apply_image(self, image: torch.Tensor, state: dict[str, bool]) -> torch.Tensor:
+    def apply_image(self, image: torch.Tensor, state: dict[str, Any]) -> torch.Tensor:
         """Apply the sampled state on the specified image.
 
         Args:
@@ -97,7 +97,9 @@ class Crop(Transform):
         """
         raise NotImplementedError
 
-    def forward(self, input_dict, target_dict):
+    def forward(
+        self, input_dict: dict[str, Any], target_dict: dict[str, Any]
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Apply transform over the inputs and targets.
 
         Args:
@@ -109,13 +111,15 @@ class Crop(Transform):
         """
         smallest_image_shape = None
         for selector in self.image_selectors:
-            image = self.read_selector(input_dict, target_dict, selector)
+            image = read_selector(input_dict, target_dict, selector)
             if (
                 smallest_image_shape is None
                 or image.shape[-1] < smallest_image_shape[1]
             ):
                 smallest_image_shape = image.shape[-2:]
 
+        if smallest_image_shape is None:
+            raise ValueError("No image found to crop")
         state = self.sample_state(smallest_image_shape)
 
         self.apply_fn(
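The new guard turns a silent None into an explicit error. A minimal standalone sketch of the failure mode it catches, using the same shape comparison as the loop above:

    import torch

    images: list[torch.Tensor] = []  # as if no image_selectors matched anything
    smallest_image_shape = None
    for image in images:
        if smallest_image_shape is None or image.shape[-1] < smallest_image_shape[1]:
            smallest_image_shape = image.shape[-2:]
    if smallest_image_shape is None:
        # Previously sample_state(None) would presumably fail later with an
        # opaque error; now the misconfiguration is reported at the source.
        raise ValueError("No image found to crop")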
rslearn/train/transforms/flip.py
@@ -1,5 +1,7 @@
 """Flip transform."""
 
+from typing import Any
+
 import torch
 
 from .transform import Transform
@@ -90,7 +92,9 @@ class Flip(Transform):
         )
         return boxes
 
-    def forward(self, input_dict, target_dict):
+    def forward(
+        self, input_dict: dict[str, Any], target_dict: dict[str, Any]
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Apply transform over the inputs and targets.
 
         Args: