PyPI - rslearn - Versions diffs - 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl - Mend

rslearn 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (166) hide show

rslearn/arg_parser.py +31 -0
rslearn/config/__init__.py +6 -12
rslearn/config/dataset.py +520 -401
rslearn/const.py +9 -15
rslearn/data_sources/__init__.py +8 -23
rslearn/data_sources/aws_landsat.py +242 -98
rslearn/data_sources/aws_open_data.py +111 -151
rslearn/data_sources/aws_sentinel1.py +131 -0
rslearn/data_sources/climate_data_store.py +471 -0
rslearn/data_sources/copernicus.py +884 -12
rslearn/data_sources/data_source.py +43 -12
rslearn/data_sources/earthdaily.py +484 -0
rslearn/data_sources/earthdata_srtm.py +282 -0
rslearn/data_sources/eurocrops.py +242 -0
rslearn/data_sources/gcp_public_data.py +578 -222
rslearn/data_sources/google_earth_engine.py +461 -135
rslearn/data_sources/local_files.py +219 -150
rslearn/data_sources/openstreetmap.py +51 -89
rslearn/data_sources/planet.py +24 -60
rslearn/data_sources/planet_basemap.py +275 -0
rslearn/data_sources/planetary_computer.py +798 -0
rslearn/data_sources/usda_cdl.py +195 -0
rslearn/data_sources/usgs_landsat.py +115 -83
rslearn/data_sources/utils.py +249 -61
rslearn/data_sources/vector_source.py +1 -0
rslearn/data_sources/worldcereal.py +449 -0
rslearn/data_sources/worldcover.py +144 -0
rslearn/data_sources/worldpop.py +153 -0
rslearn/data_sources/xyz_tiles.py +150 -107
rslearn/dataset/__init__.py +8 -2
rslearn/dataset/add_windows.py +2 -2
rslearn/dataset/dataset.py +40 -51
rslearn/dataset/handler_summaries.py +131 -0
rslearn/dataset/manage.py +313 -74
rslearn/dataset/materialize.py +431 -107
rslearn/dataset/remap.py +29 -4
rslearn/dataset/storage/__init__.py +1 -0
rslearn/dataset/storage/file.py +202 -0
rslearn/dataset/storage/storage.py +140 -0
rslearn/dataset/window.py +181 -44
rslearn/lightning_cli.py +454 -0
rslearn/log_utils.py +24 -0
rslearn/main.py +384 -181
rslearn/models/anysat.py +215 -0
rslearn/models/attention_pooling.py +177 -0
rslearn/models/clay/clay.py +231 -0
rslearn/models/clay/configs/metadata.yaml +295 -0
rslearn/models/clip.py +68 -0
rslearn/models/component.py +111 -0
rslearn/models/concatenate_features.py +103 -0
rslearn/models/conv.py +63 -0
rslearn/models/croma.py +306 -0
rslearn/models/detr/__init__.py +5 -0
rslearn/models/detr/box_ops.py +103 -0
rslearn/models/detr/detr.py +504 -0
rslearn/models/detr/matcher.py +107 -0
rslearn/models/detr/position_encoding.py +114 -0
rslearn/models/detr/transformer.py +429 -0
rslearn/models/detr/util.py +24 -0
rslearn/models/dinov3.py +177 -0
rslearn/models/faster_rcnn.py +30 -28
rslearn/models/feature_center_crop.py +53 -0
rslearn/models/fpn.py +19 -8
rslearn/models/galileo/__init__.py +5 -0
rslearn/models/galileo/galileo.py +595 -0
rslearn/models/galileo/single_file_galileo.py +1678 -0
rslearn/models/module_wrapper.py +65 -0
rslearn/models/molmo.py +69 -0
rslearn/models/multitask.py +384 -28
rslearn/models/olmoearth_pretrain/__init__.py +1 -0
rslearn/models/olmoearth_pretrain/model.py +421 -0
rslearn/models/olmoearth_pretrain/norm.py +86 -0
rslearn/models/panopticon.py +170 -0
rslearn/models/panopticon_data/sensors/drone.yaml +32 -0
rslearn/models/panopticon_data/sensors/enmap.yaml +904 -0
rslearn/models/panopticon_data/sensors/goes.yaml +9 -0
rslearn/models/panopticon_data/sensors/himawari.yaml +9 -0
rslearn/models/panopticon_data/sensors/intuition.yaml +606 -0
rslearn/models/panopticon_data/sensors/landsat8.yaml +84 -0
rslearn/models/panopticon_data/sensors/modis_terra.yaml +99 -0
rslearn/models/panopticon_data/sensors/qb2_ge1.yaml +34 -0
rslearn/models/panopticon_data/sensors/sentinel1.yaml +85 -0
rslearn/models/panopticon_data/sensors/sentinel2.yaml +97 -0
rslearn/models/panopticon_data/sensors/superdove.yaml +60 -0
rslearn/models/panopticon_data/sensors/wv23.yaml +63 -0
rslearn/models/pick_features.py +17 -10
rslearn/models/pooling_decoder.py +60 -7
rslearn/models/presto/__init__.py +5 -0
rslearn/models/presto/presto.py +297 -0
rslearn/models/presto/single_file_presto.py +926 -0
rslearn/models/prithvi.py +1147 -0
rslearn/models/resize_features.py +59 -0
rslearn/models/sam2_enc.py +13 -9
rslearn/models/satlaspretrain.py +38 -18
rslearn/models/simple_time_series.py +188 -77
rslearn/models/singletask.py +24 -13
rslearn/models/ssl4eo_s12.py +40 -30
rslearn/models/swin.py +44 -32
rslearn/models/task_embedding.py +250 -0
rslearn/models/terramind.py +256 -0
rslearn/models/trunk.py +139 -0
rslearn/models/unet.py +68 -22
rslearn/models/upsample.py +48 -0
rslearn/models/use_croma.py +508 -0
rslearn/template_params.py +26 -0
rslearn/tile_stores/__init__.py +41 -18
rslearn/tile_stores/default.py +409 -0
rslearn/tile_stores/tile_store.py +236 -132
rslearn/train/all_patches_dataset.py +530 -0
rslearn/train/callbacks/adapters.py +53 -0
rslearn/train/callbacks/freeze_unfreeze.py +348 -17
rslearn/train/callbacks/gradients.py +129 -0
rslearn/train/callbacks/peft.py +116 -0
rslearn/train/data_module.py +444 -20
rslearn/train/dataset.py +588 -235
rslearn/train/lightning_module.py +192 -62
rslearn/train/model_context.py +88 -0
rslearn/train/optimizer.py +31 -0
rslearn/train/prediction_writer.py +319 -84
rslearn/train/scheduler.py +92 -0
rslearn/train/tasks/classification.py +55 -28
rslearn/train/tasks/detection.py +132 -76
rslearn/train/tasks/embedding.py +120 -0
rslearn/train/tasks/multi_task.py +28 -14
rslearn/train/tasks/per_pixel_regression.py +291 -0
rslearn/train/tasks/regression.py +161 -44
rslearn/train/tasks/segmentation.py +428 -53
rslearn/train/tasks/task.py +6 -5
rslearn/train/transforms/__init__.py +1 -1
rslearn/train/transforms/concatenate.py +54 -10
rslearn/train/transforms/crop.py +29 -11
rslearn/train/transforms/flip.py +18 -6
rslearn/train/transforms/mask.py +78 -0
rslearn/train/transforms/normalize.py +101 -17
rslearn/train/transforms/pad.py +19 -7
rslearn/train/transforms/resize.py +83 -0
rslearn/train/transforms/select_bands.py +76 -0
rslearn/train/transforms/sentinel1.py +75 -0
rslearn/train/transforms/transform.py +89 -70
rslearn/utils/__init__.py +2 -6
rslearn/utils/array.py +8 -6
rslearn/utils/feature.py +2 -2
rslearn/utils/fsspec.py +90 -1
rslearn/utils/geometry.py +347 -7
rslearn/utils/get_utm_ups_crs.py +2 -3
rslearn/utils/grid_index.py +5 -5
rslearn/utils/jsonargparse.py +178 -0
rslearn/utils/mp.py +4 -3
rslearn/utils/raster_format.py +268 -116
rslearn/utils/rtree_index.py +64 -17
rslearn/utils/sqlite_index.py +7 -1
rslearn/utils/vector_format.py +252 -97
{rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/METADATA +532 -283
rslearn-0.0.21.dist-info/RECORD +167 -0
{rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/WHEEL +1 -1
rslearn-0.0.21.dist-info/licenses/NOTICE +115 -0
rslearn/data_sources/raster_source.py +0 -309
rslearn/models/registry.py +0 -5
rslearn/tile_stores/file.py +0 -242
rslearn/utils/mgrs.py +0 -24
rslearn/utils/utils.py +0 -22
rslearn-0.0.1.dist-info/RECORD +0 -88
/rslearn/{data_sources/geotiff.py → py.typed} +0 -0
{rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/entry_points.txt +0 -0
{rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info/licenses}/LICENSE +0 -0
{rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/top_level.txt +0 -0

rslearn/train/tasks/regression.py CHANGED Viewed

@@ -1,15 +1,24 @@
-"""Classification task."""
+"""Regression task."""
-from typing import Any
+from typing import Any, Literal
 import numpy as np
 import numpy.typing as npt
+import shapely
 import torch
 import torchmetrics
 from PIL import Image, ImageDraw
 from torchmetrics import Metric, MetricCollection
-from rslearn.utils import Feature
+from rslearn.models.component import FeatureVector, Predictor
+from rslearn.train.model_context import (
+    ModelContext,
+    ModelOutput,
+    RasterImage,
+    SampleMetadata,
+)
+from rslearn.utils.feature import Feature
+from rslearn.utils.geometry import STGeometry
 from .task import BasicTask
@@ -20,23 +29,29 @@ class RegressionTask(BasicTask):
     def __init__(
         self,
         property_name: str,
-        filters: list[tuple[str, str]] | None,
+        filters: list[tuple[str, str]] | None = None,
         allow_invalid: bool = False,
         scale_factor: float = 1,
-        metric_mode: str = "mse",
-        **kwargs,
-    ):
+        metric_mode: Literal["mse", "l1"] = "mse",
+        use_accuracy_metric: bool = False,
+        within_factor: float = 0.1,
+        **kwargs: Any,
+    ) -> None:
         """Initialize a new RegressionTask.
         Args:
-            property_name: the property from which to extract the regression value. The
-                value is read from the first matching feature.
+            property_name: the property from which to extract the ground truth
+                regression value. The value is read from the first matching feature.
             filters: optional list of (property_name, property_value) to only consider
                 features with matching properties.
             allow_invalid: instead of throwing error when no regression label is found
                 at a window, simply mark the example invalid for this task
-            scale_factor: multiply the label value by this factor
-            metric_mode: what metric to use, either mse or l1
+            scale_factor: multiply the label value by this factor for training
+            metric_mode: what metric to use, either "mse" (default) or "l1"
+            use_accuracy_metric: include metric that reports percentage of
+                examples where output is within a factor of the ground truth.
+            within_factor: the factor for accuracy metric. If it's 0.2, and ground
+                truth is 5.0, then values from 5.0*0.8 to 5.0*1.2 are accepted.
             kwargs: other arguments to pass to BasicTask
         """
         super().__init__(**kwargs)
@@ -45,14 +60,16 @@ class RegressionTask(BasicTask):
         self.allow_invalid = allow_invalid
         self.scale_factor = scale_factor
         self.metric_mode = metric_mode
+        self.use_accuracy_metric = use_accuracy_metric
+        self.within_factor = within_factor
         if not self.filters:
             self.filters = []
     def process_inputs(
         self,
-        raw_inputs: dict[str, torch.Tensor | list[Feature]],
-        metadata: dict[str, Any],
+        raw_inputs: dict[str, RasterImage | list[Feature]],
+        metadata: SampleMetadata,
         load_targets: bool = True,
     ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Processes the data into targets.
@@ -70,7 +87,10 @@ class RegressionTask(BasicTask):
             return {}, {}
         data = raw_inputs["targets"]
+        assert isinstance(data, list)
         for feat in data:
+            if feat.properties is None or self.filters is None:
+                continue
             for property_name, property_value in self.filters:
                 if feat.properties.get(property_name) != property_value:
                     continue
@@ -90,6 +110,35 @@ class RegressionTask(BasicTask):
             "valid": torch.tensor(0, dtype=torch.float32),
         }
+    def process_output(
+        self, raw_output: Any, metadata: SampleMetadata
+    ) -> list[Feature]:
+        """Processes an output into raster or vector data.
+        Args:
+            raw_output: the output from prediction head, which must be a scalar tensor.
+            metadata: metadata about the patch being read
+        Returns:
+            a list with a single Feature corresponding to the patch extent and with a
+                property containing the predicted value.
+        """
+        if not isinstance(raw_output, torch.Tensor) or len(raw_output.shape) != 0:
+            raise ValueError("output for RegressionTask must be a scalar Tensor")
+        output = raw_output.item() / self.scale_factor
+        feature = Feature(
+            STGeometry(
+                metadata.projection,
+                shapely.Point(metadata.patch_bounds[0], metadata.patch_bounds[1]),
+                None,
+            ),
+            {
+                self.property_name: output,
+            },
+        )
+        return [feature]
     def visualize(
         self,
         input_dict: dict[str, Any],
@@ -109,6 +158,8 @@ class RegressionTask(BasicTask):
         image = super().visualize(input_dict, target_dict, output)["image"]
         image = Image.fromarray(image)
         draw = ImageDraw.Draw(image)
+        if target_dict is None:
+            raise ValueError("target_dict is required for visualization")
         target = target_dict["value"] / self.scale_factor
         output = output / self.scale_factor
         text = f"Label: {target:.2f}\nOutput: {output:.2f}"
@@ -121,27 +172,36 @@ class RegressionTask(BasicTask):
     def get_metrics(self) -> MetricCollection:
         """Get the metrics for this task."""
+        metric_dict: dict[str, Metric] = {}
         if self.metric_mode == "mse":
-            metric = torchmetrics.MeanSquaredError()
+            metric_dict["mse"] = RegressionMetricWrapper(
+                metric=torchmetrics.MeanSquaredError(), scale_factor=self.scale_factor
+            )
         elif self.metric_mode == "l1":
-            metric = torchmetrics.MeanAbsoluteError()
-        return MetricCollection(
-            {
-                self.metric_mode: RegressionMetricWrapper(
-                    metric=metric, scale_factor=self.scale_factor
-                )
-            }
-        )
+            metric_dict["l1"] = RegressionMetricWrapper(
+                metric=torchmetrics.MeanAbsoluteError(), scale_factor=self.scale_factor
+            )
+        if self.use_accuracy_metric:
+            metric_dict["accuracy"] = RegressionMetricWrapper(
+                metric=RegressionAccuracy(self.within_factor),
+                scale_factor=self.scale_factor,
+            )
-class RegressionHead(torch.nn.Module):
+        return MetricCollection(metric_dict)
+class RegressionHead(Predictor):
     """Head for regression task."""
-    def __init__(self, loss_mode: str = "mse", use_sigmoid: bool = False):
+    def __init__(
+        self, loss_mode: Literal["mse", "l1"] = "mse", use_sigmoid: bool = False
+    ):
         """Initialize a new RegressionHead.
         Args:
-            loss_mode: the loss function to use, either "mse" or "l1".
+            loss_mode: the loss function to use, either "mse" (default) or "l1".
             use_sigmoid: whether to apply a sigmoid activation on the output. This
                 requires targets to be between 0-1.
         """
@@ -151,48 +211,59 @@ class RegressionHead(torch.nn.Module):
     def forward(
         self,
-        logits: torch.Tensor,
-        inputs: list[dict[str, Any]],
+        intermediates: Any,
+        context: ModelContext,
         targets: list[dict[str, Any]] | None = None,
-    ):
+    ) -> ModelOutput:
         """Compute the regression outputs and loss from logits and targets.
         Args:
-            logits: tensor that is (BatchSize, 1) or (BatchSize) in shape.
-            inputs: original inputs (ignored).
-            targets: should contain target key that stores the regression label.
+            intermediates: output from previous model component, which must be a
+                FeatureVector with channel dimension size 1 (Bx1).
+            context: the model context.
+            targets: target dicts, which each must contain a "value" key containing the
+                regression label, along with a "valid" key containing a flag indicating
+                whether each example is valid for this task.
         Returns:
-            tuple of outputs and loss dict
+            the model outputs. The output is a B tensor so that it is split up into a
+                scalar for each example.
         """
-        assert len(logits.shape) in [1, 2]
-        if len(logits.shape) == 2:
-            assert logits.shape[1] == 1
-            logits = logits[:, 0]
+        if not isinstance(intermediates, FeatureVector):
+            raise ValueError("the input to RegressionHead must be a FeatureVector")
+        if intermediates.feature_vector.shape[1] != 1:
+            raise ValueError(
+                f"the input to RegressionHead must have channel dimension size 1, but got shape {intermediates.feature_vector.shape}"
+            )
+        logits = intermediates.feature_vector[:, 0]
         if self.use_sigmoid:
             outputs = torch.nn.functional.sigmoid(logits)
         else:
             outputs = logits
-        loss = None
+        losses = {}
         if targets:
             labels = torch.stack([target["value"] for target in targets])
             mask = torch.stack([target["valid"] for target in targets])
             if self.loss_mode == "mse":
-                loss = torch.mean(torch.square(outputs - labels) * mask)
+                losses["regress"] = torch.mean(torch.square(outputs - labels) * mask)
             elif self.loss_mode == "l1":
-                loss = torch.mean(torch.abs(outputs - labels) * mask)
+                losses["regress"] = torch.mean(torch.abs(outputs - labels) * mask)
             else:
-                assert False
+                raise ValueError(f"unknown loss mode {self.loss_mode}")
-        return outputs, {"regress": loss}
+        return ModelOutput(
+            outputs=outputs,
+            loss_dict=losses,
+        )
 class RegressionMetricWrapper(Metric):
     """Metric for regression task."""
-    def __init__(self, metric: Metric, scale_factor: float, **kwargs):
+    def __init__(self, metric: Metric, scale_factor: float, **kwargs: Any) -> None:
         """Initialize a new RegressionMetricWrapper.
         Args:
@@ -206,14 +277,17 @@ class RegressionMetricWrapper(Metric):
         self.metric = metric
         self.scale_factor = scale_factor
-    def update(self, preds: list[Any], targets: list[dict[str, Any]]) -> None:
+    def update(
+        self, preds: list[Any] | torch.Tensor, targets: list[dict[str, Any]]
+    ) -> None:
         """Update metric.
         Args:
             preds: the predictions
             targets: the targets
         """
-        preds = torch.stack(preds)
+        if not isinstance(preds, torch.Tensor):
+            preds = torch.stack(preds)
         labels = torch.stack([target["value"] for target in targets])
         # Sub-select the valid labels.
@@ -237,3 +311,46 @@ class RegressionMetricWrapper(Metric):
     def plot(self, *args: list[Any], **kwargs: dict[str, Any]) -> Any:
         """Returns a plot of the metric."""
         return self.metric.plot(*args, **kwargs)
+class RegressionAccuracy(Metric):
+    """Percentage of examples with estimate within some factor of ground truth."""
+    def __init__(self, factor: float) -> None:
+        """Initialize a new RegressionAccuracy.
+        Args:
+            factor: the factor so if estimate is within this much of ground truth then
+                it is marked correct.
+        """
+        super().__init__()
+        self.factor = factor
+        self.correct = 0
+        self.total = 0
+    def update(self, preds: torch.Tensor, labels: torch.Tensor) -> None:
+        """Update metric.
+        Args:
+            preds: the predictions
+            labels: the ground truth data
+        """
+        decisions = (preds >= labels * (1 - self.factor)) & (
+            preds <= labels * (1 + self.factor)
+        )
+        self.correct += torch.count_nonzero(decisions)
+        self.total += len(decisions)
+    def compute(self) -> Any:
+        """Returns the computed metric."""
+        return torch.tensor(self.correct / self.total)
+    def reset(self) -> None:
+        """Reset metric."""
+        super().reset()
+        self.correct = 0
+        self.total = 0
+    def plot(self, *args: list[Any], **kwargs: dict[str, Any]) -> Any:
+        """Returns a plot of the metric."""
+        return None

rslearn 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl

rslearn 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl