rslearn 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (166)
  1. rslearn/arg_parser.py +31 -0
  2. rslearn/config/__init__.py +6 -12
  3. rslearn/config/dataset.py +520 -401
  4. rslearn/const.py +9 -15
  5. rslearn/data_sources/__init__.py +8 -23
  6. rslearn/data_sources/aws_landsat.py +242 -98
  7. rslearn/data_sources/aws_open_data.py +111 -151
  8. rslearn/data_sources/aws_sentinel1.py +131 -0
  9. rslearn/data_sources/climate_data_store.py +471 -0
  10. rslearn/data_sources/copernicus.py +884 -12
  11. rslearn/data_sources/data_source.py +43 -12
  12. rslearn/data_sources/earthdaily.py +484 -0
  13. rslearn/data_sources/earthdata_srtm.py +282 -0
  14. rslearn/data_sources/eurocrops.py +242 -0
  15. rslearn/data_sources/gcp_public_data.py +578 -222
  16. rslearn/data_sources/google_earth_engine.py +461 -135
  17. rslearn/data_sources/local_files.py +219 -150
  18. rslearn/data_sources/openstreetmap.py +51 -89
  19. rslearn/data_sources/planet.py +24 -60
  20. rslearn/data_sources/planet_basemap.py +275 -0
  21. rslearn/data_sources/planetary_computer.py +798 -0
  22. rslearn/data_sources/usda_cdl.py +195 -0
  23. rslearn/data_sources/usgs_landsat.py +115 -83
  24. rslearn/data_sources/utils.py +249 -61
  25. rslearn/data_sources/vector_source.py +1 -0
  26. rslearn/data_sources/worldcereal.py +449 -0
  27. rslearn/data_sources/worldcover.py +144 -0
  28. rslearn/data_sources/worldpop.py +153 -0
  29. rslearn/data_sources/xyz_tiles.py +150 -107
  30. rslearn/dataset/__init__.py +8 -2
  31. rslearn/dataset/add_windows.py +2 -2
  32. rslearn/dataset/dataset.py +40 -51
  33. rslearn/dataset/handler_summaries.py +131 -0
  34. rslearn/dataset/manage.py +313 -74
  35. rslearn/dataset/materialize.py +431 -107
  36. rslearn/dataset/remap.py +29 -4
  37. rslearn/dataset/storage/__init__.py +1 -0
  38. rslearn/dataset/storage/file.py +202 -0
  39. rslearn/dataset/storage/storage.py +140 -0
  40. rslearn/dataset/window.py +181 -44
  41. rslearn/lightning_cli.py +454 -0
  42. rslearn/log_utils.py +24 -0
  43. rslearn/main.py +384 -181
  44. rslearn/models/anysat.py +215 -0
  45. rslearn/models/attention_pooling.py +177 -0
  46. rslearn/models/clay/clay.py +231 -0
  47. rslearn/models/clay/configs/metadata.yaml +295 -0
  48. rslearn/models/clip.py +68 -0
  49. rslearn/models/component.py +111 -0
  50. rslearn/models/concatenate_features.py +103 -0
  51. rslearn/models/conv.py +63 -0
  52. rslearn/models/croma.py +306 -0
  53. rslearn/models/detr/__init__.py +5 -0
  54. rslearn/models/detr/box_ops.py +103 -0
  55. rslearn/models/detr/detr.py +504 -0
  56. rslearn/models/detr/matcher.py +107 -0
  57. rslearn/models/detr/position_encoding.py +114 -0
  58. rslearn/models/detr/transformer.py +429 -0
  59. rslearn/models/detr/util.py +24 -0
  60. rslearn/models/dinov3.py +177 -0
  61. rslearn/models/faster_rcnn.py +30 -28
  62. rslearn/models/feature_center_crop.py +53 -0
  63. rslearn/models/fpn.py +19 -8
  64. rslearn/models/galileo/__init__.py +5 -0
  65. rslearn/models/galileo/galileo.py +595 -0
  66. rslearn/models/galileo/single_file_galileo.py +1678 -0
  67. rslearn/models/module_wrapper.py +65 -0
  68. rslearn/models/molmo.py +69 -0
  69. rslearn/models/multitask.py +384 -28
  70. rslearn/models/olmoearth_pretrain/__init__.py +1 -0
  71. rslearn/models/olmoearth_pretrain/model.py +421 -0
  72. rslearn/models/olmoearth_pretrain/norm.py +86 -0
  73. rslearn/models/panopticon.py +170 -0
  74. rslearn/models/panopticon_data/sensors/drone.yaml +32 -0
  75. rslearn/models/panopticon_data/sensors/enmap.yaml +904 -0
  76. rslearn/models/panopticon_data/sensors/goes.yaml +9 -0
  77. rslearn/models/panopticon_data/sensors/himawari.yaml +9 -0
  78. rslearn/models/panopticon_data/sensors/intuition.yaml +606 -0
  79. rslearn/models/panopticon_data/sensors/landsat8.yaml +84 -0
  80. rslearn/models/panopticon_data/sensors/modis_terra.yaml +99 -0
  81. rslearn/models/panopticon_data/sensors/qb2_ge1.yaml +34 -0
  82. rslearn/models/panopticon_data/sensors/sentinel1.yaml +85 -0
  83. rslearn/models/panopticon_data/sensors/sentinel2.yaml +97 -0
  84. rslearn/models/panopticon_data/sensors/superdove.yaml +60 -0
  85. rslearn/models/panopticon_data/sensors/wv23.yaml +63 -0
  86. rslearn/models/pick_features.py +17 -10
  87. rslearn/models/pooling_decoder.py +60 -7
  88. rslearn/models/presto/__init__.py +5 -0
  89. rslearn/models/presto/presto.py +297 -0
  90. rslearn/models/presto/single_file_presto.py +926 -0
  91. rslearn/models/prithvi.py +1147 -0
  92. rslearn/models/resize_features.py +59 -0
  93. rslearn/models/sam2_enc.py +13 -9
  94. rslearn/models/satlaspretrain.py +38 -18
  95. rslearn/models/simple_time_series.py +188 -77
  96. rslearn/models/singletask.py +24 -13
  97. rslearn/models/ssl4eo_s12.py +40 -30
  98. rslearn/models/swin.py +44 -32
  99. rslearn/models/task_embedding.py +250 -0
  100. rslearn/models/terramind.py +256 -0
  101. rslearn/models/trunk.py +139 -0
  102. rslearn/models/unet.py +68 -22
  103. rslearn/models/upsample.py +48 -0
  104. rslearn/models/use_croma.py +508 -0
  105. rslearn/template_params.py +26 -0
  106. rslearn/tile_stores/__init__.py +41 -18
  107. rslearn/tile_stores/default.py +409 -0
  108. rslearn/tile_stores/tile_store.py +236 -132
  109. rslearn/train/all_patches_dataset.py +530 -0
  110. rslearn/train/callbacks/adapters.py +53 -0
  111. rslearn/train/callbacks/freeze_unfreeze.py +348 -17
  112. rslearn/train/callbacks/gradients.py +129 -0
  113. rslearn/train/callbacks/peft.py +116 -0
  114. rslearn/train/data_module.py +444 -20
  115. rslearn/train/dataset.py +588 -235
  116. rslearn/train/lightning_module.py +192 -62
  117. rslearn/train/model_context.py +88 -0
  118. rslearn/train/optimizer.py +31 -0
  119. rslearn/train/prediction_writer.py +319 -84
  120. rslearn/train/scheduler.py +92 -0
  121. rslearn/train/tasks/classification.py +55 -28
  122. rslearn/train/tasks/detection.py +132 -76
  123. rslearn/train/tasks/embedding.py +120 -0
  124. rslearn/train/tasks/multi_task.py +28 -14
  125. rslearn/train/tasks/per_pixel_regression.py +291 -0
  126. rslearn/train/tasks/regression.py +161 -44
  127. rslearn/train/tasks/segmentation.py +428 -53
  128. rslearn/train/tasks/task.py +6 -5
  129. rslearn/train/transforms/__init__.py +1 -1
  130. rslearn/train/transforms/concatenate.py +54 -10
  131. rslearn/train/transforms/crop.py +29 -11
  132. rslearn/train/transforms/flip.py +18 -6
  133. rslearn/train/transforms/mask.py +78 -0
  134. rslearn/train/transforms/normalize.py +101 -17
  135. rslearn/train/transforms/pad.py +19 -7
  136. rslearn/train/transforms/resize.py +83 -0
  137. rslearn/train/transforms/select_bands.py +76 -0
  138. rslearn/train/transforms/sentinel1.py +75 -0
  139. rslearn/train/transforms/transform.py +89 -70
  140. rslearn/utils/__init__.py +2 -6
  141. rslearn/utils/array.py +8 -6
  142. rslearn/utils/feature.py +2 -2
  143. rslearn/utils/fsspec.py +90 -1
  144. rslearn/utils/geometry.py +347 -7
  145. rslearn/utils/get_utm_ups_crs.py +2 -3
  146. rslearn/utils/grid_index.py +5 -5
  147. rslearn/utils/jsonargparse.py +178 -0
  148. rslearn/utils/mp.py +4 -3
  149. rslearn/utils/raster_format.py +268 -116
  150. rslearn/utils/rtree_index.py +64 -17
  151. rslearn/utils/sqlite_index.py +7 -1
  152. rslearn/utils/vector_format.py +252 -97
  153. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/METADATA +532 -283
  154. rslearn-0.0.21.dist-info/RECORD +167 -0
  155. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/WHEEL +1 -1
  156. rslearn-0.0.21.dist-info/licenses/NOTICE +115 -0
  157. rslearn/data_sources/raster_source.py +0 -309
  158. rslearn/models/registry.py +0 -5
  159. rslearn/tile_stores/file.py +0 -242
  160. rslearn/utils/mgrs.py +0 -24
  161. rslearn/utils/utils.py +0 -22
  162. rslearn-0.0.1.dist-info/RECORD +0 -88
  163. /rslearn/{data_sources/geotiff.py → py.typed} +0 -0
  164. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/entry_points.txt +0 -0
  165. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info/licenses}/LICENSE +0 -0
  166. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/top_level.txt +0 -0
rslearn/train/tasks/classification.py +55 -28

@@ -15,6 +15,13 @@ from torchmetrics.classification import (
     MulticlassRecall,
 )
 
+from rslearn.models.component import FeatureVector, Predictor
+from rslearn.train.model_context import (
+    ModelContext,
+    ModelOutput,
+    RasterImage,
+    SampleMetadata,
+)
 from rslearn.utils import Feature, STGeometry
 
 from .task import BasicTask
@@ -27,7 +34,7 @@ class ClassificationTask(BasicTask):
         self,
         property_name: str,
         classes: list[str],
-        filters: list[tuple[str, str]] | None = None,
+        filters: list[tuple[str, str]] = [],
         read_class_id: bool = False,
         allow_invalid: bool = False,
         skip_unknown_categories: bool = False,
@@ -37,7 +44,7 @@
         f1_metric_kwargs: dict[str, Any] = {},
         positive_class: str | None = None,
         positive_class_threshold: float = 0.5,
-        **kwargs,
+        **kwargs: Any,
     ):
         """Initialize a new ClassificationTask.
 
@@ -49,8 +56,8 @@
                 features with matching properties.
             read_class_id: whether to read an integer class ID instead of the class
                 name.
-            allow_invalid: instead of throwing error when no regression label is found
-                at a window, simply mark the example invalid for this task
+            allow_invalid: instead of throwing error when no classification label is
+                found at a window, simply mark the example invalid for this task
             skip_unknown_categories: whether to skip examples with categories that are
                 not passed via classes, instead of throwing error
             prob_property: when predicting, write probabilities in addition to class ID
@@ -95,13 +102,10 @@
         else:
             self.positive_class_id = self.classes.index(self.positive_class)
 
-        if not self.filters:
-            self.filters = []
-
     def process_inputs(
         self,
-        raw_inputs: dict[str, torch.Tensor | list[Feature]],
-        metadata: dict[str, Any],
+        raw_inputs: dict[str, RasterImage | list[Feature]],
+        metadata: SampleMetadata,
         load_targets: bool = True,
     ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Processes the data into targets.
@@ -119,7 +123,10 @@
             return {}, {}
 
         data = raw_inputs["targets"]
+        assert isinstance(data, list)
         for feat in data:
+            if feat.properties is None:
+                continue
             for property_name, property_value in self.filters:
                 if feat.properties.get(property_name) != property_value:
                     continue
@@ -155,17 +162,25 @@
         }
 
     def process_output(
-        self, raw_output: Any, metadata: dict[str, Any]
-    ) -> npt.NDArray[Any] | list[Feature]:
+        self, raw_output: Any, metadata: SampleMetadata
+    ) -> list[Feature]:
         """Processes an output into raster or vector data.
 
         Args:
-            raw_output: the output from prediction head.
+            raw_output: the output from prediction head, which must be a tensor
+                containing output probabilities (one dimension).
             metadata: metadata about the patch being read
 
         Returns:
-            either raster or vector data.
+            a list with one Feature corresponding to the input patch extent with a
+                property name containing the predicted class. It will have another
+                property containing the probabilities if prob_property was set.
         """
+        if not isinstance(raw_output, torch.Tensor) or len(raw_output.shape) != 1:
+            raise ValueError(
+                "expected output for ClassificationTask to be a Tensor with one dimension"
+            )
+
         probs = raw_output.cpu().numpy()
         if len(self.classes) == 2 and self.positive_class_threshold != 0.5:
             positive_class_prob = probs[self.positive_class_id]
@@ -175,24 +190,25 @@
                 class_idx = 1 - self.positive_class_id
         else:
             # For multiclass classification or when using the default threshold
-            class_idx = probs.argmax()
+            class_idx = probs.argmax().item()
 
+        value: str | int
         if not self.read_class_id:
-            value = self.classes[class_idx]
+            value = self.classes[class_idx]  # type: ignore
         else:
            value = class_idx
 
         feature = Feature(
             STGeometry(
-                metadata["projection"],
-                shapely.Point(metadata["bounds"][0], metadata["bounds"][1]),
+                metadata.projection,
+                shapely.Point(metadata.patch_bounds[0], metadata.patch_bounds[1]),
                 None,
             ),
             {
                 self.property_name: value,
             },
         )
-        if self.prob_property:
+        if self.prob_property is not None and feature.properties is not None:
             feature.properties[self.prob_property] = probs.tolist()
         return [feature]
 
@@ -215,6 +231,8 @@
         image = super().visualize(input_dict, target_dict, output)["image"]
         image = Image.fromarray(image)
         draw = ImageDraw.Draw(image)
+        if target_dict is None:
+            raise ValueError("target_dict is required for visualization")
         target_class = self.classes[target_dict["class"]]
         output_class = self.classes[output.argmax()]
         text = f"Label: {target_class}\nOutput: {output_class}"
@@ -263,28 +281,34 @@
         return MetricCollection(metrics)
 
 
-class ClassificationHead(torch.nn.Module):
+class ClassificationHead(Predictor):
     """Head for classification task."""
 
     def forward(
         self,
-        logits: torch.Tensor,
-        inputs: list[dict[str, Any]],
+        intermediates: Any,
+        context: ModelContext,
         targets: list[dict[str, Any]] | None = None,
-    ) -> tuple[torch.Tensor, dict[str, torch.Tensor]]:
+    ) -> ModelOutput:
         """Compute the classification outputs and loss from logits and targets.
 
         Args:
-            logits: tensor that is (BatchSize, NumClasses) in shape.
-            inputs: original inputs (ignored).
-            targets: should contain class key that stores the class label.
+            intermediates: output from the previous model component, it should be a
+                FeatureVector with a tensor that is (BatchSize, NumClasses) in shape.
+            context: the model context.
+            targets: must contain "class" key that stores the class label, along with
+                "valid" key indicating whether the label is valid for each example.
 
         Returns:
             tuple of outputs and loss dict
         """
+        if not isinstance(intermediates, FeatureVector):
+            raise ValueError("the input to ClassificationHead must be a FeatureVector")
+
+        logits = intermediates.feature_vector
         outputs = torch.nn.functional.softmax(logits, dim=1)
 
-        loss = None
+        losses = {}
         if targets:
             class_labels = torch.stack([target["class"] for target in targets], dim=0)
             mask = torch.stack([target["valid"] for target in targets], dim=0)
@@ -294,9 +318,12 @@ class ClassificationHead(torch.nn.Module):
                 )
                 * mask
             )
-            loss = torch.mean(loss)
+            losses["cls"] = torch.mean(loss)
 
-        return outputs, {"cls": loss}
+        return ModelOutput(
+            outputs=outputs,
+            loss_dict=losses,
+        )
 
 
 class ClassificationMetric(Metric):
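
The hunks above migrate ClassificationHead from a plain torch.nn.Module returning an (outputs, loss_dict) tuple to the new Predictor component API, which takes a FeatureVector and returns a ModelOutput. A minimal sketch of the new contract, assuming FeatureVector accepts a feature_vector keyword and that context may be None (the forward body shown above never reads it); anything not in the diff is illustrative:

    import torch

    from rslearn.models.component import FeatureVector
    from rslearn.train.tasks.classification import ClassificationHead

    head = ClassificationHead()
    logits = torch.randn(4, 3)  # (BatchSize, NumClasses)
    targets = [
        {"class": torch.tensor(i % 3), "valid": torch.tensor(1.0)}
        for i in range(4)
    ]
    # A ModelOutput replaces the old (outputs, loss_dict) tuple.
    out = head.forward(
        FeatureVector(feature_vector=logits), context=None, targets=targets
    )
    print(out.outputs.shape)     # softmax probabilities, torch.Size([4, 3])
    print(out.loss_dict["cls"])  # masked cross-entropy loss
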
rslearn/train/tasks/detection.py +132 -76

@@ -12,26 +12,27 @@ import torchmetrics.classification
 import torchvision
 from torchmetrics import Metric, MetricCollection
 
+from rslearn.train.model_context import RasterImage, SampleMetadata
 from rslearn.utils import Feature, STGeometry
 
 from .task import BasicTask
 
 DEFAULT_COLORS = [
-    [255, 0, 0],
-    [0, 255, 0],
-    [0, 0, 255],
-    [255, 255, 0],
-    [0, 255, 255],
-    [255, 0, 255],
-    [0, 128, 0],
-    [255, 160, 122],
-    [139, 69, 19],
-    [128, 128, 128],
-    [255, 255, 255],
-    [143, 188, 143],
-    [95, 158, 160],
-    [255, 200, 0],
-    [128, 0, 0],
+    (255, 0, 0),
+    (0, 255, 0),
+    (0, 0, 255),
+    (255, 255, 0),
+    (0, 255, 255),
+    (255, 0, 255),
+    (0, 128, 0),
+    (255, 160, 122),
+    (139, 69, 19),
+    (128, 128, 128),
+    (255, 255, 255),
+    (143, 188, 143),
+    (95, 158, 160),
+    (255, 200, 0),
+    (128, 0, 0),
 ]
 
 
@@ -53,14 +54,30 @@ class DetectionTask(BasicTask):
         score_threshold: float = 0.5,
         enable_map_metric: bool = True,
         enable_f1_metric: bool = False,
+        enable_precision_recall: bool = False,
+        f1_metric_thresholds: list[list[float]] = [
+            [
+                0.05,
+                0.1,
+                0.2,
+                0.3,
+                0.4,
+                0.5,
+                0.6,
+                0.7,
+                0.8,
+                0.9,
+                0.95,
+            ]
+        ],
         f1_metric_kwargs: dict[str, Any] = {},
-        **kwargs,
-    ):
-        """Initialize a new SegmentationTask.
+        **kwargs: Any,
+    ) -> None:
+        """Initialize a new DetectionTask.
 
         Args:
-            property_name: the property from which to extract the class name. The class
-                is read from the first matching feature.
+            property_name: the property from which to extract the class name. Features
+                without this property name are ignored.
             classes: a list of class names.
             filters: optional list of (property_name, property_value) to only consider
                 features with matching properties.
@@ -70,14 +87,20 @@ class DetectionTask(BasicTask):
                 not passed via classes, instead of throwing error
             skip_empty_examples: whether to skip examples with zero labels.
             colors: optional colors for each class
-            box_size: force all boxes to be this size, centered at the centroid of the
-                geometry. Required for Point geometries.
+            box_size: force all boxes to be two times this size, centered at the
+                centroid of the geometry. Required for Point geometries.
             clip_boxes: whether to clip boxes to the image bounds.
             exclude_by_center: before optionally clipping boxes, exclude boxes if the
                 center is outside the image bounds.
             score_threshold: confidence threshold for visualization and prediction.
             enable_map_metric: whether to compute mAP (default true)
             enable_f1_metric: whether to compute F1 (default false)
+            enable_precision_recall: whether to compute precision and recall.
+            f1_metric_thresholds: list of list of thresholds to apply for F1 metric, as
+                well as for precision and recall if enabled. Each inner list is used to
+                initialize a separate F1 metric where the best F1 across the thresholds
+                within the inner list is computed. If there are multiple inner lists,
+                then multiple F1 scores will be reported.
             f1_metric_kwargs: extra arguments to pass to F1 metric.
             kwargs: additional arguments to pass to BasicTask
         """
@@ -95,6 +118,8 @@ class DetectionTask(BasicTask):
         self.score_threshold = score_threshold
         self.enable_map_metric = enable_map_metric
         self.enable_f1_metric = enable_f1_metric
+        self.enable_precision_recall = enable_precision_recall
+        self.f1_metric_thresholds = f1_metric_thresholds
         self.f1_metric_kwargs = f1_metric_kwargs
 
         if not self.filters:
@@ -102,8 +127,8 @@ class DetectionTask(BasicTask):
 
     def process_inputs(
         self,
-        raw_inputs: dict[str, torch.Tensor | list[Feature]],
-        metadata: dict[str, Any],
+        raw_inputs: dict[str, RasterImage | list[Feature]],
+        metadata: SampleMetadata,
         load_targets: bool = True,
     ) -> tuple[dict[str, Any], dict[str, Any]]:
         """Processes the data into targets.
@@ -120,15 +145,21 @@ class DetectionTask(BasicTask):
         if not load_targets:
             return {}, {}
 
+        bounds = metadata.patch_bounds
+
         boxes = []
         class_labels = []
         valid = 1
 
         data = raw_inputs["targets"]
+        assert isinstance(data, list)
         for feat in data:
-            for property_name, property_value in self.filters:
-                if feat.properties.get(property_name) != property_value:
-                    continue
+            if feat.properties is None:
+                continue
+            if self.filters is not None:
+                for property_name, property_value in self.filters:
+                    if feat.properties.get(property_name) != property_value:
+                        continue
             if self.property_name not in feat.properties:
                 continue
 
@@ -159,39 +190,33 @@ class DetectionTask(BasicTask):
             else:
                 box = [int(val) for val in shp.bounds]
 
-            if box[0] >= metadata["bounds"][2] or box[2] <= metadata["bounds"][0]:
+            if box[0] >= bounds[2] or box[2] <= bounds[0]:
                 continue
-            if box[1] >= metadata["bounds"][3] or box[3] <= metadata["bounds"][1]:
+            if box[1] >= bounds[3] or box[3] <= bounds[1]:
                 continue
 
             if self.exclude_by_center:
                 center_col = (box[0] + box[2]) // 2
                 center_row = (box[1] + box[3]) // 2
-                if (
-                    center_col <= metadata["bounds"][0]
-                    or center_col >= metadata["bounds"][2]
-                ):
+                if center_col <= bounds[0] or center_col >= bounds[2]:
                     continue
-                if (
-                    center_row <= metadata["bounds"][1]
-                    or center_row >= metadata["bounds"][3]
-                ):
+                if center_row <= bounds[1] or center_row >= bounds[3]:
                     continue
 
             if self.clip_boxes:
                 box = [
-                    np.clip(box[0], metadata["bounds"][0], metadata["bounds"][2]),
-                    np.clip(box[1], metadata["bounds"][1], metadata["bounds"][3]),
-                    np.clip(box[2], metadata["bounds"][0], metadata["bounds"][2]),
-                    np.clip(box[3], metadata["bounds"][1], metadata["bounds"][3]),
+                    np.clip(box[0], bounds[0], bounds[2]),
+                    np.clip(box[1], bounds[1], bounds[3]),
+                    np.clip(box[2], bounds[0], bounds[2]),
+                    np.clip(box[3], bounds[1], bounds[3]),
                 ]
 
             # Convert to relative coordinates.
             box = [
-                box[0] - metadata["bounds"][0],
-                box[1] - metadata["bounds"][1],
-                box[2] - metadata["bounds"][0],
-                box[3] - metadata["bounds"][1],
+                box[0] - bounds[0],
+                box[1] - bounds[1],
+                box[2] - bounds[0],
+                box[3] - bounds[1],
             ]
 
             boxes.append(box)
@@ -211,16 +236,12 @@ class DetectionTask(BasicTask):
             "valid": torch.tensor(valid, dtype=torch.int32),
             "boxes": boxes,
             "labels": class_labels,
-            "width": torch.tensor(
-                metadata["bounds"][2] - metadata["bounds"][0], dtype=torch.float32
-            ),
-            "height": torch.tensor(
-                metadata["bounds"][3] - metadata["bounds"][1], dtype=torch.float32
-            ),
+            "width": torch.tensor(bounds[2] - bounds[0], dtype=torch.float32),
+            "height": torch.tensor(bounds[3] - bounds[1], dtype=torch.float32),
         }
 
     def process_output(
-        self, raw_output: Any, metadata: dict[str, Any]
+        self, raw_output: Any, metadata: SampleMetadata
     ) -> npt.NDArray[Any] | list[Feature]:
         """Processes an output into raster or vector data.
 
@@ -240,13 +261,13 @@ class DetectionTask(BasicTask):
         features = []
         for box, class_id, score in zip(boxes, class_ids, scores):
             shp = shapely.box(
-                metadata["bounds"][0] + float(box[0]),
-                metadata["bounds"][1] + float(box[1]),
-                metadata["bounds"][0] + float(box[2]),
-                metadata["bounds"][1] + float(box[3]),
+                metadata.patch_bounds[0] + float(box[0]),
+                metadata.patch_bounds[1] + float(box[1]),
+                metadata.patch_bounds[0] + float(box[2]),
+                metadata.patch_bounds[1] + float(box[3]),
             )
-            geom = STGeometry(metadata["projection"], shp, None)
-            properties = {
+            geom = STGeometry(metadata.projection, shp, None)
+            properties: dict[str, Any] = {
                 "score": float(score),
             }
 
@@ -278,7 +299,9 @@ class DetectionTask(BasicTask):
         """
         image = super().visualize(input_dict, target_dict, output)["image"]
 
-        def draw_boxes(image: npt.NDArray[Any], d: dict[str, torch.Tensor]):
+        def draw_boxes(
+            image: npt.NDArray[Any], d: dict[str, torch.Tensor]
+        ) -> npt.NDArray[Any]:
             boxes = d["boxes"].cpu().numpy()
             class_ids = d["labels"].cpu().numpy()
             if "scores" in d:
@@ -299,6 +322,8 @@ class DetectionTask(BasicTask):
 
             return image
 
+        if target_dict is None:
+            raise ValueError("target_dict is required for visualization")
         return {
             "gt": draw_boxes(image.copy(), target_dict),
             "pred": draw_boxes(image.copy(), output),
@@ -307,17 +332,46 @@ class DetectionTask(BasicTask):
     def get_metrics(self) -> MetricCollection:
         """Get the metrics for this task."""
         metrics = {}
+
         if self.enable_map_metric:
             metrics["mAP"] = DetectionMetric(
                 torchmetrics.detection.mean_ap.MeanAveragePrecision(),
                 output_key="map",
             )
-        if self.enable_f1_metric:
+
+        if self.enable_f1_metric or self.enable_precision_recall:
             kwargs = dict(
                 num_classes=len(self.classes),
             )
             kwargs.update(self.f1_metric_kwargs)
-            metrics["F1"] = DetectionMetric(F1Metric(**kwargs))
+
+            for thresholds in self.f1_metric_thresholds:
+                if len(self.f1_metric_thresholds) == 1:
+                    suffix = ""
+                else:
+                    # Metric name can't contain "." so change to ",".
+                    suffix = "_" + str(thresholds[0]).replace(".", ",")
+
+                if self.enable_f1_metric:
+                    metrics["F1" + suffix] = DetectionMetric(
+                        F1Metric(score_thresholds=thresholds, **kwargs)  # type: ignore
+                    )
+                if self.enable_precision_recall:
+                    metrics["precision" + suffix] = DetectionMetric(
+                        F1Metric(
+                            score_thresholds=thresholds,
+                            metric_mode="precision",
+                            **kwargs,  # type: ignore
+                        )
+                    )
+                    metrics["recall" + suffix] = DetectionMetric(
+                        F1Metric(
+                            score_thresholds=thresholds,
+                            metric_mode="recall",
+                            **kwargs,  # type: ignore
+                        )
+                    )
+
         return MetricCollection(metrics)
 
 
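
To make the suffix logic in get_metrics concrete, a hedged sketch (constructor arguments beyond those documented in this diff are omitted): with multiple inner threshold lists, each metric name is suffixed with the first threshold of its list, with "." changed to "," because metric names cannot contain ".".

    task = DetectionTask(
        property_name="category",
        classes=["unknown", "vessel"],
        enable_f1_metric=True,
        enable_precision_recall=True,
        f1_metric_thresholds=[[0.5], [0.9]],
    )
    metrics = task.get_metrics()
    # Expected keys: "mAP", "F1_0,5", "precision_0,5", "recall_0,5",
    # "F1_0,9", "precision_0,9", "recall_0,9".
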
@@ -377,22 +431,11 @@ class F1Metric(Metric):
     def __init__(
         self,
         num_classes: int,
+        score_thresholds: list[float],
         cmp_mode: str = "iou",
         cmp_threshold: float = 0.5,
-        score_thresholds: list[float] = [
-            0.05,
-            0.1,
-            0.2,
-            0.3,
-            0.4,
-            0.5,
-            0.6,
-            0.7,
-            0.8,
-            0.9,
-            0.95,
-        ],
         flatten_classes: bool = False,
+        metric_mode: str = "f1",
     ):
         """Create a new F1Metric.
 
@@ -406,6 +449,8 @@ class F1Metric(Metric):
             flatten_classes: sum true positives, false positives, and false negatives
                 across classes and report combined F1 instead of computing F1 score for
                 each class and then reporting the average.
+            metric_mode: set to "precision" or "recall" to return that instead of F1
+                (default "f1")
         """
         super().__init__()
         self.num_classes = num_classes
@@ -413,6 +458,10 @@ class F1Metric(Metric):
         self.cmp_threshold = cmp_threshold
         self.score_thresholds = score_thresholds
         self.flatten_classes = flatten_classes
+        self.metric_mode = metric_mode
+
+        assert self.cmp_mode in ["iou", "distance"]
+        assert self.metric_mode in ["f1", "precision", "recall"]
 
         for cls_idx in range(self.num_classes):
             for thr_idx in range(len(self.score_thresholds)):
@@ -531,8 +580,15 @@ class F1Metric(Metric):
                 else:
                     f1 = 2 * precision * recall / (precision + recall)
 
-                if best_score is None or f1 > best_score:
-                    best_score = f1
+                if self.metric_mode == "f1":
+                    score = f1
+                elif self.metric_mode == "precision":
+                    score = precision
+                elif self.metric_mode == "recall":
+                    score = recall
+
+                if best_score is None or score > best_score:
+                    best_score = score
 
             best_scores.append(best_score)
 
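
The compute logic above evaluates precision, recall, and F1 at each score threshold, picks whichever statistic metric_mode names, and reports the best value across the thresholds. A self-contained numeric sketch of that selection (plain Python, not the torchmetrics API):

    def best_score(counts: list[tuple[int, int, int]], metric_mode: str = "f1") -> float:
        """Report the best metric_mode value across score thresholds.

        counts holds (tp, fp, fn) tallies at each score threshold.
        """
        best = 0.0
        for tp, fp, fn in counts:
            precision = tp / (tp + fp) if tp + fp > 0 else 0.0
            recall = tp / (tp + fn) if tp + fn > 0 else 0.0
            if precision + recall == 0:
                f1 = 0.0
            else:
                f1 = 2 * precision * recall / (precision + recall)
            score = {"f1": f1, "precision": precision, "recall": recall}[metric_mode]
            best = max(best, score)
        return best

    # (tp, fp, fn) at score thresholds 0.5 and 0.9:
    print(best_score([(8, 4, 2), (6, 1, 4)], "f1"))         # ~0.727, from threshold 0.5
    print(best_score([(8, 4, 2), (6, 1, 4)], "precision"))  # ~0.857, from threshold 0.9
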
rslearn/train/tasks/embedding.py +120 -0 (new file)

@@ -0,0 +1,120 @@
+"""Embedding task."""
+
+from typing import Any
+
+import numpy.typing as npt
+import torch
+from torchmetrics import MetricCollection
+
+from rslearn.models.component import FeatureMaps
+from rslearn.train.model_context import ModelContext, ModelOutput, SampleMetadata
+from rslearn.utils import Feature
+
+from .task import Task
+
+
+class EmbeddingTask(Task):
+    """A dummy task for computing embeddings.
+
+    This task does not compute any targets or loss. Instead, it is just set up for
+    inference, to save embeddings from the configured model.
+    """
+
+    def process_inputs(
+        self,
+        raw_inputs: dict[str, torch.Tensor],
+        metadata: SampleMetadata,
+        load_targets: bool = True,
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
+        """Processes the data into targets.
+
+        Args:
+            raw_inputs: raster or vector data to process
+            metadata: metadata about the patch being read
+            load_targets: whether to load the targets or only inputs
+
+        Returns:
+            tuple (input_dict, target_dict) containing the processed inputs and targets
+            that are compatible with both metrics and loss functions
+        """
+        return {}, {}
+
+    def process_output(
+        self, raw_output: Any, metadata: SampleMetadata
+    ) -> npt.NDArray[Any] | list[Feature]:
+        """Processes an output into raster or vector data.
+
+        Args:
+            raw_output: the output from prediction head, which must be a CxHxW tensor.
+            metadata: metadata about the patch being read
+
+        Returns:
+            either raster or vector data.
+        """
+        if not isinstance(raw_output, torch.Tensor) or len(raw_output.shape) != 3:
+            raise ValueError(
+                "output for EmbeddingTask must be a tensor with three dimensions"
+            )
+
+        # Just convert the raw output to numpy array that can be saved to GeoTIFF.
+        return raw_output.cpu().numpy()
+
+    def visualize(
+        self,
+        input_dict: dict[str, Any],
+        target_dict: dict[str, Any] | None,
+        output: Any,
+    ) -> dict[str, npt.NDArray[Any]]:
+        """Visualize the outputs and targets.
+
+        Args:
+            input_dict: the input dict from process_inputs
+            target_dict: the target dict from process_inputs
+            output: the prediction
+
+        Returns:
+            a dictionary mapping image name to visualization image
+        """
+        # EmbeddingTask is only set up to support `model predict`.
+        raise NotImplementedError
+
+    def get_metrics(self) -> MetricCollection:
+        """Get the metrics for this task."""
+        return MetricCollection({})
+
+
+class EmbeddingHead:
+    """Head for embedding task.
+
+    It just adds a dummy loss to act as a Predictor.
+    """
+
+    def forward(
+        self,
+        intermediates: Any,
+        context: ModelContext,
+        targets: list[dict[str, Any]] | None = None,
+    ) -> ModelOutput:
+        """Return the feature map along with a dummy loss.
+
+        Args:
+            intermediates: output from the previous model component, which must be a
+                FeatureMaps consisting of a single feature map.
+            context: the model context.
+            targets: the targets (ignored).
+
+        Returns:
+            model output with the feature map that was input to this component along
+            with a dummy loss.
+        """
+        if not isinstance(intermediates, FeatureMaps):
+            raise ValueError("input to EmbeddingHead must be a FeatureMaps")
+        if len(intermediates.feature_maps) != 1:
+            raise ValueError(
+                f"input to EmbeddingHead must have one feature map, but got {len(intermediates.feature_maps)}"
+            )
+
+        return ModelOutput(
+            outputs=intermediates.feature_maps[0],
+            loss_dict={"loss": 0},
+        )
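
A hedged sketch of the EmbeddingHead contract added above, assuming FeatureMaps accepts a feature_maps keyword and that context may be None (the forward body never reads it):

    import torch

    from rslearn.models.component import FeatureMaps
    from rslearn.train.tasks.embedding import EmbeddingHead

    head = EmbeddingHead()
    fmap = torch.randn(2, 128, 16, 16)  # a single feature map
    out = head.forward(FeatureMaps(feature_maps=[fmap]), context=None)
    assert out.outputs is fmap           # the embedding passes through unchanged
    assert out.loss_dict == {"loss": 0}  # dummy loss; the task is inference-only
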