rslearn 0.0.1__py3-none-any.whl → 0.0.21__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (166) hide show
  1. rslearn/arg_parser.py +31 -0
  2. rslearn/config/__init__.py +6 -12
  3. rslearn/config/dataset.py +520 -401
  4. rslearn/const.py +9 -15
  5. rslearn/data_sources/__init__.py +8 -23
  6. rslearn/data_sources/aws_landsat.py +242 -98
  7. rslearn/data_sources/aws_open_data.py +111 -151
  8. rslearn/data_sources/aws_sentinel1.py +131 -0
  9. rslearn/data_sources/climate_data_store.py +471 -0
  10. rslearn/data_sources/copernicus.py +884 -12
  11. rslearn/data_sources/data_source.py +43 -12
  12. rslearn/data_sources/earthdaily.py +484 -0
  13. rslearn/data_sources/earthdata_srtm.py +282 -0
  14. rslearn/data_sources/eurocrops.py +242 -0
  15. rslearn/data_sources/gcp_public_data.py +578 -222
  16. rslearn/data_sources/google_earth_engine.py +461 -135
  17. rslearn/data_sources/local_files.py +219 -150
  18. rslearn/data_sources/openstreetmap.py +51 -89
  19. rslearn/data_sources/planet.py +24 -60
  20. rslearn/data_sources/planet_basemap.py +275 -0
  21. rslearn/data_sources/planetary_computer.py +798 -0
  22. rslearn/data_sources/usda_cdl.py +195 -0
  23. rslearn/data_sources/usgs_landsat.py +115 -83
  24. rslearn/data_sources/utils.py +249 -61
  25. rslearn/data_sources/vector_source.py +1 -0
  26. rslearn/data_sources/worldcereal.py +449 -0
  27. rslearn/data_sources/worldcover.py +144 -0
  28. rslearn/data_sources/worldpop.py +153 -0
  29. rslearn/data_sources/xyz_tiles.py +150 -107
  30. rslearn/dataset/__init__.py +8 -2
  31. rslearn/dataset/add_windows.py +2 -2
  32. rslearn/dataset/dataset.py +40 -51
  33. rslearn/dataset/handler_summaries.py +131 -0
  34. rslearn/dataset/manage.py +313 -74
  35. rslearn/dataset/materialize.py +431 -107
  36. rslearn/dataset/remap.py +29 -4
  37. rslearn/dataset/storage/__init__.py +1 -0
  38. rslearn/dataset/storage/file.py +202 -0
  39. rslearn/dataset/storage/storage.py +140 -0
  40. rslearn/dataset/window.py +181 -44
  41. rslearn/lightning_cli.py +454 -0
  42. rslearn/log_utils.py +24 -0
  43. rslearn/main.py +384 -181
  44. rslearn/models/anysat.py +215 -0
  45. rslearn/models/attention_pooling.py +177 -0
  46. rslearn/models/clay/clay.py +231 -0
  47. rslearn/models/clay/configs/metadata.yaml +295 -0
  48. rslearn/models/clip.py +68 -0
  49. rslearn/models/component.py +111 -0
  50. rslearn/models/concatenate_features.py +103 -0
  51. rslearn/models/conv.py +63 -0
  52. rslearn/models/croma.py +306 -0
  53. rslearn/models/detr/__init__.py +5 -0
  54. rslearn/models/detr/box_ops.py +103 -0
  55. rslearn/models/detr/detr.py +504 -0
  56. rslearn/models/detr/matcher.py +107 -0
  57. rslearn/models/detr/position_encoding.py +114 -0
  58. rslearn/models/detr/transformer.py +429 -0
  59. rslearn/models/detr/util.py +24 -0
  60. rslearn/models/dinov3.py +177 -0
  61. rslearn/models/faster_rcnn.py +30 -28
  62. rslearn/models/feature_center_crop.py +53 -0
  63. rslearn/models/fpn.py +19 -8
  64. rslearn/models/galileo/__init__.py +5 -0
  65. rslearn/models/galileo/galileo.py +595 -0
  66. rslearn/models/galileo/single_file_galileo.py +1678 -0
  67. rslearn/models/module_wrapper.py +65 -0
  68. rslearn/models/molmo.py +69 -0
  69. rslearn/models/multitask.py +384 -28
  70. rslearn/models/olmoearth_pretrain/__init__.py +1 -0
  71. rslearn/models/olmoearth_pretrain/model.py +421 -0
  72. rslearn/models/olmoearth_pretrain/norm.py +86 -0
  73. rslearn/models/panopticon.py +170 -0
  74. rslearn/models/panopticon_data/sensors/drone.yaml +32 -0
  75. rslearn/models/panopticon_data/sensors/enmap.yaml +904 -0
  76. rslearn/models/panopticon_data/sensors/goes.yaml +9 -0
  77. rslearn/models/panopticon_data/sensors/himawari.yaml +9 -0
  78. rslearn/models/panopticon_data/sensors/intuition.yaml +606 -0
  79. rslearn/models/panopticon_data/sensors/landsat8.yaml +84 -0
  80. rslearn/models/panopticon_data/sensors/modis_terra.yaml +99 -0
  81. rslearn/models/panopticon_data/sensors/qb2_ge1.yaml +34 -0
  82. rslearn/models/panopticon_data/sensors/sentinel1.yaml +85 -0
  83. rslearn/models/panopticon_data/sensors/sentinel2.yaml +97 -0
  84. rslearn/models/panopticon_data/sensors/superdove.yaml +60 -0
  85. rslearn/models/panopticon_data/sensors/wv23.yaml +63 -0
  86. rslearn/models/pick_features.py +17 -10
  87. rslearn/models/pooling_decoder.py +60 -7
  88. rslearn/models/presto/__init__.py +5 -0
  89. rslearn/models/presto/presto.py +297 -0
  90. rslearn/models/presto/single_file_presto.py +926 -0
  91. rslearn/models/prithvi.py +1147 -0
  92. rslearn/models/resize_features.py +59 -0
  93. rslearn/models/sam2_enc.py +13 -9
  94. rslearn/models/satlaspretrain.py +38 -18
  95. rslearn/models/simple_time_series.py +188 -77
  96. rslearn/models/singletask.py +24 -13
  97. rslearn/models/ssl4eo_s12.py +40 -30
  98. rslearn/models/swin.py +44 -32
  99. rslearn/models/task_embedding.py +250 -0
  100. rslearn/models/terramind.py +256 -0
  101. rslearn/models/trunk.py +139 -0
  102. rslearn/models/unet.py +68 -22
  103. rslearn/models/upsample.py +48 -0
  104. rslearn/models/use_croma.py +508 -0
  105. rslearn/template_params.py +26 -0
  106. rslearn/tile_stores/__init__.py +41 -18
  107. rslearn/tile_stores/default.py +409 -0
  108. rslearn/tile_stores/tile_store.py +236 -132
  109. rslearn/train/all_patches_dataset.py +530 -0
  110. rslearn/train/callbacks/adapters.py +53 -0
  111. rslearn/train/callbacks/freeze_unfreeze.py +348 -17
  112. rslearn/train/callbacks/gradients.py +129 -0
  113. rslearn/train/callbacks/peft.py +116 -0
  114. rslearn/train/data_module.py +444 -20
  115. rslearn/train/dataset.py +588 -235
  116. rslearn/train/lightning_module.py +192 -62
  117. rslearn/train/model_context.py +88 -0
  118. rslearn/train/optimizer.py +31 -0
  119. rslearn/train/prediction_writer.py +319 -84
  120. rslearn/train/scheduler.py +92 -0
  121. rslearn/train/tasks/classification.py +55 -28
  122. rslearn/train/tasks/detection.py +132 -76
  123. rslearn/train/tasks/embedding.py +120 -0
  124. rslearn/train/tasks/multi_task.py +28 -14
  125. rslearn/train/tasks/per_pixel_regression.py +291 -0
  126. rslearn/train/tasks/regression.py +161 -44
  127. rslearn/train/tasks/segmentation.py +428 -53
  128. rslearn/train/tasks/task.py +6 -5
  129. rslearn/train/transforms/__init__.py +1 -1
  130. rslearn/train/transforms/concatenate.py +54 -10
  131. rslearn/train/transforms/crop.py +29 -11
  132. rslearn/train/transforms/flip.py +18 -6
  133. rslearn/train/transforms/mask.py +78 -0
  134. rslearn/train/transforms/normalize.py +101 -17
  135. rslearn/train/transforms/pad.py +19 -7
  136. rslearn/train/transforms/resize.py +83 -0
  137. rslearn/train/transforms/select_bands.py +76 -0
  138. rslearn/train/transforms/sentinel1.py +75 -0
  139. rslearn/train/transforms/transform.py +89 -70
  140. rslearn/utils/__init__.py +2 -6
  141. rslearn/utils/array.py +8 -6
  142. rslearn/utils/feature.py +2 -2
  143. rslearn/utils/fsspec.py +90 -1
  144. rslearn/utils/geometry.py +347 -7
  145. rslearn/utils/get_utm_ups_crs.py +2 -3
  146. rslearn/utils/grid_index.py +5 -5
  147. rslearn/utils/jsonargparse.py +178 -0
  148. rslearn/utils/mp.py +4 -3
  149. rslearn/utils/raster_format.py +268 -116
  150. rslearn/utils/rtree_index.py +64 -17
  151. rslearn/utils/sqlite_index.py +7 -1
  152. rslearn/utils/vector_format.py +252 -97
  153. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/METADATA +532 -283
  154. rslearn-0.0.21.dist-info/RECORD +167 -0
  155. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/WHEEL +1 -1
  156. rslearn-0.0.21.dist-info/licenses/NOTICE +115 -0
  157. rslearn/data_sources/raster_source.py +0 -309
  158. rslearn/models/registry.py +0 -5
  159. rslearn/tile_stores/file.py +0 -242
  160. rslearn/utils/mgrs.py +0 -24
  161. rslearn/utils/utils.py +0 -22
  162. rslearn-0.0.1.dist-info/RECORD +0 -88
  163. /rslearn/{data_sources/geotiff.py → py.typed} +0 -0
  164. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/entry_points.txt +0 -0
  165. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info/licenses}/LICENSE +0 -0
  166. {rslearn-0.0.1.dist-info → rslearn-0.0.21.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,297 @@
1
+ """Presto wrapper to ingest Masked Helios Samples."""
2
+
3
+ import logging
4
+ import tempfile
5
+ from datetime import datetime
6
+
7
+ import torch
8
+ from einops import rearrange, repeat
9
+ from huggingface_hub import hf_hub_download
10
+ from upath import UPath
11
+
12
+ from rslearn.models.component import FeatureExtractor, FeatureMaps
13
+ from rslearn.models.presto.single_file_presto import (
14
+ ERA5_BANDS,
15
+ NUM_DYNAMIC_WORLD_CLASSES,
16
+ PRESTO_ADD_BY,
17
+ PRESTO_BANDS,
18
+ PRESTO_DIV_BY,
19
+ PRESTO_S1_BANDS,
20
+ PRESTO_S2_BANDS,
21
+ SRTM_BANDS,
22
+ )
23
+ from rslearn.models.presto.single_file_presto import Presto as SFPresto
24
+ from rslearn.train.model_context import ModelContext
25
+
26
logger = logging.getLogger(__name__)

# Band lists actually accepted by this wrapper: identical to the Presto band
# lists from single_file_presto, except that B09 is excluded from the inputs.
INPUT_PRESTO_BANDS = [band for band in PRESTO_BANDS if band != "B09"]
INPUT_PRESTO_S2_BANDS = [band for band in PRESTO_S2_BANDS if band != "B09"]

# Per-sensor normalization constants (subtract, then divide).
# NOTE(review): these are not referenced elsewhere in this module's visible
# code — presumably consumed by callers preparing inputs; confirm.
PRESTO_S1_SUBTRACT_VALUE = -25.0
PRESTO_S1_DIV_VALUE = 25.0
PRESTO_S2_SUBTRACT_VALUE = 0.0
PRESTO_S2_DIV_VALUE = 1e4

# Hugging Face Hub location of the pretrained Presto checkpoint.
HF_HUB_ID = "nasaharvest/presto"
MODEL_FILENAME = "default_model.pt"
38
+
39
+
40
class Presto(FeatureExtractor):
    """Presto wrapper around the single-file Presto encoder.

    Presto encodes per-pixel timeseries, so forward() flattens the spatial
    dimensions into the batch, encodes pixels in chunks of pixel_batch_size,
    and reshapes the embeddings back into a per-pixel feature map.
    """

    # ModelContext input keys this wrapper consumes; other keys are ignored.
    input_keys = [
        "s1",
        "s2",
        "era5",
        "srtm",
        "dynamic_world",
        "latlon",
    ]

    def __init__(
        self,
        pretrained_path: str | UPath | None = None,
        pixel_batch_size: int = 128,
    ):
        """Initialize the Presto wrapper.

        Downloads the pretrained weights from Hugging Face Hub if they are not
        already present at pretrained_path, loads them, and keeps only the
        encoder.

        Args:
            pretrained_path: The directory to load from (and download into if
                the weights file is missing). Defaults to a cache directory
                under the system temp dir.
            pixel_batch_size: If the input has a h,w dimension >1, this is
                flattened into a batch dimension (b h w) before being passed
                to the model (since Presto is designed for pixel timeseries).
                The flattened pixels are encoded in chunks of this size.
        """
        super().__init__()

        if pretrained_path is None:
            pretrained_path = UPath(tempfile.gettempdir(), "rslearn_cache", "presto")
        if not (UPath(pretrained_path) / MODEL_FILENAME).exists():
            _ = hf_hub_download(
                local_dir=UPath(pretrained_path),
                repo_id=HF_HUB_ID,
                filename=MODEL_FILENAME,
                # pin the model to a specific hugging face commit
                revision="1b97f885969da4e2d5834ca8c92707c737911464",
            )

        model = SFPresto.construct()
        model.load_state_dict(
            torch.load(
                UPath(pretrained_path) / MODEL_FILENAME,
                map_location="cpu",
                # weights_only avoids arbitrary code execution during load
                weights_only=True,
            )
        )
        self.pixel_batch_size = pixel_batch_size
        # Only the encoder is kept; the rest of the Presto model is discarded.
        self.model = model.encoder
        self.month = 6  # default month used when no timestamps are available

    def construct_presto_input(
        self,
        s1: torch.Tensor | None = None,
        s1_bands: list[str] | None = None,
        s2: torch.Tensor | None = None,
        s2_bands: list[str] | None = None,
        era5: torch.Tensor | None = None,
        era5_bands: list[str] | None = None,
        srtm: torch.Tensor | None = None,
        srtm_bands: list[str] | None = None,
        dynamic_world: torch.Tensor | None = None,
        months: torch.Tensor | None = None,
        normalize: bool = True,
    ) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor]:
        """Assemble per-modality tensors into a single Presto input.

        Inputs are paired into a tensor input <X> and a list <X>_bands naming
        the channels of <X>. Each <X> should be channels-first with shape
        (b, len(<X>_bands), num_timesteps, h, w), with the following bands for
        each input:

        s1: ["VV", "VH"]
        s2: ["B2", "B3", "B4", "B5", "B6", "B7", "B8", "B8A", "B9", "B11", "B12"]
        era5: ["temperature_2m", "total_precipitation"]
            "temperature_2m": Temperature of air at 2m above the surface of land,
            sea or in-land waters in Kelvin (K)
            "total_precipitation": Accumulated liquid and frozen water, including rain and snow,
            that falls to the Earth's surface. Measured in metres (m)
        srtm: ["elevation", "slope"]

        dynamic_world has shape (b, num_timesteps, h, w), the dynamic world
        class of each pixel at each timestep. If None, it is filled with
        NUM_DYNAMIC_WORLD_CLASSES (presumably the "no data" sentinel — confirm
        in single_file_presto).

        Returns:
            a tuple (x, mask, dynamic_world, months) where x and mask have
            shape (b, t, h, w, len(INPUT_PRESTO_BANDS)); mask is 1 where a
            band was not provided; dynamic_world and months are long tensors.
        """
        # Collect each dimension across the provided modalities so we can
        # check they agree before merging.
        bs = [x.shape[0] for x in [s1, s2, era5, srtm] if x is not None]
        ts = [x.shape[2] for x in [s1, s2, era5, srtm] if x is not None]
        hs = [x.shape[3] for x in [s1, s2, era5, srtm] if x is not None]
        ws = [x.shape[4] for x in [s1, s2, era5, srtm] if x is not None]
        devices = [x.device for x in [s1, s2, era5, srtm] if x is not None]

        # All provided modalities must share batch/time/spatial dims and device.
        assert len(set(bs)) == 1
        assert len(set(hs)) == 1
        assert len(set(ws)) == 1
        assert len(set(devices)) == 1
        assert len(set(ts)) == 1
        b, h, w, t, device = bs[0], hs[0], ws[0], ts[0], devices[0]
        # these values will be initialized as
        # we iterate through the data
        x: torch.Tensor | None = None
        mask: torch.Tensor | None = None

        for band_group in [
            (s1, s1_bands),
            (s2, s2_bands),
            (era5, era5_bands),
            (srtm, srtm_bands),
        ]:
            data, input_bands = band_group
            if data is not None:
                assert input_bands is not None
            else:
                continue

            # channels-last so bands can be scattered into x's last dimension
            data = rearrange(data, "b c t h w -> b t h w c")
            if x is None:
                x = torch.zeros(b, t, h, w, len(INPUT_PRESTO_BANDS), device=device)
            if mask is None:
                # 1 marks "band missing"; provided bands are cleared to 0 below
                mask = torch.ones(b, t, h, w, len(INPUT_PRESTO_BANDS), device=device)

            # construct a mapping from the input bands to the presto input bands
            input_to_output_mapping = [
                INPUT_PRESTO_BANDS.index(val) for val in input_bands
            ]
            x[:, :, :, :, input_to_output_mapping] = data
            mask[:, :, :, :, input_to_output_mapping] = 0

        # At least one modality must have been provided.
        assert x is not None
        assert mask is not None
        assert t is not None

        if dynamic_world is None:
            dynamic_world = (
                torch.ones(b, t, h, w, device=device) * NUM_DYNAMIC_WORLD_CLASSES
            )

        if months is None:
            # Fall back to the wrapper's default month for every timestep.
            months = torch.ones((b, t), device=device) * self.month
        else:
            assert months.shape[-1] == t

        if normalize:
            # NOTE(review): PRESTO_ADD_BY / PRESTO_DIV_BY come from
            # single_file_presto; this assumes they broadcast against the
            # len(INPUT_PRESTO_BANDS) channel dimension (i.e. B09 handling is
            # consistent) — confirm.
            x = (x + PRESTO_ADD_BY.to(device=device)) / PRESTO_DIV_BY.to(device=device)
        return x, mask, dynamic_world.long(), months.long()

    @staticmethod
    def time_ranges_to_timestamps(
        time_ranges: list[tuple[datetime, datetime]],
        device: torch.device,
    ) -> torch.Tensor:
        """Turn the time ranges stored in a RasterImage to timestamps accepted by Presto.

        Presto only uses the month associated with each timestamp, so we take
        the midpoint of the time range. For some inputs (e.g. Sentinel 2) we
        take an image from a specific time so that
        start_time == end_time == mid_time.
        """
        mid_ranges = [t[0] + ((t[1] - t[0]) / 2) for t in time_ranges]
        # months are indexed 0-11
        return torch.tensor(
            [d.month - 1 for d in mid_ranges], dtype=torch.int32, device=device
        )

    def forward(self, context: ModelContext) -> FeatureMaps:
        """Compute feature maps from the Presto backbone.

        Args:
            context: the model context. Input dicts should have some subset of Presto.input_keys.

        Returns:
            a FeatureMaps with one feature map that is at the same resolution as the
            input (since Presto operates per-pixel).
        """
        time_modalities = ["s1", "s2", "era5"]
        stacked_inputs = {}
        latlons: torch.Tensor | None = None
        months: torch.Tensor | None = None
        for key in context.inputs[0].keys():
            # assume all the keys in an input are consistent
            if key in self.input_keys:
                if key == "latlon":
                    # latlon is handled separately; it is not a Presto band input.
                    latlons = torch.stack(
                        [inp[key].image for inp in context.inputs], dim=0
                    )
                else:
                    stacked_inputs[key] = torch.stack(
                        [inp[key].image for inp in context.inputs], dim=0
                    )
                    # Derive months once, from the first time-varying modality
                    # that carries timestamps.
                    if key in time_modalities:
                        if months is None:
                            if context.inputs[0][key].timestamps is not None:
                                months = torch.stack(
                                    [
                                        self.time_ranges_to_timestamps(
                                            inp[key].timestamps,  # type: ignore
                                            device=stacked_inputs[key].device,
                                        )
                                        for inp in context.inputs
                                    ],
                                    dim=0,
                                )
        if months is not None:
            stacked_inputs["months"] = months

        (
            x,
            mask,
            dynamic_world,
            months,
        ) = self.construct_presto_input(
            **stacked_inputs,
            s1_bands=PRESTO_S1_BANDS,
            s2_bands=INPUT_PRESTO_S2_BANDS,
            era5_bands=ERA5_BANDS,
            srtm_bands=SRTM_BANDS,
            normalize=True,
        )
        b, _, h, w, _ = x.shape

        output_features = torch.zeros(
            b * h * w, self.model.embedding_size, device=x.device
        )

        # Flatten spatial dims into the batch so Presto sees pixel timeseries.
        x = rearrange(x, "b t h w d -> (b h w) t d")
        mask = rearrange(mask, "b t h w d -> (b h w) t d")
        dynamic_world = rearrange(dynamic_world, "b t h w -> (b h w) t")
        months = repeat(months, "b t -> (b h w) t", h=h, w=w)
        if latlons is not None:
            latlons = rearrange(latlons, "b c h w -> (b h w) c")

        # Encode the flattened pixels in chunks to bound peak memory.
        for batch_idx in range(0, b * h * w, self.pixel_batch_size):
            x_b = x[batch_idx : batch_idx + self.pixel_batch_size]
            mask_b = mask[batch_idx : batch_idx + self.pixel_batch_size]
            dw = dynamic_world[batch_idx : batch_idx + self.pixel_batch_size]
            months_b = months[batch_idx : batch_idx + self.pixel_batch_size]
            if latlons is not None:
                l_b = latlons[batch_idx : batch_idx + self.pixel_batch_size]
            else:
                l_b = None
            output_b = self.model(
                x=x_b,
                dynamic_world=dw,
                mask=mask_b,
                month=months_b,
                latlons=l_b,
                eval_task=True,
            )
            output_features[batch_idx : batch_idx + self.pixel_batch_size] = output_b

        # Restore the (b, d, h, w) feature-map layout expected by FeatureMaps.
        return FeatureMaps(
            [rearrange(output_features, "(b h w) d -> b d h w", h=h, w=w, b=b)]
        )

    def get_backbone_channels(self) -> list:
        """Returns the output channels of this model when used as a backbone.

        The output channels is a list of (patch_size, depth) that corresponds
        to the feature maps that the backbone returns.

        Returns:
            the output channels of the backbone as a list of (patch_size, depth) tuples.
        """
        # NOTE(review): the hard-coded depth 128 assumes the encoder embedding
        # size is 128; forward() uses self.model.embedding_size — confirm they
        # agree.
        return [(1, 128)]