geoai-py 0.15.0__py2.py3-none-any.whl → 0.17.0__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,67 @@
+"""Structured output models for STAC catalog search results."""
+
+from typing import Any, Dict, List, Optional
+
+from pydantic import BaseModel, Field
+
+
+class STACCollectionInfo(BaseModel):
+    """Information about a STAC collection."""
+
+    id: str = Field(..., description="Collection identifier")
+    title: str = Field(..., description="Collection title")
+    description: Optional[str] = Field(None, description="Collection description")
+    license: Optional[str] = Field(None, description="License information")
+    temporal_extent: Optional[str] = Field(
+        None, description="Temporal extent (start/end dates)"
+    )
+    spatial_extent: Optional[str] = Field(None, description="Spatial bounding box")
+    providers: Optional[str] = Field(None, description="Data providers")
+    keywords: Optional[str] = Field(None, description="Keywords")
+
+
+class STACAssetInfo(BaseModel):
+    """Information about a STAC item asset."""
+
+    key: str = Field(..., description="Asset key/identifier")
+    title: Optional[str] = Field(None, description="Asset title")
+
+
+class STACItemInfo(BaseModel):
+    """Information about a STAC item."""
+
+    id: str = Field(..., description="Item identifier")
+    collection: str = Field(..., description="Collection ID")
+    datetime: Optional[str] = Field(None, description="Acquisition datetime")
+    bbox: Optional[List[float]] = Field(
+        None, description="Bounding box [west, south, east, north]"
+    )
+    assets: List[STACAssetInfo] = Field(
+        default_factory=list, description="Available assets"
+    )
+    # properties: Optional[Dict[str, Any]] = Field(
+    #     None, description="Additional metadata properties"
+    # )
+
+
+class STACSearchResult(BaseModel):
+    """Container for STAC search results."""
+
+    query: str = Field(..., description="Original search query")
+    collection: Optional[str] = Field(None, description="Collection searched")
+    item_count: int = Field(..., description="Number of items found")
+    items: List[STACItemInfo] = Field(
+        default_factory=list, description="List of STAC items"
+    )
+    bbox: Optional[List[float]] = Field(None, description="Search bounding box used")
+    time_range: Optional[str] = Field(None, description="Time range used for search")
+
+
+class LocationInfo(BaseModel):
+    """Geographic location information."""
+
+    name: str = Field(..., description="Location name")
+    bbox: List[float] = Field(
+        ..., description="Bounding box [west, south, east, north]"
+    )
+    center: List[float] = Field(..., description="Center coordinates [lon, lat]")
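A rough sketch of how these models compose, with hypothetical values (the classes are assumed to be in scope from the new stac_models module above; its full path inside the package is not shown in this diff):

import json

# Hypothetical Sentinel-2 item with a single asset
item = STACItemInfo(
    id="S2B_MSIL2A_20240915_EXAMPLE",
    collection="sentinel-2-l2a",
    datetime="2024-09-15T18:49:19Z",
    bbox=[-122.5, 37.7, -122.3, 37.8],
    assets=[STACAssetInfo(key="B04", title="Band 4 - Red")],
)

result = STACSearchResult(
    query="Collection: sentinel-2-l2a",
    collection="sentinel-2-l2a",
    item_count=1,
    items=[item],
    bbox=[-122.5, 37.7, -122.3, 37.8],
    time_range="2024-09-01/2024-09-30",
)
print(json.dumps(result.model_dump(), indent=2))  # same serialization style the tools below use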
@@ -0,0 +1,435 @@
+"""Tools for STAC catalog search and interaction."""
+
+import ast
+import json
+from typing import Any, Dict, List, Optional, Union
+
+from strands import tool
+
+from ..download import pc_collection_list, pc_stac_search
+from .stac_models import (
+    LocationInfo,
+    STACAssetInfo,
+    STACCollectionInfo,
+    STACItemInfo,
+    STACSearchResult,
+)
+
+
+class STACTools:
+    """Collection of tools for searching and interacting with STAC catalogs."""
+
+    # Common location cache to avoid repeated geocoding
+    _LOCATION_CACHE = {
+        "san francisco": {
+            "name": "San Francisco",
+            "bbox": [-122.5155, 37.7034, -122.3549, 37.8324],
+            "center": [-122.4194, 37.7749],
+        },
+        "new york": {
+            "name": "New York",
+            "bbox": [-74.0479, 40.6829, -73.9067, 40.8820],
+            "center": [-73.9352, 40.7306],
+        },
+        "new york city": {
+            "name": "New York City",
+            "bbox": [-74.0479, 40.6829, -73.9067, 40.8820],
+            "center": [-73.9352, 40.7306],
+        },
+        "paris": {
+            "name": "Paris",
+            "bbox": [2.2241, 48.8156, 2.4698, 48.9022],
+            "center": [2.3522, 48.8566],
+        },
+        "london": {
+            "name": "London",
+            "bbox": [-0.5103, 51.2868, 0.3340, 51.6919],
+            "center": [-0.1276, 51.5074],
+        },
+        "tokyo": {
+            "name": "Tokyo",
+            "bbox": [139.5694, 35.5232, 139.9182, 35.8173],
+            "center": [139.6917, 35.6895],
+        },
+        "los angeles": {
+            "name": "Los Angeles",
+            "bbox": [-118.6682, 33.7037, -118.1553, 34.3373],
+            "center": [-118.2437, 34.0522],
+        },
+        "chicago": {
+            "name": "Chicago",
+            "bbox": [-87.9401, 41.6445, -87.5241, 42.0230],
+            "center": [-87.6298, 41.8781],
+        },
+        "seattle": {
+            "name": "Seattle",
+            "bbox": [-122.4595, 47.4810, -122.2244, 47.7341],
+            "center": [-122.3321, 47.6062],
+        },
+        "california": {
+            "name": "California",
+            "bbox": [-124.4820, 32.5288, -114.1315, 42.0095],
+            "center": [-119.4179, 36.7783],
+        },
+        "las vegas": {
+            "name": "Las Vegas",
+            "bbox": [-115.3711, 35.9630, -114.9372, 36.2610],
+            "center": [-115.1400, 36.1177],
+        },
+    }
+
+    def __init__(
+        self,
+        endpoint: str = "https://planetarycomputer.microsoft.com/api/stac/v1",
+    ) -> None:
+        """Initialize STAC tools.
+
+        Args:
+            endpoint: STAC API endpoint URL. Defaults to Microsoft Planetary Computer.
+        """
+        self.endpoint = endpoint
+        # Runtime cache for geocoding results
+        self._geocode_cache = {}
+
+    @tool(
+        description="List and search available STAC collections from Planetary Computer"
+    )
+    def list_collections(
+        self,
+        filter_keyword: Optional[str] = None,
+        detailed: bool = False,
+    ) -> str:
+        """List available STAC collections from Planetary Computer.
+
+        Args:
+            filter_keyword: Optional keyword to filter collections (searches in id, title, description).
+            detailed: If True, return detailed information including temporal extent, license, etc.
+
+        Returns:
+            JSON string containing list of collections with their metadata.
+        """
+        try:
+            # Get collections using existing function
+            df = pc_collection_list(
+                endpoint=self.endpoint,
+                detailed=detailed,
+                filter_by=None,
+                sort_by="id",
+            )
+
+            # Apply keyword filtering if specified
+            if filter_keyword:
+                mask = df["id"].str.contains(filter_keyword, case=False, na=False) | df[
+                    "title"
+                ].str.contains(filter_keyword, case=False, na=False)
+                if "description" in df.columns:
+                    mask |= df["description"].str.contains(
+                        filter_keyword, case=False, na=False
+                    )
+                df = df[mask]
+
+            # Convert to list of dictionaries
+            collections = df.to_dict("records")
+
+            # Convert to structured models
+            collection_models = []
+            for col in collections:
+                collection_models.append(
+                    STACCollectionInfo(
+                        id=col.get("id", ""),
+                        title=col.get("title", ""),
+                        description=col.get("description"),
+                        license=col.get("license"),
+                        temporal_extent=col.get("temporal_extent"),
+                        spatial_extent=col.get("bbox"),
+                        providers=col.get("providers"),
+                        keywords=col.get("keywords"),
+                    )
+                )
+
+            result = {
+                "count": len(collection_models),
+                "filter_keyword": filter_keyword,
+                "collections": [c.model_dump() for c in collection_models],
+            }
+
+            return json.dumps(result, indent=2)
+
+        except Exception as e:
+            return json.dumps({"error": str(e)})
+
+    @tool(
+        description="Search for STAC items in a specific collection with optional filters"
+    )
+    def search_items(
+        self,
+        collection: str,
+        bbox: Optional[Union[str, List[float]]] = None,
+        time_range: Optional[str] = None,
+        query: Optional[Union[str, Dict[str, Any]]] = None,
+        limit: Optional[Union[str, int]] = 10,
+        max_items: Optional[Union[str, int]] = 1,
+    ) -> str:
+        """Search for STAC items in the Planetary Computer catalog.
+
+        Args:
+            collection: Collection ID to search (e.g., "sentinel-2-l2a", "naip", "landsat-c2-l2").
+            bbox: Bounding box as [west, south, east, north] in WGS84 coordinates.
+                Example: [-122.5, 37.7, -122.3, 37.8] for San Francisco area.
+            time_range: Time range as "start/end" string in ISO format.
+                Example: "2024-09-01/2024-09-30" or "2024-09-01/2024-09-01" for single day.
+            query: Query parameters for filtering.
+                Example: {"eo:cloud_cover": {"lt": 10}} for cloud cover less than 10%.
+            limit: Number of items to return per page.
+                Example: 10 for 10 items per page.
+            max_items: Maximum number of items to return (default: 10).
+
+        Returns:
+            JSON string containing search results with item details including IDs, URLs, and metadata.
+        """
+        try:
+
+            if isinstance(bbox, str):
+                bbox = ast.literal_eval(bbox)
+            # Fix nested list issue: [[x,y,z,w]] -> [x,y,z,w]
+            if isinstance(bbox, list) and len(bbox) == 1 and isinstance(bbox[0], list):
+                bbox = bbox[0]
+
+            if isinstance(query, str):
+                # Try to fix common JSON formatting issues from LLM
+                query_str = query.strip()
+                # Fix missing closing braces
+                if query_str.count("{") > query_str.count("}"):
+                    query_str = query_str + "}" * (
+                        query_str.count("{") - query_str.count("}")
+                    )
+                # Fix extra closing braces
+                elif query_str.count("}") > query_str.count("{"):
+                    # Remove extra closing braces from the end
+                    extra_braces = query_str.count("}") - query_str.count("{")
+                    for _ in range(extra_braces):
+                        query_str = query_str.rstrip("}")
+                query = ast.literal_eval(query_str)
+            if isinstance(limit, str):
+                limit = ast.literal_eval(limit)
+            if isinstance(max_items, str):
+                max_items = ast.literal_eval(max_items)
+
+            # Search using existing function
+            items = pc_stac_search(
+                collection=collection,
+                bbox=bbox,
+                time_range=time_range,
+                query=query,
+                limit=limit,
+                max_items=max_items,
+                quiet=True,
+                endpoint=self.endpoint,
+            )
+
+            # Convert to structured models
+            item_models = []
+            for item in items:
+                # Extract assets
+                assets = []
+                for key, asset in item.assets.items():
+                    assets.append(
+                        STACAssetInfo(
+                            key=key,
+                            title=asset.title,
+                        )
+                    )
+
+                item_models.append(
+                    STACItemInfo(
+                        id=item.id,
+                        collection=item.collection_id,
+                        datetime=str(item.datetime) if item.datetime else None,
+                        bbox=list(item.bbox) if item.bbox else None,
+                        assets=assets,
+                        # properties=item.properties,
+                    )
+                )
+
+            # Create search result
+            result = STACSearchResult(
+                query=f"Collection: {collection}",
+                collection=collection,
+                item_count=len(item_models),
+                items=item_models,
+                bbox=bbox,
+                time_range=time_range,
+            )
+
+            return json.dumps(result.model_dump(), indent=2)
+
+        except Exception as e:
+            return json.dumps({"error": str(e)})
+
+    @tool(description="Get detailed information about a specific STAC item")
+    def get_item_info(
+        self,
+        item_id: str,
+        collection: str,
+    ) -> str:
+        """Get detailed information about a specific STAC item.
+
+        Args:
+            item_id: The STAC item ID to retrieve.
+            collection: The collection ID containing the item.
+
+        Returns:
+            JSON string with detailed item information including all assets and metadata.
+        """
+        try:
+            # Search for the specific item
+            items = pc_stac_search(
+                collection=collection,
+                bbox=None,
+                time_range=None,
+                query={"id": {"eq": item_id}},
+                limit=1,
+                max_items=1,
+                quiet=True,
+                endpoint=self.endpoint,
+            )
+
+            if not items:
+                return json.dumps(
+                    {"error": f"Item {item_id} not found in collection {collection}"}
+                )
+
+            item = items[0]
+
+            # Extract all assets with full details
+            assets = []
+            for key, asset in item.assets.items():
+                asset_info = {
+                    "key": key,
+                    "href": asset.href,
+                    "type": asset.media_type,
+                    "title": asset.title,
+                    "description": getattr(asset, "description", None),
+                    "roles": getattr(asset, "roles", None),
+                }
+                assets.append(asset_info)
+
+            result = {
+                "id": item.id,
+                "collection": item.collection_id,
+                "datetime": str(item.datetime) if item.datetime else None,
+                "bbox": list(item.bbox) if item.bbox else None,
+                # "properties": item.properties,
+                "assets": assets,
+            }
+
+            return json.dumps(result, indent=2)
+
+        except Exception as e:
+            return json.dumps({"error": str(e)})
+
+    @tool(description="Parse a location name and return its bounding box coordinates")
+    def geocode_location(self, location_name: str) -> str:
+        """Convert a location name to geographic coordinates and bounding box.
+
+        This tool uses a geocoding service to find the coordinates for a given location name.
+
+        Args:
+            location_name: Name of the location (e.g., "San Francisco", "New York", "Paris, France").
+
+        Returns:
+            JSON string with location info including bounding box and center coordinates.
+        """
+        try:
+            # Check static cache first (common locations)
+            location_key = location_name.lower().strip()
+            if location_key in self._LOCATION_CACHE:
+                cached = self._LOCATION_CACHE[location_key]
+                location_info = LocationInfo(
+                    name=cached["name"],
+                    bbox=cached["bbox"],
+                    center=cached["center"],
+                )
+                return json.dumps(location_info.model_dump(), indent=2)
+
+            # Check runtime cache
+            if location_key in self._geocode_cache:
+                return self._geocode_cache[location_key]
+
+            # Geocode using Nominatim
+            import requests
+
+            url = "https://nominatim.openstreetmap.org/search"
+            params = {
+                "q": location_name,
+                "format": "json",
+                "limit": 1,
+            }
+            headers = {"User-Agent": "GeoAI-STAC-Agent/1.0"}
+
+            response = requests.get(url, params=params, headers=headers, timeout=10)
+            response.raise_for_status()
+
+            results = response.json()
+
+            if not results:
+                error_result = json.dumps(
+                    {"error": f"Location '{location_name}' not found"}
+                )
+                self._geocode_cache[location_key] = error_result
+                return error_result
+
+            result = results[0]
+            bbox = [
+                float(result["boundingbox"][2]),  # west
+                float(result["boundingbox"][0]),  # south
+                float(result["boundingbox"][3]),  # east
+                float(result["boundingbox"][1]),  # north
+            ]
+            center = [float(result["lon"]), float(result["lat"])]
+
+            location_info = LocationInfo(
+                name=result.get("display_name", location_name),
+                bbox=bbox,
+                center=center,
+            )
+
+            result_json = json.dumps(location_info.model_dump(), indent=2)
+            # Cache the result
+            self._geocode_cache[location_key] = result_json
+
+            return result_json
+
+        except Exception as e:
+            return json.dumps({"error": f"Geocoding error: {str(e)}"})
+
+    @tool(
+        description="Get common STAC collection IDs for different satellite/aerial imagery types"
+    )
+    def get_common_collections(self) -> str:
+        """Get a list of commonly used STAC collections from Planetary Computer.
+
+        Returns:
+            JSON string with collection IDs and descriptions for popular datasets.
+        """
+        common_collections = {
+            "sentinel-2-l2a": "Sentinel-2 Level-2A - Multispectral imagery (10m-60m resolution, global coverage)",
+            "landsat-c2-l2": "Landsat Collection 2 Level-2 - Multispectral imagery (30m resolution, global coverage)",
+            "naip": "NAIP - National Agriculture Imagery Program (1m resolution, USA only)",
+            "sentinel-1-grd": "Sentinel-1 GRD - Synthetic Aperture Radar imagery (global coverage)",
+            "aster-l1t": "ASTER L1T - Multispectral and thermal imagery (15m-90m resolution)",
+            "cop-dem-glo-30": "Copernicus DEM - Global Digital Elevation Model (30m resolution)",
+            "hgb": "HGB - High Resolution Building Footprints",
+            "io-lulc": "Impact Observatory Land Use/Land Cover - Annual 10m resolution land cover",
+            "modis": "MODIS - Moderate Resolution Imaging Spectroradiometer (250m-1km resolution)",
+            "daymet-daily-hi": "Daymet - Daily surface weather data for Hawaii",
+        }
+
+        result = {
+            "count": len(common_collections),
+            "collections": [
+                {"id": k, "description": v} for k, v in common_collections.items()
+            ],
+        }
+
+        return json.dumps(result, indent=2)
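Each @tool-decorated method above is meant to be handed to an agent. A hypothetical wiring sketch, assuming the standard strands Agent interface (the Agent import and call pattern are not part of this diff, and the STACTools import is omitted because its module path is not shown here):

from strands import Agent

stac = STACTools()  # defaults to the Planetary Computer STAC endpoint

# Assumed strands usage: pass the bound tool methods to an Agent and let it
# plan the geocode -> search -> inspect sequence on its own.
agent = Agent(
    tools=[
        stac.geocode_location,
        stac.get_common_collections,
        stac.list_collections,
        stac.search_items,
        stac.get_item_info,
    ]
)
agent("Find Sentinel-2 scenes over San Francisco from September 2024 with less than 10% cloud cover.")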
geoai/change_detection.py CHANGED
@@ -561,7 +561,15 @@ class ChangeDetection:
 
         return fig
 
-    def visualize_results(self, image1_path, image2_path, binary_path, prob_path):
+    def visualize_results(
+        self,
+        image1_path,
+        image2_path,
+        binary_path,
+        prob_path,
+        title1="Earlier Image",
+        title2="Later Image",
+    ):
         """Create enhanced visualization with probability analysis."""
 
         # Load data
@@ -594,11 +602,11 @@ class ChangeDetection:
 
         # Row 1: Original and overlays
         axes[0, 0].imshow(img1_crop)
-        axes[0, 0].set_title("2019 Image", fontweight="bold")
+        axes[0, 0].set_title(title1, fontweight="bold")
         axes[0, 0].axis("off")
 
         axes[0, 1].imshow(img2_crop)
-        axes[0, 1].set_title("2022 Image", fontweight="bold")
+        axes[0, 1].set_title(title2, fontweight="bold")
         axes[0, 1].axis("off")
 
         # Binary overlay
@@ -708,6 +716,8 @@ class ChangeDetection:
         image2_path,
         binary_path,
        prob_path,
+        title1="Earlier Image",
+        title2="Later Image",
         output_path="split_comparison.png",
     ):
         """Create a split comparison visualization showing before/after with change overlay."""
@@ -742,7 +752,7 @@ class ChangeDetection:
         # Create split comparison
         fig, ax = plt.subplots(1, 1, figsize=(15, 10))
 
-        # Create combined image - left half is 2019, right half is 2022
+        # Create combined image - left half is earlier, right half is later
         combined_img = np.zeros_like(img1)
         combined_img[:, : w // 2] = img1[:, : w // 2]
         combined_img[:, w // 2 :] = img2[:, w // 2 :]
@@ -763,7 +773,7 @@ class ChangeDetection:
         ax.text(
             w // 4,
             50,
-            "2019",
+            title1,
             fontsize=20,
             color="white",
             ha="center",
@@ -772,7 +782,7 @@ class ChangeDetection:
         ax.text(
             3 * w // 4,
             50,
-            "2022",
+            title2,
             fontsize=20,
             color="white",
             ha="center",
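With the new title1/title2 parameters, the hard-coded "2019"/"2022" labels become caller-supplied. A minimal sketch of a call, assuming cd is an existing ChangeDetection instance and the binary/probability rasters come from an earlier inference step (file names are hypothetical):

cd.visualize_results(
    "naip_2019.tif",       # earlier image
    "naip_2022.tif",       # later image
    "change_binary.tif",   # binary change mask from inference
    "change_prob.tif",     # change probability raster from inference
    title1="NAIP 2019",
    title2="NAIP 2022",
)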
geoai/download.py CHANGED
@@ -1,5 +1,6 @@
 """This module provides functions to download data, including NAIP imagery and building data from Overture Maps."""
 
+import datetime
 import logging
 import os
 import subprocess
@@ -819,6 +820,7 @@ def pc_stac_search(
     query: Optional[Dict[str, Any]] = None,
     limit: int = 10,
     max_items: Optional[int] = None,
+    quiet: bool = False,
     endpoint: str = "https://planetarycomputer.microsoft.com/api/stac/v1",
 ) -> List["pystac.Item"]:
     """
@@ -839,6 +841,7 @@ def pc_stac_search(
         limit (int, optional): Number of items to return per page. Defaults to 10.
         max_items (int, optional): Maximum total number of items to return.
             Defaults to None (returns all matching items).
+        quiet (bool, optional): Whether to suppress print statements. Defaults to False.
         endpoint (str, optional): STAC API endpoint URL.
             Defaults to "https://planetarycomputer.microsoft.com/api/stac/v1".
 
@@ -896,7 +899,8 @@ def pc_stac_search(
     except Exception as e:
         raise Exception(f"Error retrieving search results: {str(e)}")
 
-    print(f"Found {len(items)} items matching search criteria")
+    if not quiet:
+        print(f"Found {len(items)} items matching search criteria")
 
     return items
 
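The new quiet flag suppresses the "Found N items..." message, which keeps output clean when pc_stac_search is driven by the STAC agent tools above. A short usage sketch (area of interest and dates are hypothetical):

from geoai.download import pc_stac_search

items = pc_stac_search(
    collection="sentinel-2-l2a",
    bbox=[-122.5, 37.7, -122.3, 37.8],
    time_range="2024-09-01/2024-09-30",
    query={"eo:cloud_cover": {"lt": 10}},
    max_items=5,
    quiet=True,   # no console message; just the returned pystac.Item list
)
print(len(items))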
geoai/geoai.py CHANGED
@@ -32,6 +32,9 @@ from .train import (
     instance_segmentation,
     instance_segmentation_batch,
     instance_segmentation_inference_on_geotiff,
+    lightly_embed_images,
+    lightly_train_model,
+    load_lightly_pretrained_model,
     object_detection,
     object_detection_batch,
     semantic_segmentation,