terrakio-core 0.3.3__py3-none-any.whl → 0.3.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of terrakio-core might be problematic.
- terrakio_core/__init__.py +10 -1
- terrakio_core/async_client.py +304 -0
- terrakio_core/client.py +22 -1717
- terrakio_core/config.py +8 -15
- terrakio_core/convenience_functions/convenience_functions.py +296 -0
- terrakio_core/endpoints/auth.py +180 -0
- terrakio_core/endpoints/dataset_management.py +369 -0
- terrakio_core/endpoints/group_management.py +228 -0
- terrakio_core/endpoints/mass_stats.py +594 -0
- terrakio_core/endpoints/model_management.py +385 -0
- terrakio_core/endpoints/space_management.py +72 -0
- terrakio_core/endpoints/user_management.py +131 -0
- terrakio_core/helper/bounded_taskgroup.py +20 -0
- terrakio_core/helper/decorators.py +58 -0
- terrakio_core/{generation → helper}/tiles.py +1 -12
- terrakio_core/sync_client.py +370 -0
- {terrakio_core-0.3.3.dist-info → terrakio_core-0.3.6.dist-info}/METADATA +1 -1
- terrakio_core-0.3.6.dist-info/RECORD +21 -0
- terrakio_core/auth.py +0 -223
- terrakio_core/dataset_management.py +0 -287
- terrakio_core/decorators.py +0 -18
- terrakio_core/group_access_management.py +0 -232
- terrakio_core/mass_stats.py +0 -504
- terrakio_core/space_management.py +0 -101
- terrakio_core/user_management.py +0 -227
- terrakio_core-0.3.3.dist-info/RECORD +0 -16
- {terrakio_core-0.3.3.dist-info → terrakio_core-0.3.6.dist-info}/WHEEL +0 -0
- {terrakio_core-0.3.3.dist-info → terrakio_core-0.3.6.dist-info}/top_level.txt +0 -0
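The manifest shows the 0.3.6 restructure: the monolithic terrakio_core/client.py (-1717 lines) is split into per-feature modules under terrakio_core/endpoints/, with new sync_client.py/async_client.py entry points and shared helpers under terrakio_core/helper/. A minimal sketch of how the new endpoint classes are wired, assuming only what the hunks below show (the stub client here is hypothetical; it stands in for the real clients in sync_client.py/async_client.py, which are not included in this diff, and importing the endpoints requires the package's google-cloud-storage dependency):

from terrakio_core.endpoints.model_management import ModelManagement
from terrakio_core.endpoints.space_management import SpaceManagement
from terrakio_core.endpoints.user_management import UserManagement

class StubClient:
    """Hypothetical stand-in exposing only what the endpoint classes touch."""
    key = "tk-example-api-key"            # checked by @require_api_key

    def _terrakio_request(self, method, path, **kwargs):
        print(method, path, kwargs)       # the real client performs the HTTP call
        return {}

client = StubClient()
models = ModelManagement(client)          # each endpoint group wraps the client
space = SpaceManagement(client)
users = UserManagement(client)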
terrakio_core/endpoints/model_management.py (new file)
@@ -0,0 +1,385 @@
import os
import json
import time
import textwrap
import logging
from typing import Dict, Any
from google.cloud import storage
from ..helper.decorators import require_token, require_api_key, require_auth


class ModelManagement:
    def __init__(self, client):
        self._client = client

    @require_api_key
    def generate_ai_dataset(
        self,
        name: str,
        aoi_geojson: str,
        expression_x: str,
        filter_x_rate: float,
        filter_y_rate: float,
        samples: int,
        tile_size: int,
        expression_y: str = "skip",
        filter_x: str = "skip",
        filter_y: str = "skip",
        crs: str = "epsg:4326",
        res: float = 0.001,
        region: str = "aus",
        start_year: int = None,
        end_year: int = None,
    ) -> dict:
        """
        Generate an AI dataset using the specified parameters.

        Args:
            name (str): Name of the dataset to generate
            aoi_geojson (str): Path to a GeoJSON file containing the area of interest
            expression_x (str): Expression for the X variable (e.g. "MSWX.air_temperature@(year=2021, month=1)")
            filter_x_rate (float): Filter rate for the X variable (e.g. 0.5)
            filter_y_rate (float): Filter rate for the Y variable (e.g. 0.5)
            samples (int): Number of samples to generate
            tile_size (int): Size of tiles in degrees
            expression_y (str, optional): Expression for the Y variable with a {year} placeholder
            filter_x (str, optional): Filter for the X variable (e.g. "MSWX.air_temperature@(year=2021, month=1)")
            filter_y (str, optional): Filter for the Y variable (e.g. "MSWX.air_temperature@(year=2021, month=1)")
            crs (str, optional): Coordinate reference system. Defaults to "epsg:4326"
            res (float, optional): Resolution in degrees. Defaults to 0.001
            region (str, optional): Region code. Defaults to "aus"
            start_year (int, optional): Start year for data generation. Required if end_year is provided
            end_year (int, optional): End year for data generation. Required if start_year is provided

        Returns:
            dict: Response from the AI dataset generation API

        Raises:
            APIError: If the API request fails
        """
        # Substitute {year} placeholders first, so the substituted expressions
        # (not the raw templates) are what end up in the request config.
        if start_year is not None:
            expression_x = expression_x.replace("{year}", str(start_year))
            if expression_y != "skip":
                expression_y = expression_y.replace("{year}", str(start_year))
            if filter_x != "skip":
                filter_x = filter_x.replace("{year}", str(start_year))
            if filter_y != "skip":
                filter_y = filter_y.replace("{year}", str(start_year))

        # Build config for expressions and filters
        config = {
            "expressions": [{"expr": expression_x, "res": res, "prefix": "x"}],
            "filters": []
        }

        if expression_y != "skip":
            config["expressions"].append({"expr": expression_y, "res": res, "prefix": "y"})

        if filter_x != "skip":
            config["filters"].append({"expr": filter_x, "res": res, "rate": filter_x_rate})
        if filter_y != "skip":
            config["filters"].append({"expr": filter_y, "res": res, "rate": filter_y_rate})

        # Load the AOI GeoJSON
        with open(aoi_geojson, 'r') as f:
            aoi_data = json.load(f)

        task_response = self._client.mass_stats.random_sample(
            name=name,
            config=config,
            aoi=aoi_data,
            samples=samples,
            year_range=[start_year, end_year],
            crs=crs,
            tile_size=tile_size,
            res=res,
            region=region,
            output="netcdf",
            server=self._client.url,
            bucket="terrakio-mass-requests",
            overwrite=True
        )
        task_id = task_response["task_id"]

        # Poll for job completion, rendering a progress bar
        while True:
            result = self._client.track_mass_stats_job(ids=[task_id])
            status = result[task_id]['status']
            completed = result[task_id].get('completed', 0)
            total = result[task_id].get('total', 1)

            progress = completed / total if total > 0 else 0
            bar_length = 50
            filled_length = int(bar_length * progress)
            bar = '█' * filled_length + '░' * (bar_length - filled_length)
            percentage = progress * 100

            # Print status with progress bar
            print(f"\rJob status: {status} [{bar}] {percentage:.1f}% ({completed}/{total})", end='')

            if status == "Completed":
                print("\nJob completed successfully!")
                break
            elif status == "Error":
                print("\n")  # new line before the error message
                raise Exception(f"Job {task_id} encountered an error")

            # Wait 5 seconds before checking again
            time.sleep(5)

        # Once all random-sample jobs are done, start the mass stats job
        task_id = self._client.mass_stats.start_mass_stats_job(task_id)
        return task_id

    @require_api_key
    async def upload_model(self, model_path: str):
        """
        Upload a model to the bucket so that it can be used for inference.

        Args:
            model_path: Path to the model file

        Raises:
            APIError: If the API request fails
        """
        uid = (await self._client.auth.get_user_info())["uid"]
        model_name = os.path.basename(model_path)

        client = storage.Client()
        bucket = client.get_bucket('terrakio-mass-requests')
        model_file_name = os.path.splitext(model_name)[0]
        blob = bucket.blob(f'{uid}/{model_file_name}/models/{model_name}')

        blob.upload_from_filename(model_path)
        self._client.logger.info(f"Model uploaded successfully to {uid}/{model_file_name}/models/{model_name}")

    @require_api_key
    async def upload_and_deploy_model(self, model_path: str, dataset: str, product: str, input_expression: str, dates_iso8601: list):
        """
        Upload a model to the bucket and deploy it.

        Args:
            model_path: Path to the model file
            dataset: Name of the dataset to create
            product: Product name for the inference
            input_expression: Input expression for the dataset
            dates_iso8601: List of dates in ISO 8601 format
        """
        # upload_model is a coroutine and must be awaited
        await self.upload_model(model_path=model_path)
        # Strip the extension so the deploy paths match upload_model's
        # {uid}/{model_file_name}/models/{model_name} layout
        model_name = os.path.splitext(os.path.basename(model_path))[0]
        self.deploy_model(
            dataset=dataset,
            product=product,
            model_name=model_name,
            input_expression=input_expression,
            model_training_job_name=model_name,
            dates_iso8601=dates_iso8601
        )

    @require_api_key
    def train_model(
        self,
        model_name: str,
        training_dataset: str,
        task_type: str,
        model_category: str,
        architecture: str,
        region: str,
        hyperparameters: dict = None
    ) -> dict:
        """
        Train a model using the external model training API.

        Args:
            model_name (str): The name of the model to train.
            training_dataset (str): The training dataset identifier.
            task_type (str): The type of ML task (e.g. regression, classification).
            model_category (str): The category of model (e.g. random_forest).
            architecture (str): The model architecture.
            region (str): The region identifier.
            hyperparameters (dict, optional): Additional hyperparameters for training.

        Returns:
            dict: The response from the model training API.

        Raises:
            APIError: If the API request fails
        """
        payload = {
            "model_name": model_name,
            "training_dataset": training_dataset,
            "task_type": task_type,
            "model_category": model_category,
            "architecture": architecture,
            "region": region,
            "hyperparameters": hyperparameters
        }
        return self._client._terrakio_request("POST", "/train_model", json=payload)

    @require_api_key
    def deploy_model(
        self,
        dataset: str,
        product: str,
        model_name: str,
        input_expression: str,
        model_training_job_name: str,
        dates_iso8601: list
    ) -> Dict[str, Any]:
        """
        Deploy a model by generating an inference script and creating a dataset.

        Args:
            dataset: Name of the dataset to create
            product: Product name for the inference
            model_name: Name of the trained model
            input_expression: Input expression for the dataset
            model_training_job_name: Name of the training job
            dates_iso8601: List of dates in ISO 8601 format

        Returns:
            dict: Response from the deployment process

        Raises:
            APIError: If the API request fails
        """
        # Get user info to obtain the UID
        user_info = self._client.get_user_info()
        uid = user_info["uid"]

        # Generate and upload the inference script
        script_content = self._generate_script(model_name, product, model_training_job_name, uid)
        script_name = f"{product}.py"
        self._upload_script_to_bucket(script_content, script_name, model_training_job_name, uid)

        # Create the dataset
        return self._client.datasets.create_dataset(
            name=dataset,
            collection="terrakio-datasets",
            products=[product],
            path=f"gs://terrakio-mass-requests/{uid}/{model_training_job_name}/inference_scripts",
            input=input_expression,
            dates_iso8601=dates_iso8601,
            padding=0
        )

    @require_api_key
    def _generate_script(self, model_name: str, product: str, model_training_job_name: str, uid: str) -> str:
        """
        Generate the Python inference script for the model.

        Args:
            model_name: Name of the model
            product: Product name
            model_training_job_name: Training job name
            uid: User ID

        Returns:
            str: Generated Python script content
        """
        return textwrap.dedent(f'''
            import logging
            from io import BytesIO

            import numpy as np
            import pandas as pd
            import xarray as xr
            from google.cloud import storage
            from onnxruntime import InferenceSession

            logging.basicConfig(
                level=logging.INFO
            )

            def get_model():
                logging.info("Loading model for {model_name}...")

                client = storage.Client()
                bucket = client.get_bucket('terrakio-mass-requests')
                blob = bucket.blob('{uid}/{model_training_job_name}/models/{model_name}.onnx')

                model = BytesIO()
                blob.download_to_file(model)
                model.seek(0)

                session = InferenceSession(model.read(), providers=["CPUExecutionProvider"])
                return session

            def {product}(*bands, model):
                logging.info("start preparing data")

                data_arrays = list(bands)

                reference_array = data_arrays[0]
                original_shape = reference_array.shape
                logging.info(f"Original shape: {{original_shape}}")

                if 'time' in reference_array.dims:
                    time_coords = reference_array.coords['time']
                    if len(time_coords) == 1:
                        output_timestamp = time_coords[0]
                    else:
                        years = [pd.to_datetime(t).year for t in time_coords.values]
                        unique_years = set(years)

                        if len(unique_years) == 1:
                            year = list(unique_years)[0]
                            output_timestamp = pd.Timestamp(f"{{year}}-01-01")
                        else:
                            latest_year = max(unique_years)
                            output_timestamp = pd.Timestamp(f"{{latest_year}}-01-01")
                else:
                    output_timestamp = pd.Timestamp("1970-01-01")

                averaged_bands = []
                for data_array in data_arrays:
                    if 'time' in data_array.dims:
                        averaged_band = np.mean(data_array.values, axis=0)
                        logging.info(f"Averaged band from {{data_array.shape}} to {{averaged_band.shape}}")
                    else:
                        averaged_band = data_array.values
                        logging.info(f"No time dimension, shape: {{averaged_band.shape}}")

                    flattened_band = averaged_band.reshape(-1, 1)
                    averaged_bands.append(flattened_band)

                input_data = np.hstack(averaged_bands)

                logging.info(f"Final input shape: {{input_data.shape}}")

                output = model.run(None, {{"float_input": input_data.astype(np.float32)}})[0]

                logging.info(f"Model output shape: {{output.shape}}")

                if len(original_shape) >= 3:
                    spatial_shape = original_shape[1:]
                else:
                    spatial_shape = original_shape

                output_reshaped = output.reshape(spatial_shape)

                output_with_time = np.expand_dims(output_reshaped, axis=0)

                if 'time' in reference_array.dims:
                    spatial_dims = [dim for dim in reference_array.dims if dim != 'time']
                    spatial_coords = {{dim: reference_array.coords[dim] for dim in spatial_dims if dim in reference_array.coords}}
                else:
                    spatial_dims = list(reference_array.dims)
                    spatial_coords = dict(reference_array.coords)

                result = xr.DataArray(
                    data=output_with_time.astype(np.float32),
                    dims=['time'] + list(spatial_dims),
                    coords={{
                        # time_coords elements expose .values; a plain pd.Timestamp does not
                        'time': [output_timestamp.values if hasattr(output_timestamp, 'values') else output_timestamp],
                        'y': spatial_coords['y'].values,
                        'x': spatial_coords['x'].values
                    }}
                )
                return result
        ''').strip()

    @require_api_key
    def _upload_script_to_bucket(self, script_content: str, script_name: str, model_training_job_name: str, uid: str):
        """Upload the generated script to Google Cloud Storage."""
        client = storage.Client()
        bucket = client.get_bucket('terrakio-mass-requests')
        blob = bucket.blob(f'{uid}/{model_training_job_name}/inference_scripts/{script_name}')
        blob.upload_from_string(script_content, content_type='text/plain')
        logging.info(f"Script uploaded successfully to {uid}/{model_training_job_name}/inference_scripts/{script_name}")
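Taken together, deploy_model writes a generated {product}.py inference script beside the uploaded ONNX model and registers a dataset pointing at it. A hedged usage sketch, assuming a configured client exposes this class (the models attribute name, file name, and expression below are illustrative assumptions, not values from this diff):

import asyncio

async def deploy(client):
    # tree_cover.onnx, the dataset/product names, and the expression are illustrative
    await client.models.upload_and_deploy_model(
        model_path="tree_cover.onnx",
        dataset="tree_cover_ds",
        product="tree_cover",
        input_expression="S2.B04@(year=2023)",
        dates_iso8601=["2023-01-01"],
    )

# asyncio.run(deploy(client))  # with a configured client (construction omitted)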
terrakio_core/endpoints/space_management.py (new file)
@@ -0,0 +1,72 @@
from typing import Dict, Any, Optional
from ..helper.decorators import require_token, require_api_key, require_auth


class SpaceManagement:
    def __init__(self, client):
        self._client = client

    @require_api_key
    def get_total_space_used(self) -> Dict[str, Any]:
        """
        Get total space used by the user.

        Returns:
            Dict[str, Any]: Total space used by the user.

        Raises:
            APIError: If the API request fails
        """
        return self._client._terrakio_request("GET", "/users/jobs")

    @require_api_key
    def get_space_used_by_job(self, name: str, region: str) -> Dict[str, Any]:
        """
        Get space used by a specific job.

        Args:
            name: The name of the job
            region: The region of the job

        Returns:
            Dict[str, Any]: Space used by the job.

        Raises:
            APIError: If the API request fails
        """
        params = {"region": region}
        return self._client._terrakio_request("GET", f"/users/jobs/{name}", params=params)

    @require_api_key
    def delete_user_job(self, name: str, region: str) -> Dict[str, Any]:
        """
        Delete a user job by name and region.

        Args:
            name: The name of the job
            region: The region of the job

        Returns:
            Dict[str, Any]: Response from the delete operation.

        Raises:
            APIError: If the API request fails
        """
        params = {"region": region}
        return self._client._terrakio_request("DELETE", f"/users/jobs/{name}", params=params)

    @require_api_key
    def delete_data_in_path(self, path: str, region: str) -> Dict[str, Any]:
        """
        Delete data in a GCS path for a given region.

        Args:
            path: The GCS path to delete data from
            region: The region where the data is located

        Returns:
            Dict[str, Any]: Response from the delete operation.

        Raises:
            APIError: If the API request fails
        """
        params = {"path": path, "region": region}
        return self._client._terrakio_request("DELETE", "/users/jobs", params=params)
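All four methods route through the client's /users/jobs endpoints. A short sketch, again assuming the class is exposed on a configured client as client.space (the attribute name is an assumption; client construction is omitted):

# client: a configured Terrakio client (construction omitted)
total = client.space.get_total_space_used()                    # GET /users/jobs
per_job = client.space.get_space_used_by_job("my_job", "aus")  # GET /users/jobs/my_job?region=aus
client.space.delete_user_job("my_job", "aus")                  # DELETE /users/jobs/my_job?region=aus
client.space.delete_data_in_path("gs://bucket/path", "aus")    # DELETE /users/jobs?path=...&region=aus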
terrakio_core/endpoints/user_management.py (new file)
@@ -0,0 +1,131 @@
from typing import Dict, Any, List, Optional
from ..helper.decorators import require_token, require_api_key, require_auth


class UserManagement:
    def __init__(self, client):
        self._client = client

    @require_api_key
    def get_user_by_id(self, id: str) -> Dict[str, Any]:
        """
        Get user by ID.

        Args:
            id: User ID

        Returns:
            User information

        Raises:
            APIError: If the API request fails
        """
        return self._client._terrakio_request("GET", f"admin/users/{id}")

    @require_api_key
    def get_user_by_email(self, email: str) -> Dict[str, Any]:
        """
        Get user by email.

        Args:
            email: User email

        Returns:
            User information

        Raises:
            APIError: If the API request fails
        """
        return self._client._terrakio_request("GET", f"admin/users/email/{email}")

    @require_api_key
    def list_users(self, substring: Optional[str] = None, uid: bool = False) -> List[Dict[str, Any]]:
        """
        List users, optionally filtering by a substring.

        Args:
            substring: Optional substring to filter users
            uid: If True, includes the user ID in the response (default: False)

        Returns:
            List of users

        Raises:
            APIError: If the API request fails
        """
        params = {"uid": str(uid).lower()}
        if substring:
            params['substring'] = substring
        return self._client._terrakio_request("GET", "admin/users", params=params)

    @require_api_key
    def edit_user(
        self,
        uid: str,
        email: Optional[str] = None,
        role: Optional[str] = None,
        apiKey: Optional[str] = None,
        groups: Optional[List[str]] = None,
        quota: Optional[int] = None
    ) -> Dict[str, Any]:
        """
        Edit user info. Only provided fields will be updated.

        Args:
            uid: User ID
            email: New user email
            role: New user role
            apiKey: New API key
            groups: New list of groups
            quota: New quota

        Returns:
            Updated user information

        Raises:
            APIError: If the API request fails
        """
        payload = {"uid": uid}
        payload_mapping = {
            "email": email,
            "role": role,
            "apiKey": apiKey,
            "groups": groups,
            "quota": quota
        }
        for key, value in payload_mapping.items():
            if value is not None:
                payload[key] = value
        return self._client._terrakio_request("PATCH", "admin/users", json=payload)

    @require_api_key
    def reset_quota(self, email: str, quota: Optional[int] = None) -> Dict[str, Any]:
        """
        Reset the quota for a user by email.

        Args:
            email: The user's email (required)
            quota: The new quota value (optional)

        Returns:
            API response as a dictionary
        """
        payload = {"email": email}
        if quota is not None:
            payload["quota"] = quota
        return self._client._terrakio_request("PATCH", f"admin/users/reset_quota/{email}", json=payload)

    @require_api_key
    def delete_user(self, uid: str) -> Dict[str, Any]:
        """
        Delete a user by UID.

        Args:
            uid: The user's UID (required)

        Returns:
            API response as a dictionary

        Raises:
            APIError: If the API request fails
        """
        return self._client._terrakio_request("DELETE", f"admin/users/{uid}")
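A sketch of the admin surface, assuming client.users (attribute name assumed) wraps UserManagement, the API key has admin rights, and the None defaults shown above so unset fields are left unchanged:

# client: a configured Terrakio client with an admin API key (construction omitted)
user = client.users.get_user_by_email("someone@example.com")
matches = client.users.list_users(substring="example.com", uid=True)
client.users.edit_user(uid=user["uid"], role="admin", quota=10000)  # other fields stay None and are not sent
client.users.reset_quota(email="someone@example.com", quota=5000)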
terrakio_core/helper/bounded_taskgroup.py (new file)
@@ -0,0 +1,20 @@
import asyncio

# Adapted from https://discuss.python.org/t/boundedtaskgroup-to-control-parallelism/27171

class BoundedTaskGroup(asyncio.TaskGroup):
    def __init__(self, *args, max_concurrency=0, **kwargs):
        super().__init__(*args, **kwargs)
        if max_concurrency:
            self._sem = asyncio.Semaphore(max_concurrency)
        else:
            self._sem = None

    def create_task(self, coro, *args, **kwargs):
        # When a concurrency limit is set, gate each child behind the semaphore
        if self._sem:
            async def _wrapped_coro(sem, coro):
                async with sem:
                    return await coro
            coro = _wrapped_coro(self._sem, coro)

        return super().create_task(coro, *args, **kwargs)
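BoundedTaskGroup keeps TaskGroup's structured-concurrency semantics but gates each child coroutine behind a shared semaphore. A runnable illustration (Python 3.11+ for asyncio.TaskGroup; the fetch coroutine is a stand-in for real work):

import asyncio
from terrakio_core.helper.bounded_taskgroup import BoundedTaskGroup

async def fetch(i: int) -> int:
    await asyncio.sleep(0.1)   # stand-in for an HTTP call
    return i

async def main():
    # At most 2 of the 6 children run concurrently; the group still
    # waits for all of them before the block exits.
    async with BoundedTaskGroup(max_concurrency=2) as tg:
        tasks = [tg.create_task(fetch(i)) for i in range(6)]
    print([t.result() for t in tasks])   # [0, 1, 2, 3, 4, 5]

asyncio.run(main())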
terrakio_core/helper/decorators.py (new file)
@@ -0,0 +1,58 @@
# terrakio_core/helper/decorators.py
from functools import wraps
from ..exceptions import ConfigurationError

def require_token(func):
    """Decorator to ensure a token is available before a method can be executed."""
    @wraps(func)
    def wrapper(self, *args, **kwargs):
        # Check both a direct token and the client token
        has_token = False
        if hasattr(self, 'token') and self.token:
            has_token = True
        elif hasattr(self, '_client') and hasattr(self._client, 'token') and self._client.token:
            has_token = True

        if not has_token:
            raise ConfigurationError("Authentication token required. Please login first.")
        return func(self, *args, **kwargs)

    wrapper._is_decorated = True
    return wrapper

def require_api_key(func):
    """Decorator to ensure an API key is available before a method can be executed."""
    @wraps(func)
    def wrapper(self, *args, **kwargs):
        # Check both a direct key and the client key
        has_key = False
        if hasattr(self, 'key') and self.key:
            has_key = True
        elif hasattr(self, '_client') and hasattr(self._client, 'key') and self._client.key:
            has_key = True

        if not has_key:
            raise ConfigurationError("API key required. Please provide an API key or login first.")
        return func(self, *args, **kwargs)

    wrapper._is_decorated = True
    return wrapper

def require_auth(func):
    """Decorator that requires either a token OR an API key."""
    @wraps(func)
    def wrapper(self, *args, **kwargs):
        # Check both direct auth and client auth
        has_token = (hasattr(self, 'token') and self.token) or \
                    (hasattr(self, '_client') and hasattr(self._client, 'token') and self._client.token)
        has_api_key = (hasattr(self, 'key') and self.key) or \
                      (hasattr(self, '_client') and hasattr(self._client, 'key') and self._client.key)

        if not has_token and not has_api_key:
            raise ConfigurationError(
                "Authentication required. Please provide either an API key or login to get a token."
            )
        return func(self, *args, **kwargs)

    wrapper._is_decorated = True
    return wrapper
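The decorators only look for credentials on the wrapped object itself (or on its ._client) and raise ConfigurationError otherwise; the _is_decorated flag lets other code detect guarded methods. A small self-contained sketch (the Endpoint class is hypothetical):

from terrakio_core.exceptions import ConfigurationError
from terrakio_core.helper.decorators import require_api_key

class Endpoint:
    def __init__(self, key=None):
        self.key = key

    @require_api_key
    def ping(self):
        return "pong"

Endpoint(key="tk-123").ping()       # "pong"
try:
    Endpoint().ping()               # no key anywhere -> ConfigurationError
except ConfigurationError as e:
    print(e)
print(Endpoint.ping._is_decorated)  # True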