PyPI - pyconvexity - Versions diffs - 0.4.3__py3-none-any.whl - Mend

pyconvexity 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of pyconvexity might be problematic. Click here for more details.

Files changed (42) hide show

pyconvexity/__init__.py +226 -0
pyconvexity/_version.py +1 -0
pyconvexity/core/__init__.py +60 -0
pyconvexity/core/database.py +485 -0
pyconvexity/core/errors.py +106 -0
pyconvexity/core/types.py +400 -0
pyconvexity/data/README.md +101 -0
pyconvexity/data/__init__.py +17 -0
pyconvexity/data/loaders/__init__.py +3 -0
pyconvexity/data/loaders/cache.py +213 -0
pyconvexity/data/schema/01_core_schema.sql +420 -0
pyconvexity/data/schema/02_data_metadata.sql +120 -0
pyconvexity/data/schema/03_validation_data.sql +506 -0
pyconvexity/data/sources/__init__.py +5 -0
pyconvexity/data/sources/gem.py +442 -0
pyconvexity/io/__init__.py +26 -0
pyconvexity/io/excel_exporter.py +1226 -0
pyconvexity/io/excel_importer.py +1381 -0
pyconvexity/io/netcdf_exporter.py +197 -0
pyconvexity/io/netcdf_importer.py +1833 -0
pyconvexity/models/__init__.py +195 -0
pyconvexity/models/attributes.py +730 -0
pyconvexity/models/carriers.py +159 -0
pyconvexity/models/components.py +611 -0
pyconvexity/models/network.py +503 -0
pyconvexity/models/results.py +148 -0
pyconvexity/models/scenarios.py +234 -0
pyconvexity/solvers/__init__.py +29 -0
pyconvexity/solvers/pypsa/__init__.py +24 -0
pyconvexity/solvers/pypsa/api.py +460 -0
pyconvexity/solvers/pypsa/batch_loader.py +307 -0
pyconvexity/solvers/pypsa/builder.py +675 -0
pyconvexity/solvers/pypsa/constraints.py +405 -0
pyconvexity/solvers/pypsa/solver.py +1509 -0
pyconvexity/solvers/pypsa/storage.py +2048 -0
pyconvexity/timeseries.py +330 -0
pyconvexity/validation/__init__.py +25 -0
pyconvexity/validation/rules.py +312 -0
pyconvexity-0.4.3.dist-info/METADATA +47 -0
pyconvexity-0.4.3.dist-info/RECORD +42 -0
pyconvexity-0.4.3.dist-info/WHEEL +5 -0
pyconvexity-0.4.3.dist-info/top_level.txt +1 -0

pyconvexity/core/types.py ADDED Viewed

@@ -0,0 +1,400 @@
+"""
+Core data types for PyConvexity.
+These types mirror the Rust implementation while providing Python-specific
+enhancements and better type safety.
+"""
+import json
+from dataclasses import dataclass
+from typing import Dict, Any, Optional, List, Union
+class StaticValue:
+    """
+    Represents a static (non-time-varying) attribute value.
+    Mirrors the Rust StaticValue enum while providing Python conveniences.
+    Supports float, int, bool, and string values with proper type conversion.
+    """
+    def __init__(self, value: Union[float, int, bool, str]):
+        # Check bool before int since bool is subclass of int in Python
+        if isinstance(value, bool):
+            self.data = {"Boolean": value}
+        elif isinstance(value, float):
+            self.data = {"Float": value}
+        elif isinstance(value, int):
+            self.data = {"Integer": value}
+        elif isinstance(value, str):
+            self.data = {"String": value}
+        else:
+            raise ValueError(f"Unsupported value type: {type(value)}")
+    def to_json(self) -> str:
+        """
+        Return raw value as JSON to match Rust serialization format.
+        Rust stores: 123.45, 42, true, "hello"
+        Not: {"Float": 123.45}, {"Integer": 42}, etc.
+        """
+        import math
+        if "Float" in self.data:
+            float_val = self.data["Float"]
+            # Ensure finite values only
+            if not math.isfinite(float_val):
+                raise ValueError(
+                    f"Cannot serialize non-finite float value: {float_val}"
+                )
+            return json.dumps(float_val)
+        elif "Integer" in self.data:
+            return json.dumps(self.data["Integer"])
+        elif "Boolean" in self.data:
+            return json.dumps(self.data["Boolean"])
+        elif "String" in self.data:
+            return json.dumps(self.data["String"])
+        else:
+            # Fallback to original format if unknown
+            return json.dumps(self.data)
+    def data_type(self) -> str:
+        """Get data type name - mirrors Rust implementation"""
+        if "Float" in self.data:
+            return "float"
+        elif "Integer" in self.data:
+            return "int"
+        elif "Boolean" in self.data:
+            return "boolean"
+        elif "String" in self.data:
+            return "string"
+        else:
+            return "unknown"
+    def as_f64(self) -> float:
+        """Convert to float, mirroring Rust implementation"""
+        if "Float" in self.data:
+            return self.data["Float"]
+        elif "Integer" in self.data:
+            return float(self.data["Integer"])
+        elif "Boolean" in self.data:
+            return 1.0 if self.data["Boolean"] else 0.0
+        else:
+            try:
+                return float(self.data["String"])
+            except ValueError:
+                return 0.0
+    def value(self) -> Union[float, int, bool, str]:
+        """Get the raw Python value"""
+        if "Float" in self.data:
+            return self.data["Float"]
+        elif "Integer" in self.data:
+            return self.data["Integer"]
+        elif "Boolean" in self.data:
+            return self.data["Boolean"]
+        elif "String" in self.data:
+            return self.data["String"]
+        else:
+            raise ValueError("Unknown data type in StaticValue")
+    def __repr__(self) -> str:
+        return f"StaticValue({self.value()})"
+    def __eq__(self, other) -> bool:
+        if isinstance(other, StaticValue):
+            return self.data == other.data
+        return False
+@dataclass
+class Timeseries:
+    """
+    Efficient timeseries data structure matching the new Rust implementation.
+    Stores values as a flat array for maximum performance, matching the
+    unified Rust Timeseries struct.
+    """
+    values: List[float]
+    length: int
+    start_index: int
+    data_type: str
+    unit: Optional[str]
+    is_input: bool
+    def __post_init__(self):
+        # Ensure length matches values array
+        self.length = len(self.values)
+        # Ensure all values are float32-compatible
+        self.values = [float(v) for v in self.values]
+    def get_value(self, index: int) -> Optional[float]:
+        """Get value at specific index."""
+        if 0 <= index < len(self.values):
+            return self.values[index]
+        return None
+    def get_range(self, start: int, end: int) -> List[float]:
+        """Get a range of values efficiently."""
+        end = min(end, len(self.values))
+        start = min(start, end)
+        return self.values[start:end]
+    def sample(self, max_points: int) -> "Timeseries":
+        """Apply sampling if the timeseries is too large."""
+        if len(self.values) <= max_points:
+            return self
+        step = len(self.values) // max_points
+        sampled_values = []
+        for i in range(0, len(self.values), max(1, step)):
+            sampled_values.append(self.values[i])
+        # Always include the last point if not already included
+        if self.values and sampled_values[-1] != self.values[-1]:
+            sampled_values.append(self.values[-1])
+        return Timeseries(
+            values=sampled_values,
+            length=len(sampled_values),
+            start_index=self.start_index,
+            data_type=self.data_type,
+            unit=self.unit,
+            is_input=self.is_input,
+        )
+    def slice(self, start_index: int, end_index: int) -> "Timeseries":
+        """Apply range filtering."""
+        start = max(0, start_index - self.start_index)
+        end = max(0, end_index - self.start_index)
+        end = min(end, len(self.values))
+        start = min(start, end)
+        return Timeseries(
+            values=self.values[start:end],
+            length=end - start,
+            start_index=self.start_index + start,
+            data_type=self.data_type,
+            unit=self.unit,
+            is_input=self.is_input,
+        )
+@dataclass
+class TimeseriesMetadata:
+    """
+    Metadata about a timeseries without loading the full data.
+    Mirrors Rust TimeseriesMetadata struct.
+    """
+    length: int
+    start_time: int
+    end_time: int
+    start_index: int
+    end_index: int
+    data_type: str
+    unit: Optional[str]
+    is_input: bool
+@dataclass
+class TimePeriod:
+    """
+    Represents a time period in the network's time axis.
+    Mirrors Rust TimePeriod structure.
+    """
+    timestamp: int
+    period_index: int
+    formatted_time: str
+@dataclass
+class TimeseriesValidationResult:
+    """
+    Result of validating timeseries alignment with network time periods.
+    Mirrors Rust TimeseriesValidationResult.
+    """
+    is_valid: bool
+    missing_periods: List[int]
+    extra_periods: List[int]
+    total_network_periods: int
+    provided_periods: int
+@dataclass
+class ValidationRule:
+    """
+    Validation rule for component attributes.
+    Mirrors Rust ValidationRule with all fields.
+    """
+    component_type: str
+    attribute_name: str
+    data_type: str
+    unit: Optional[str]
+    default_value_string: Optional[str]
+    allowed_storage_types: str
+    allows_static: bool
+    allows_timeseries: bool
+    is_required: bool
+    is_input: bool
+    description: Optional[str]
+    default_value: Optional[StaticValue]
+class AttributeValue:
+    """
+    Represents either a static value or timeseries data for a component attribute.
+    Uses efficient Timeseries format for optimal performance.
+    Mirrors Rust AttributeValue enum.
+    """
+    def __init__(self, value: Union[StaticValue, Timeseries]):
+        if isinstance(value, StaticValue):
+            self.variant = "Static"
+            self.static_value = value
+            self.timeseries_value = None
+        elif isinstance(value, Timeseries):
+            self.variant = "Timeseries"
+            self.static_value = None
+            self.timeseries_value = value
+        else:
+            raise ValueError(
+                f"AttributeValue must be StaticValue or Timeseries, got {type(value)}"
+            )
+    @classmethod
+    def static(cls, value: StaticValue) -> "AttributeValue":
+        """Create a static attribute value"""
+        return cls(value)
+    @classmethod
+    def timeseries(cls, timeseries: Timeseries) -> "AttributeValue":
+        """Create a timeseries attribute value (new format)"""
+        return cls(timeseries)
+    def is_static(self) -> bool:
+        """Check if this is a static value"""
+        return self.variant == "Static"
+    def is_timeseries(self) -> bool:
+        """Check if this is a timeseries value"""
+        return self.variant == "Timeseries"
+    def as_timeseries(self) -> Optional[Timeseries]:
+        """Get the timeseries data in new format"""
+        return self.timeseries_value if self.is_timeseries() else None
+    def __repr__(self) -> str:
+        if self.is_static():
+            return f"AttributeValue.static({self.static_value})"
+        else:
+            length = len(self.timeseries_value.values) if self.timeseries_value else 0
+            return f"AttributeValue.timeseries({length} points)"
+@dataclass
+class Component:
+    """
+    Represents a component in the energy system model (single network per database).
+    Mirrors Rust Component struct.
+    """
+    id: int
+    component_type: str
+    name: str
+    longitude: Optional[float] = None
+    latitude: Optional[float] = None
+    carrier_id: Optional[int] = None
+    bus_id: Optional[int] = None
+    bus0_id: Optional[int] = None
+    bus1_id: Optional[int] = None
+@dataclass
+class Network:
+    """
+    Represents a network/model in the system.
+    Enhanced version of network information with additional metadata.
+    """
+    id: int
+    name: str
+    description: Optional[str] = None
+    time_start: Optional[str] = None
+    time_end: Optional[str] = None
+    time_interval: Optional[str] = None
+    created_at: Optional[str] = None
+    updated_at: Optional[str] = None
+@dataclass
+class CreateComponentRequest:
+    """
+    Request structure for creating a new component (single network per database).
+    Mirrors Rust CreateComponentRequest.
+    """
+    component_type: str
+    name: str
+    description: Optional[str] = None
+    longitude: Optional[float] = None
+    latitude: Optional[float] = None
+    carrier_id: Optional[int] = None
+    bus_id: Optional[int] = None
+    bus0_id: Optional[int] = None
+    bus1_id: Optional[int] = None
+@dataclass
+class CreateNetworkRequest:
+    """
+    Request structure for creating a new network.
+    Mirrors Rust CreateNetworkRequest.
+    """
+    name: str
+    description: Optional[str] = None
+    time_resolution: Optional[str] = None
+    start_time: Optional[str] = None
+    end_time: Optional[str] = None
+@dataclass
+class Carrier:
+    """
+    Represents an energy carrier (e.g., electricity, heat, gas).
+    """
+    id: int
+    name: str
+    co2_emissions: float = 0.0
+    color: Optional[str] = None
+    nice_name: Optional[str] = None
+@dataclass
+class Scenario:
+    """
+    Represents a scenario within a network.
+    """
+    id: int
+    name: str
+    description: Optional[str] = None
+    is_master: bool = False
+    created_at: Optional[str] = None
+    updated_at: Optional[str] = None

pyconvexity/data/README.md ADDED Viewed

@@ -0,0 +1,101 @@
+# PyConvexity Data Module
+The `pyconvexity.data` module provides functions for loading external energy data and integrating it with PyConvexity models. This is a simple, expert-friendly toolbox for working with real-world energy data.
+## Installation
+Install PyConvexity with data dependencies:
+```bash
+pip install pyconvexity[data]
+```
+## Current Data Sources
+### Global Energy Monitor (GEM)
+Load power plant data from GEM's Global Integrated Power dataset.
+**Setup:**
+1. Download the GEM Excel file: `Global-Integrated-Power-August-2025.xlsx`
+2. Place it in a `data/raw/global-energy-monitor/` directory, or set the path manually
+**Usage:**
+```python
+import pyconvexity as px
+# Load generators for a specific country
+generators = px.data.get_generators_from_gem(
+    country="USA",  # ISO 3-letter country code
+    technology_types=["solar", "wind", "nuclear"],  # Optional filter
+    min_capacity_mw=100.0  # Optional minimum capacity
+)
+# Create a network and add generators
+px.create_database_with_schema("my_model.db")
+with px.database_context("my_model.db") as conn:
+    network_id = px.create_network(conn, network_req)
+    # Create carriers
+    carriers = {}
+    for carrier_name in generators['carrier'].unique():
+        carriers[carrier_name] = px.create_carrier(conn, network_id, carrier_name)
+    # Add generators to network
+    generator_ids = px.data.add_gem_generators_to_network(
+        conn, network_id, generators, carrier_mapping=carriers
+    )
+```
+## Data Output Format
+The `get_generators_from_gem()` function returns a pandas DataFrame with these columns:
+- `plant_name`: Name of the power plant
+- `country_iso_3`: ISO 3-letter country code
+- `category`: Energy category (nuclear, thermal, renewables, storage, etc.)
+- `carrier`: Energy carrier (coal, gas, solar, wind, nuclear, etc.)
+- `type`: Technology type (subcritical, combined-cycle, photovoltaic, etc.)
+- `capacity_mw`: Capacity in megawatts
+- `start_year`: Year the plant started operation
+- `latitude`: Latitude coordinate
+- `longitude`: Longitude coordinate
+## Technology Mapping
+GEM technologies are automatically mapped to a standardized schema:
+- **Nuclear**: pressurized-water-reactor, boiling-water-reactor, small-modular-reactor
+- **Thermal**: subcritical, supercritical, combined-cycle, gas-turbine
+- **Renewables**: photovoltaic, thermal (solar), onshore/offshore (wind), run-of-river (hydro)
+- **Storage**: lithium-ion (battery), pumped-hydro
+- **Bioenergy**: biomass, biogas
+## Caching
+Data is automatically cached for 7 days to improve performance. You can:
+```python
+# Disable caching
+generators = px.data.get_generators_from_gem(country="USA", use_cache=False)
+# Clear cache
+cache = px.data.DataCache()
+cache.clear_cache('gem_generators')
+```
+## Examples
+See `examples/gem_data_example.py` for a complete working example.
+## Future Data Sources
+The framework is designed to be extensible. Planned additions include:
+- IRENA Global Energy Atlas (renewable resource data)
+- World Bank energy statistics
+- IEA World Energy Outlook data
+- OpenStreetMap transmission infrastructure
+- NASA weather data for renewable profiles

pyconvexity/data/__init__.py ADDED Viewed

@@ -0,0 +1,17 @@
+"""
+PyConvexity Data Module
+Provides functions for loading external energy data and integrating it with PyConvexity models.
+This module offers a simple, expert-friendly toolbox for working with real-world energy data.
+"""
+from .sources.gem import get_generators_from_gem, add_gem_generators_to_network
+from .loaders.cache import DataCache
+__all__ = [
+    # GEM (Global Energy Monitor) functions
+    "get_generators_from_gem",
+    "add_gem_generators_to_network",
+    # Caching utilities
+    "DataCache",
+]

pyconvexity/data/loaders/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""
+Data loaders and caching utilities for PyConvexity.
+"""