pyconvexity-0.4.8-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- pyconvexity/__init__.py +241 -0
- pyconvexity/_version.py +1 -0
- pyconvexity/core/__init__.py +60 -0
- pyconvexity/core/database.py +485 -0
- pyconvexity/core/errors.py +106 -0
- pyconvexity/core/types.py +400 -0
- pyconvexity/dashboard.py +265 -0
- pyconvexity/data/README.md +101 -0
- pyconvexity/data/__init__.py +17 -0
- pyconvexity/data/loaders/__init__.py +3 -0
- pyconvexity/data/loaders/cache.py +213 -0
- pyconvexity/data/schema/01_core_schema.sql +420 -0
- pyconvexity/data/schema/02_data_metadata.sql +120 -0
- pyconvexity/data/schema/03_validation_data.sql +507 -0
- pyconvexity/data/sources/__init__.py +5 -0
- pyconvexity/data/sources/gem.py +442 -0
- pyconvexity/io/__init__.py +26 -0
- pyconvexity/io/excel_exporter.py +1226 -0
- pyconvexity/io/excel_importer.py +1381 -0
- pyconvexity/io/netcdf_exporter.py +191 -0
- pyconvexity/io/netcdf_importer.py +1802 -0
- pyconvexity/models/__init__.py +195 -0
- pyconvexity/models/attributes.py +730 -0
- pyconvexity/models/carriers.py +159 -0
- pyconvexity/models/components.py +611 -0
- pyconvexity/models/network.py +503 -0
- pyconvexity/models/results.py +148 -0
- pyconvexity/models/scenarios.py +234 -0
- pyconvexity/solvers/__init__.py +29 -0
- pyconvexity/solvers/pypsa/__init__.py +30 -0
- pyconvexity/solvers/pypsa/api.py +446 -0
- pyconvexity/solvers/pypsa/batch_loader.py +296 -0
- pyconvexity/solvers/pypsa/builder.py +655 -0
- pyconvexity/solvers/pypsa/clearing_price.py +678 -0
- pyconvexity/solvers/pypsa/constraints.py +405 -0
- pyconvexity/solvers/pypsa/solver.py +1442 -0
- pyconvexity/solvers/pypsa/storage.py +2096 -0
- pyconvexity/timeseries.py +330 -0
- pyconvexity/validation/__init__.py +25 -0
- pyconvexity/validation/rules.py +312 -0
- pyconvexity-0.4.8.dist-info/METADATA +148 -0
- pyconvexity-0.4.8.dist-info/RECORD +44 -0
- pyconvexity-0.4.8.dist-info/WHEEL +5 -0
- pyconvexity-0.4.8.dist-info/top_level.txt +1 -0
pyconvexity/timeseries.py
@@ -0,0 +1,330 @@
"""
High-level timeseries API for PyConvexity.

This module provides the main interface for working with timeseries data,
matching the efficient patterns used in the Rust implementation.

Key Features:
- Ultra-fast binary serialization (matches Rust exactly)
- Array-based data structures for maximum performance
- Unified API for getting/setting timeseries data
- Backward compatibility with legacy point-based format
- Efficient sampling and filtering operations
"""

import sqlite3
from typing import List, Optional, Union
import numpy as np

from pyconvexity.core.database import database_context
from pyconvexity.core.types import Timeseries, TimeseriesMetadata
from pyconvexity.models.attributes import (
    get_timeseries as _get_timeseries,
    get_timeseries_metadata as _get_timeseries_metadata,
    set_timeseries_attribute,
    serialize_values_to_binary,
    deserialize_values_from_binary,
    get_timeseries_length_from_binary,
)


# ============================================================================
# HIGH-LEVEL TIMESERIES API
# ============================================================================


def get_timeseries(
    db_path: str,
    component_id: int,
    attribute_name: str,
    scenario_id: Optional[int] = None,
    start_index: Optional[int] = None,
    end_index: Optional[int] = None,
    max_points: Optional[int] = None,
) -> Timeseries:
    """
    Get timeseries data with efficient array-based format.

    This is the main function for retrieving timeseries data. It returns
    a Timeseries object with values as a flat array for maximum performance.

    Args:
        db_path: Path to the database file
        component_id: Component ID
        attribute_name: Name of the attribute (e.g., 'p', 'p_set', 'marginal_cost')
        scenario_id: Scenario ID (uses master scenario if None)
        start_index: Start index for range queries (optional)
        end_index: End index for range queries (optional)
        max_points: Maximum number of points for sampling (optional)

    Returns:
        Timeseries object with efficient array-based data

    Example:
        >>> ts = get_timeseries("model.db", component_id=123, attribute_name="p")
        >>> print(f"Length: {ts.length}, Values: {ts.values[:5]}")
        Length: 8760, Values: [100.5, 95.2, 87.3, 92.1, 88.7]

        # Get a subset of the data
        >>> ts_subset = get_timeseries("model.db", 123, "p", start_index=100, end_index=200)
        >>> print(f"Subset length: {ts_subset.length}")
        Subset length: 100

        # Sample large datasets
        >>> ts_sampled = get_timeseries("model.db", 123, "p", max_points=1000)
        >>> print(f"Sampled from {ts.length} to {ts_sampled.length} points")
    """
    with database_context(db_path, read_only=True) as conn:
        return _get_timeseries(
            conn,
            component_id,
            attribute_name,
            scenario_id,
            start_index,
            end_index,
            max_points,
        )

def get_timeseries_metadata(
    db_path: str,
    component_id: int,
    attribute_name: str,
    scenario_id: Optional[int] = None,
) -> TimeseriesMetadata:
    """
    Get timeseries metadata without loading the full data.

    This is useful for checking the size and properties of a timeseries
    before deciding whether to load the full data.

    Args:
        db_path: Path to the database file
        component_id: Component ID
        attribute_name: Name of the attribute
        scenario_id: Scenario ID (uses master scenario if None)

    Returns:
        TimeseriesMetadata with length and type information

    Example:
        >>> meta = get_timeseries_metadata("model.db", 123, "p")
        >>> print(f"Length: {meta.length}, Type: {meta.data_type}, Unit: {meta.unit}")
        Length: 8760, Type: float, Unit: MW
    """
    with database_context(db_path, read_only=True) as conn:
        return _get_timeseries_metadata(conn, component_id, attribute_name, scenario_id)
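Together, the metadata and data accessors support a check-before-load pattern. A minimal sketch, assuming a PyConvexity database at model.db and component id 123 (both hypothetical):

from pyconvexity.timeseries import get_timeseries, get_timeseries_metadata

# Inspect the series size first, then decide whether to downsample on load.
meta = get_timeseries_metadata("model.db", component_id=123, attribute_name="p")
if meta.length > 10_000:
    ts = get_timeseries("model.db", 123, "p", max_points=1_000)  # sampled view
else:
    ts = get_timeseries("model.db", 123, "p")  # full resolution
print(ts.length, ts.values[:5])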
def set_timeseries(
    db_path: str,
    component_id: int,
    attribute_name: str,
    values: Union[List[float], np.ndarray, Timeseries],
    scenario_id: Optional[int] = None,
) -> None:
    """
    Set timeseries data using efficient array-based format.

    This is the main function for storing timeseries data. It accepts
    various input formats and stores them efficiently in the database.

    Args:
        db_path: Path to the database file
        component_id: Component ID
        attribute_name: Name of the attribute
        values: Timeseries values as list, numpy array, or Timeseries object
        scenario_id: Scenario ID (uses master scenario if None)

    Example:
        # Set from a list
        >>> values = [100.5, 95.2, 87.3, 92.1, 88.7]
        >>> set_timeseries("model.db", 123, "p_set", values)

        # Set from numpy array
        >>> import numpy as np
        >>> values = np.random.normal(100, 10, 8760)  # Hourly data for a year
        >>> set_timeseries("model.db", 123, "p_max_pu", values)

        # Set from existing Timeseries object
        >>> ts = get_timeseries("model.db", 456, "p")
        >>> set_timeseries("model.db", 123, "p_set", ts)
    """
    # Convert input to list of floats
    if isinstance(values, Timeseries):
        values_list = values.values
    elif isinstance(values, np.ndarray):
        values_list = values.tolist()
    elif isinstance(values, list):
        values_list = [float(v) for v in values]
    else:
        raise ValueError("values must be List[float], numpy.ndarray, or Timeseries")

    with database_context(db_path) as conn:
        set_timeseries_attribute(
            conn, component_id, attribute_name, values_list, scenario_id
        )
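A write followed by a read goes through the same array-based path, so a round trip is a quick sanity check. Sketch, with a hypothetical path and component id:

import numpy as np
from pyconvexity.timeseries import get_timeseries, set_timeseries

# A per-unit availability profile for one year of hourly data.
profile = np.clip(np.random.normal(0.6, 0.2, 8760), 0.0, 1.0)
set_timeseries("model.db", 123, "p_max_pu", profile)

ts = get_timeseries("model.db", 123, "p_max_pu")
assert ts.length == len(profile)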
def get_multiple_timeseries(
    db_path: str, requests: List[dict], max_points: Optional[int] = None
) -> List[Timeseries]:
    """
    Get multiple timeseries efficiently in a single database connection.

    This is more efficient than calling get_timeseries multiple times
    when you need to load many timeseries from the same database.

    Args:
        db_path: Path to the database file
        requests: List of dicts with keys: component_id, attribute_name, scenario_id (optional)
        max_points: Maximum number of points for sampling (applied to all)

    Returns:
        List of Timeseries objects in the same order as requests

    Example:
        >>> requests = [
        ...     {"component_id": 123, "attribute_name": "p"},
        ...     {"component_id": 124, "attribute_name": "p"},
        ...     {"component_id": 125, "attribute_name": "p", "scenario_id": 2}
        ... ]
        >>> timeseries_list = get_multiple_timeseries("model.db", requests)
        >>> print(f"Loaded {len(timeseries_list)} timeseries")
    """
    results = []

    with database_context(db_path, read_only=True) as conn:
        for request in requests:
            component_id = request["component_id"]
            attribute_name = request["attribute_name"]
            scenario_id = request.get("scenario_id")

            ts = _get_timeseries(
                conn, component_id, attribute_name, scenario_id, None, None, max_points
            )
            results.append(ts)

    return results
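Because the batch loader keeps one connection open, it pairs naturally with vectorized post-processing. Sketch, with hypothetical component ids; note it assumes all returned series share one length:

import numpy as np
from pyconvexity.timeseries import get_multiple_timeseries, timeseries_to_numpy

component_ids = [123, 124, 125]
requests = [{"component_id": cid, "attribute_name": "p"} for cid in component_ids]
series = get_multiple_timeseries("model.db", requests, max_points=1000)

# Stack into a (components x time) matrix; assumes equal series lengths.
matrix = np.vstack([timeseries_to_numpy(ts) for ts in series])
print(matrix.shape, matrix.mean(axis=1))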

# ============================================================================
# UTILITY FUNCTIONS
# ============================================================================


def timeseries_to_numpy(timeseries: Timeseries) -> np.ndarray:
    """
    Convert Timeseries to numpy array for scientific computing.

    Args:
        timeseries: Timeseries object

    Returns:
        numpy array with float32 dtype for memory efficiency

    Example:
        >>> ts = get_timeseries("model.db", 123, "p")
        >>> arr = timeseries_to_numpy(ts)
        >>> print(f"Mean: {arr.mean():.2f}, Std: {arr.std():.2f}")
    """
    return np.array(timeseries.values, dtype=np.float32)


def numpy_to_timeseries(
    array: np.ndarray,
    data_type: str = "float",
    unit: Optional[str] = None,
    is_input: bool = True,
) -> Timeseries:
    """
    Convert numpy array to Timeseries object.

    Args:
        array: numpy array of values
        data_type: Data type string (default: "float")
        unit: Unit string (optional)
        is_input: Whether this is input data (default: True)

    Returns:
        Timeseries object

    Example:
        >>> import numpy as np
        >>> arr = np.random.normal(100, 10, 8760)
        >>> ts = numpy_to_timeseries(arr, unit="MW")
        >>> print(f"Created timeseries with {ts.length} points")
    """
    values = array.tolist() if hasattr(array, "tolist") else list(array)
    return Timeseries(
        values=[float(v) for v in values],
        length=len(values),
        start_index=0,
        data_type=data_type,
        unit=unit,
        is_input=is_input,
    )
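The two converters are inverses up to dtype: timeseries_to_numpy downcasts to float32 for memory efficiency, so a round trip can lose precision. Sketch:

import numpy as np
from pyconvexity.timeseries import numpy_to_timeseries, timeseries_to_numpy

arr = np.random.normal(100, 10, 8760)
ts = numpy_to_timeseries(arr, unit="MW")
back = timeseries_to_numpy(ts)  # float32, so only ~7 significant digits survive
assert np.allclose(arr, back, rtol=1e-4)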

def validate_timeseries_alignment(
    db_path: str, values: Union[List[float], np.ndarray, Timeseries]
) -> dict:
    """
    Validate that timeseries data aligns with network time periods.

    Args:
        db_path: Path to the database file
        values: Timeseries values to validate

    Returns:
        Dictionary with validation results

    Example:
        >>> values = [100.0] * 8760  # Hourly data for a year
        >>> result = validate_timeseries_alignment("model.db", values)
        >>> if result["is_valid"]:
        ...     print("Timeseries is properly aligned")
        ... else:
        ...     print(f"Alignment issues: {result['issues']}")
    """
    # Convert to list of floats
    if isinstance(values, Timeseries):
        values_list = values.values
    elif isinstance(values, np.ndarray):
        values_list = values.tolist()
    elif isinstance(values, list):
        values_list = [float(v) for v in values]
    else:
        raise ValueError("values must be List[float], numpy.ndarray, or Timeseries")

    with database_context(db_path, read_only=True) as conn:
        # Get network time periods
        from pyconvexity.models.network import get_network_time_periods

        try:
            time_periods = get_network_time_periods(conn)
            expected_length = len(time_periods)
            actual_length = len(values_list)

            is_valid = actual_length == expected_length
            issues = []

            if actual_length < expected_length:
                issues.append(f"Missing {expected_length - actual_length} time periods")
            elif actual_length > expected_length:
                issues.append(f"Extra {actual_length - expected_length} time periods")

            return {
                "is_valid": is_valid,
                "expected_length": expected_length,
                "actual_length": actual_length,
                "issues": issues,
            }

        except Exception as e:
            return {
                "is_valid": False,
                "expected_length": 0,
                "actual_length": len(values_list),
                "issues": [f"Failed to get network time periods: {e}"],
            }
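Validating before writing avoids storing a series the model cannot align with its time periods. A guard sketch, with a hypothetical path and component id:

from pyconvexity.timeseries import set_timeseries, validate_timeseries_alignment

values = [100.0] * 8760
report = validate_timeseries_alignment("model.db", values)
if report["is_valid"]:
    set_timeseries("model.db", 123, "p_set", values)
else:
    raise ValueError(f"Refusing to write misaligned series: {report['issues']}")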
pyconvexity/validation/__init__.py
@@ -0,0 +1,25 @@
"""
Validation module for PyConvexity.

Contains data validation rules and type checking functionality.
"""

from pyconvexity.validation.rules import (
    get_validation_rule,
    list_validation_rules,
    get_all_validation_rules,
    validate_static_value,
    validate_timeseries_alignment,
    parse_default_value,
    get_attribute_setter_info,
)

__all__ = [
    "get_validation_rule",
    "list_validation_rules",
    "get_all_validation_rules",
    "validate_static_value",
    "validate_timeseries_alignment",
    "parse_default_value",
    "get_attribute_setter_info",
]
pyconvexity/validation/rules.py
@@ -0,0 +1,312 @@
"""
Validation rules and operations for PyConvexity.

Provides validation logic for component attributes, data types, and timeseries alignment.
"""

import sqlite3
import json
import logging
from typing import Dict, Any, Optional, List

from pyconvexity.core.types import (
    ValidationRule,
    StaticValue,
    TimePeriod,
    TimeseriesValidationResult,
)
from pyconvexity.core.errors import ValidationError, InvalidDataType

logger = logging.getLogger(__name__)


def get_validation_rule(
    conn: sqlite3.Connection, component_type: str, attribute_name: str
) -> ValidationRule:
    """
    Get validation rule for a specific component type and attribute.

    Args:
        conn: Database connection
        component_type: Type of component (e.g., "BUS", "GENERATOR")
        attribute_name: Name of the attribute

    Returns:
        ValidationRule object with all validation information

    Raises:
        ValidationError: If no validation rule is found
    """
    cursor = conn.execute(
        """
        SELECT component_type, attribute_name, data_type, unit, default_value, allowed_storage_types,
               is_required, is_input, description
        FROM attribute_validation_rules
        WHERE component_type = ? AND attribute_name = ?
        """,
        (component_type, attribute_name),
    )

    row = cursor.fetchone()
    if not row:
        raise ValidationError(
            f"No validation rule found for {component_type}.{attribute_name}"
        )

    allowed_storage_types = row[5]
    allows_static = allowed_storage_types in ("static", "static_or_timeseries")
    allows_timeseries = allowed_storage_types in ("timeseries", "static_or_timeseries")

    # Parse default value
    default_value = None
    if row[4]:  # default_value_string
        default_value = parse_default_value(row[4])

    return ValidationRule(
        component_type=row[0],
        attribute_name=row[1],
        data_type=row[2],
        unit=row[3],
        default_value_string=row[4],
        allowed_storage_types=allowed_storage_types,
        allows_static=allows_static,
        allows_timeseries=allows_timeseries,
        is_required=bool(row[6]),
        is_input=bool(row[7]),
        description=row[8],
        default_value=default_value,
    )
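Rules are keyed by (component_type, attribute_name), so callers typically fetch one rule and branch on its storage flags. Sketch, assuming a database at model.db containing a GENERATOR rule for p_max_pu (both illustrative):

from pyconvexity.core.database import database_context
from pyconvexity.validation.rules import get_validation_rule

with database_context("model.db", read_only=True) as conn:
    rule = get_validation_rule(conn, "GENERATOR", "p_max_pu")
    if rule.allows_timeseries:
        print(f"{rule.attribute_name} accepts timeseries ({rule.unit})")
    elif rule.allows_static:
        print(f"{rule.attribute_name} is static-only, default {rule.default_value}")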
def list_validation_rules(
    conn: sqlite3.Connection, component_type: str
) -> List[ValidationRule]:
    """
    List validation rules for a component type.

    Args:
        conn: Database connection
        component_type: Type of component

    Returns:
        List of ValidationRule objects
    """
    cursor = conn.execute(
        """
        SELECT component_type, attribute_name, data_type, unit, default_value, allowed_storage_types,
               is_required, is_input, description
        FROM attribute_validation_rules
        WHERE component_type = ?
        ORDER BY attribute_name
        """,
        (component_type,),
    )

    rules = []
    for row in cursor.fetchall():
        allowed_storage_types = row[5]
        allows_static = allowed_storage_types in ("static", "static_or_timeseries")
        allows_timeseries = allowed_storage_types in (
            "timeseries",
            "static_or_timeseries",
        )

        # Parse default value
        default_value = None
        if row[4]:  # default_value_string
            default_value = parse_default_value(row[4])

        rules.append(
            ValidationRule(
                component_type=row[0],
                attribute_name=row[1],
                data_type=row[2],
                unit=row[3],
                default_value_string=row[4],
                allowed_storage_types=allowed_storage_types,
                allows_static=allows_static,
                allows_timeseries=allows_timeseries,
                is_required=bool(row[6]),
                is_input=bool(row[7]),
                description=row[8],
                default_value=default_value,
            )
        )

    return rules

def get_all_validation_rules(conn: sqlite3.Connection) -> Dict[str, Any]:
    """
    Get all validation rules from the database.
    This replaces the need to load the entire JSON file into memory.

    Args:
        conn: Database connection

    Returns:
        Dictionary mapping component types to their validation rules
    """
    try:
        cursor = conn.execute(
            """
            SELECT component_type, attribute_name, data_type, unit, default_value, allowed_storage_types,
                   is_required, is_input, description
            FROM attribute_validation_rules
            """
        )

        rules = {}
        for row in cursor.fetchall():
            component_type = row[0]
            attribute_name = row[1]
            data_type = row[2]
            unit = row[3]
            default_value = row[4]
            allowed_storage_types = row[5]
            is_required = bool(row[6])
            is_input = bool(row[7])
            description = row[8]

            if component_type not in rules:
                rules[component_type] = {}

            rules[component_type][attribute_name] = {
                "data_type": data_type,
                "unit": unit,
                "default_value": default_value,
                "allowed_storage_types": allowed_storage_types,
                "is_required": is_required,
                "is_input": is_input,
                "description": description,
            }

        return rules
    except Exception as e:
        logger.error(f"Error getting all validation rules: {e}")
        return {}

def validate_static_value(value: StaticValue, rule: ValidationRule) -> None:
    """
    Validate static value against rule.

    Args:
        value: StaticValue to validate
        rule: ValidationRule to validate against

    Raises:
        InvalidDataType: If value type doesn't match rule
    """
    value_type = value.data_type()

    if value_type != rule.data_type:
        raise InvalidDataType(expected=rule.data_type, actual=value_type)
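validate_static_value raises rather than returning a flag, so call sites wrap it in try/except. Sketch, assuming a database at model.db with a float-typed GENERATOR attribute p_nom (illustrative names):

from pyconvexity.core.database import database_context
from pyconvexity.core.errors import InvalidDataType
from pyconvexity.core.types import StaticValue
from pyconvexity.validation.rules import get_validation_rule, validate_static_value

with database_context("model.db", read_only=True) as conn:
    rule = get_validation_rule(conn, "GENERATOR", "p_nom")
    try:
        validate_static_value(StaticValue(500.0), rule)
    except InvalidDataType as err:
        print(f"Rejected: {err}")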

def validate_timeseries_alignment(
    conn: sqlite3.Connection, timeseries: List[TimePeriod]
) -> TimeseriesValidationResult:
    """
    Validate timeseries alignment with network periods (single network per database).

    Args:
        conn: Database connection
        timeseries: List of timeseries points to validate

    Returns:
        TimeseriesValidationResult with validation details
    """
    # Get network time periods
    from pyconvexity.models.network import get_network_time_periods

    network_periods = get_network_time_periods(conn)
    network_period_indices = {p.period_index for p in network_periods}

    # Get provided period indices
    provided_period_indices = {p.period_index for p in timeseries}

    # Find missing and extra periods
    missing_periods = list(network_period_indices - provided_period_indices)
    extra_periods = list(provided_period_indices - network_period_indices)

    is_valid = len(missing_periods) == 0 and len(extra_periods) == 0

    return TimeseriesValidationResult(
        is_valid=is_valid,
        missing_periods=missing_periods,
        extra_periods=extra_periods,
        total_network_periods=len(network_periods),
        provided_periods=len(timeseries),
    )

def parse_default_value(s: str) -> Optional[StaticValue]:
    """
    Parse default value string.

    Args:
        s: String representation of default value

    Returns:
        StaticValue object or None if parsing fails
    """
    # Try to parse as JSON first; any scalar JSON value becomes a StaticValue
    try:
        value = json.loads(s)
        if isinstance(value, (bool, int, float, str)):
            return StaticValue(value)
        return None
    except (json.JSONDecodeError, ValueError):
        # Fallback to string
        return StaticValue(s)
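JSON parsing means numeric-looking defaults come back typed, while anything unparsable falls back to a plain string. For instance (illustrative inputs):

from pyconvexity.validation.rules import parse_default_value

parse_default_value("1.5")     # StaticValue wrapping the float 1.5
parse_default_value("true")    # StaticValue wrapping the bool True
parse_default_value("AC")      # not valid JSON -> StaticValue wrapping the string "AC"
parse_default_value("[1, 2]")  # JSON list is not a static scalar -> None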

def get_attribute_setter_info(
    conn: sqlite3.Connection,
    component_type: str,
    attribute_name: str,
) -> Dict[str, Any]:
    """
    Get the appropriate function name for setting an attribute.

    Args:
        conn: Database connection
        component_type: Type of component
        attribute_name: Name of the attribute

    Returns:
        Dictionary with setter function information

    Raises:
        ValidationError: If attribute or data type is unknown
    """
    rule = get_validation_rule(conn, component_type, attribute_name)

    function_name = {
        "float": "set_float_attribute",
        "int": "set_integer_attribute",
        "boolean": "set_boolean_attribute",
        "string": "set_string_attribute",
    }.get(rule.data_type)

    if not function_name:
        raise ValidationError(f"Unknown data type: {rule.data_type}")

    return {
        "function_name": function_name,
        "data_type": rule.data_type,
        "allows_static": rule.allows_static,
        "allows_timeseries": rule.allows_timeseries,
        "is_required": rule.is_required,
        "default_value": rule.default_value_string,
        "unit": rule.unit,
        "description": rule.description,
    }
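The returned function_name is a string, so a dynamic caller resolves it against whatever module hosts the typed setters. A sketch under stated assumptions: the getattr target module and the setter signature are guesses, since the typed setters themselves are not shown in this diff.

from pyconvexity.core.database import database_context
from pyconvexity.validation.rules import get_attribute_setter_info
import pyconvexity.models.attributes as attributes  # assumed host of the typed setters

with database_context("model.db") as conn:
    info = get_attribute_setter_info(conn, "GENERATOR", "p_nom")
    setter = getattr(attributes, info["function_name"], None)
    if setter is not None and info["allows_static"]:
        setter(conn, 123, "p_nom", 500.0)  # hypothetical signature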