voxcity 0.6.26__py3-none-any.whl → 1.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (81)
  1. voxcity/__init__.py +10 -4
  2. voxcity/downloader/__init__.py +2 -1
  3. voxcity/downloader/gba.py +210 -0
  4. voxcity/downloader/gee.py +5 -1
  5. voxcity/downloader/mbfp.py +1 -1
  6. voxcity/downloader/oemj.py +80 -8
  7. voxcity/downloader/utils.py +73 -73
  8. voxcity/errors.py +30 -0
  9. voxcity/exporter/__init__.py +9 -1
  10. voxcity/exporter/cityles.py +129 -34
  11. voxcity/exporter/envimet.py +51 -26
  12. voxcity/exporter/magicavoxel.py +42 -5
  13. voxcity/exporter/netcdf.py +27 -0
  14. voxcity/exporter/obj.py +103 -28
  15. voxcity/generator/__init__.py +47 -0
  16. voxcity/generator/api.py +721 -0
  17. voxcity/generator/grids.py +381 -0
  18. voxcity/generator/io.py +94 -0
  19. voxcity/generator/pipeline.py +282 -0
  20. voxcity/generator/update.py +429 -0
  21. voxcity/generator/voxelizer.py +392 -0
  22. voxcity/geoprocessor/__init__.py +75 -6
  23. voxcity/geoprocessor/conversion.py +153 -0
  24. voxcity/geoprocessor/draw.py +1488 -1169
  25. voxcity/geoprocessor/heights.py +199 -0
  26. voxcity/geoprocessor/io.py +101 -0
  27. voxcity/geoprocessor/merge_utils.py +91 -0
  28. voxcity/geoprocessor/mesh.py +26 -10
  29. voxcity/geoprocessor/network.py +35 -6
  30. voxcity/geoprocessor/overlap.py +84 -0
  31. voxcity/geoprocessor/raster/__init__.py +82 -0
  32. voxcity/geoprocessor/raster/buildings.py +435 -0
  33. voxcity/geoprocessor/raster/canopy.py +258 -0
  34. voxcity/geoprocessor/raster/core.py +150 -0
  35. voxcity/geoprocessor/raster/export.py +93 -0
  36. voxcity/geoprocessor/raster/landcover.py +159 -0
  37. voxcity/geoprocessor/raster/raster.py +110 -0
  38. voxcity/geoprocessor/selection.py +85 -0
  39. voxcity/geoprocessor/utils.py +824 -820
  40. voxcity/models.py +113 -0
  41. voxcity/simulator/common/__init__.py +22 -0
  42. voxcity/simulator/common/geometry.py +98 -0
  43. voxcity/simulator/common/raytracing.py +450 -0
  44. voxcity/simulator/solar/__init__.py +66 -0
  45. voxcity/simulator/solar/integration.py +336 -0
  46. voxcity/simulator/solar/kernels.py +62 -0
  47. voxcity/simulator/solar/radiation.py +648 -0
  48. voxcity/simulator/solar/sky.py +668 -0
  49. voxcity/simulator/solar/temporal.py +792 -0
  50. voxcity/simulator/view.py +36 -2286
  51. voxcity/simulator/visibility/__init__.py +29 -0
  52. voxcity/simulator/visibility/landmark.py +392 -0
  53. voxcity/simulator/visibility/view.py +508 -0
  54. voxcity/utils/__init__.py +11 -0
  55. voxcity/utils/classes.py +194 -0
  56. voxcity/utils/lc.py +80 -39
  57. voxcity/utils/logging.py +61 -0
  58. voxcity/utils/orientation.py +51 -0
  59. voxcity/utils/shape.py +230 -0
  60. voxcity/utils/weather/__init__.py +26 -0
  61. voxcity/utils/weather/epw.py +146 -0
  62. voxcity/utils/weather/files.py +36 -0
  63. voxcity/utils/weather/onebuilding.py +486 -0
  64. voxcity/visualizer/__init__.py +24 -0
  65. voxcity/visualizer/builder.py +43 -0
  66. voxcity/visualizer/grids.py +141 -0
  67. voxcity/visualizer/maps.py +187 -0
  68. voxcity/visualizer/palette.py +228 -0
  69. voxcity/visualizer/renderer.py +1145 -0
  70. {voxcity-0.6.26.dist-info → voxcity-1.0.2.dist-info}/METADATA +162 -48
  71. voxcity-1.0.2.dist-info/RECORD +81 -0
  72. voxcity/generator.py +0 -1302
  73. voxcity/geoprocessor/grid.py +0 -1739
  74. voxcity/geoprocessor/polygon.py +0 -1344
  75. voxcity/simulator/solar.py +0 -2339
  76. voxcity/utils/visualization.py +0 -2849
  77. voxcity/utils/weather.py +0 -1038
  78. voxcity-0.6.26.dist-info/RECORD +0 -38
  79. {voxcity-0.6.26.dist-info → voxcity-1.0.2.dist-info}/WHEEL +0 -0
  80. {voxcity-0.6.26.dist-info → voxcity-1.0.2.dist-info}/licenses/AUTHORS.rst +0 -0
  81. {voxcity-0.6.26.dist-info → voxcity-1.0.2.dist-info}/licenses/LICENSE +0 -0
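The file list shows the shape of the 1.0.2 refactor: the monolithic 0.6.26 modules are removed (voxcity/generator.py, voxcity/geoprocessor/grid.py, voxcity/geoprocessor/polygon.py, voxcity/simulator/solar.py, voxcity/utils/visualization.py, voxcity/utils/weather.py) and replaced by the voxcity/generator/, voxcity/geoprocessor/raster/, voxcity/simulator/solar/, voxcity/simulator/visibility/, voxcity/visualizer/, and voxcity/utils/weather/ packages. The diff does not show what the new __init__.py files re-export, so whether the old import paths still resolve in 1.0.2 is an assumption; a minimal migration sketch for the weather utilities, with the fallback path inferred only from the filenames above:

    # Hypothetical migration sketch. Assumes voxcity/utils/weather/__init__.py
    # re-exports the old entry points; this diff does not confirm that.
    try:
        # 0.6.26 import path; still works in 1.0.2 if re-exported by the package.
        from voxcity.utils.weather import get_nearest_epw_from_climate_onebuilding
    except ImportError:
        # Likely new home of the Climate.OneBuilding.Org logic, inferred only
        # from the filename voxcity/utils/weather/onebuilding.py listed above.
        from voxcity.utils.weather.onebuilding import get_nearest_epw_from_climate_onebuilding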
voxcity/utils/weather.py DELETED
@@ -1,1038 +0,0 @@
- """
- Weather data utilities for VoxelCity.
- 
- This module provides functionality to download and process EnergyPlus Weather (EPW) files
- from Climate.OneBuilding.Org based on geographical coordinates. It includes utilities for:
- 
- - Automatically finding the nearest weather station to given coordinates
- - Downloading EPW files from various global regions
- - Processing EPW files into pandas DataFrames for analysis
- - Extracting solar radiation data for solar simulations
- 
- The main function get_nearest_epw_from_climate_onebuilding() provides a comprehensive
- solution for obtaining weather data for any global location by automatically detecting
- the appropriate region and finding the closest available weather station.
- """
- 
- import requests
- import xml.etree.ElementTree as ET
- import re
- from math import radians, sin, cos, sqrt, atan2
- from pathlib import Path
- from typing import Optional, Dict, List, Tuple, Union
- import json
- import zipfile
- import pandas as pd
- import io
- import os
- import numpy as np
- from datetime import datetime
- 
- # =============================================================================
- # FILE HANDLING UTILITIES
- # =============================================================================
- 
- def safe_rename(src: Path, dst: Path) -> Path:
-     """
-     Safely rename a file, handling existing files by adding a number suffix.
- 
-     This function prevents file conflicts by automatically generating unique filenames
-     when the target destination already exists. It appends incremental numbers to
-     the base filename until a unique name is found.
- 
-     Args:
-         src: Source file path
-         dst: Destination file path
- 
-     Returns:
-         Path: Final destination path used
-     """
-     # If destination doesn't exist, simple rename
-     if not dst.exists():
-         src.rename(dst)
-         return dst
- 
-     # If file exists, add number suffix
-     base = dst.stem
-     ext = dst.suffix
-     counter = 1
-     # Keep incrementing counter until we find a name that doesn't exist
-     while True:
-         new_dst = dst.with_name(f"{base}_{counter}{ext}")
-         if not new_dst.exists():
-             src.rename(new_dst)
-             return new_dst
-         counter += 1
- 
- def safe_extract(zip_ref: zipfile.ZipFile, filename: str, extract_dir: Path) -> Path:
-     """
-     Safely extract a file from zip, handling existing files.
- 
-     This function handles the case where a file with the same name already exists
-     in the extraction directory by using a temporary filename with random suffix.
- 
-     Args:
-         zip_ref: Open ZipFile reference
-         filename: Name of file to extract
-         extract_dir: Directory to extract to
- 
-     Returns:
-         Path: Path to extracted file
-     """
-     try:
-         zip_ref.extract(filename, extract_dir)
-         return extract_dir / filename
-     except FileExistsError:
-         # If file exists, extract to temporary name and return path
-         temp_name = f"temp_{os.urandom(4).hex()}_{filename}"
-         zip_ref.extract(filename, extract_dir, temp_name)
-         return extract_dir / temp_name
- 
- # =============================================================================
- # EPW FILE PROCESSING
- # =============================================================================
- 
- def process_epw(epw_path: Union[str, Path]) -> Tuple[pd.DataFrame, Dict]:
-     """
-     Process an EPW file into a pandas DataFrame.
- 
-     EPW (EnergyPlus Weather) files contain standardized weather data in a specific format.
-     The first 8 lines contain metadata, followed by 8760 lines of hourly weather data
-     for a typical meteorological year.
- 
-     Args:
-         epw_path: Path to the EPW file
- 
-     Returns:
-         Tuple containing:
-             - DataFrame with hourly weather data indexed by datetime
-             - Dictionary with EPW header metadata including location information
-     """
-     # EPW column names (these are standardized across all EPW files)
-     columns = [
-         'Year', 'Month', 'Day', 'Hour', 'Minute',
-         'Data Source and Uncertainty Flags',
-         'Dry Bulb Temperature', 'Dew Point Temperature',
-         'Relative Humidity', 'Atmospheric Station Pressure',
-         'Extraterrestrial Horizontal Radiation',
-         'Extraterrestrial Direct Normal Radiation',
-         'Horizontal Infrared Radiation Intensity',
-         'Global Horizontal Radiation',
-         'Direct Normal Radiation', 'Diffuse Horizontal Radiation',
-         'Global Horizontal Illuminance',
-         'Direct Normal Illuminance', 'Diffuse Horizontal Illuminance',
-         'Zenith Luminance', 'Wind Direction', 'Wind Speed',
-         'Total Sky Cover', 'Opaque Sky Cover', 'Visibility',
-         'Ceiling Height', 'Present Weather Observation',
-         'Present Weather Codes', 'Precipitable Water',
-         'Aerosol Optical Depth', 'Snow Depth',
-         'Days Since Last Snowfall', 'Albedo',
-         'Liquid Precipitation Depth', 'Liquid Precipitation Quantity'
-     ]
- 
-     # Read EPW file - EPW files are always in comma-separated format
-     with open(epw_path, 'r') as f:
-         lines = f.readlines()
- 
-     # Extract header metadata (first 8 lines contain standardized metadata)
-     headers = {
-         'LOCATION': lines[0].strip(),
-         'DESIGN_CONDITIONS': lines[1].strip(),
-         'TYPICAL_EXTREME_PERIODS': lines[2].strip(),
-         'GROUND_TEMPERATURES': lines[3].strip(),
-         'HOLIDAYS_DAYLIGHT_SAVINGS': lines[4].strip(),
-         'COMMENTS_1': lines[5].strip(),
-         'COMMENTS_2': lines[6].strip(),
-         'DATA_PERIODS': lines[7].strip()
-     }
- 
-     # Parse location data from first header line
-     # Format: LOCATION,City,State,Country,Source,WMO,Latitude,Longitude,TimeZone,Elevation
-     location = headers['LOCATION'].split(',')
-     if len(location) >= 10:
-         headers['LOCATION'] = {
-             'City': location[1].strip(),
-             'State': location[2].strip(),
-             'Country': location[3].strip(),
-             'Data Source': location[4].strip(),
-             'WMO': location[5].strip(),
-             'Latitude': float(location[6]),
-             'Longitude': float(location[7]),
-             'Time Zone': float(location[8]),
-             'Elevation': float(location[9])
-         }
- 
-     # Create DataFrame from weather data (skipping 8 header lines)
-     data = [line.strip().split(',') for line in lines[8:]]
-     df = pd.DataFrame(data, columns=columns)
- 
-     # Convert numeric columns to appropriate data types
-     # All weather parameters should be numeric except uncertainty flags and weather codes
-     numeric_columns = [
-         'Year', 'Month', 'Day', 'Hour', 'Minute',
-         'Dry Bulb Temperature', 'Dew Point Temperature',
-         'Relative Humidity', 'Atmospheric Station Pressure',
-         'Extraterrestrial Horizontal Radiation',
-         'Extraterrestrial Direct Normal Radiation',
-         'Horizontal Infrared Radiation Intensity',
-         'Global Horizontal Radiation',
-         'Direct Normal Radiation', 'Diffuse Horizontal Radiation',
-         'Global Horizontal Illuminance',
-         'Direct Normal Illuminance', 'Diffuse Horizontal Illuminance',
-         'Zenith Luminance', 'Wind Direction', 'Wind Speed',
-         'Total Sky Cover', 'Opaque Sky Cover', 'Visibility',
-         'Ceiling Height', 'Precipitable Water',
-         'Aerosol Optical Depth', 'Snow Depth',
-         'Days Since Last Snowfall', 'Albedo',
-         'Liquid Precipitation Depth', 'Liquid Precipitation Quantity'
-     ]
- 
-     # Convert to numeric, handling any parsing errors gracefully
-     for col in numeric_columns:
-         df[col] = pd.to_numeric(df[col], errors='coerce')
- 
-     # Create datetime index for time series analysis
-     # EPW hours are 1-24, but pandas expects 0-23 for proper datetime handling
-     df['datetime'] = pd.to_datetime({
-         'year': df['Year'],
-         'month': df['Month'],
-         'day': df['Day'],
-         'hour': df['Hour'] - 1,  # EPW hours are 1-24, pandas expects 0-23
-         'minute': df['Minute']
-     })
-     df.set_index('datetime', inplace=True)
- 
-     return df, headers
- 
- # =============================================================================
- # MAIN WEATHER DATA DOWNLOAD FUNCTION
- # =============================================================================
- 
- def get_nearest_epw_from_climate_onebuilding(longitude: float, latitude: float, output_dir: str = "./", max_distance: Optional[float] = None,
-                                              extract_zip: bool = True, load_data: bool = True, region: Optional[Union[str, List[str]]] = None,
-                                              allow_insecure_ssl: bool = False, allow_http_fallback: bool = False,
-                                              ssl_verify: Union[bool, str] = True) -> Tuple[Optional[str], Optional[pd.DataFrame], Optional[Dict]]:
-     """
-     Download and process EPW weather file from Climate.OneBuilding.Org based on coordinates.
- 
-     This function automatically finds and downloads the nearest available weather station
-     data from Climate.OneBuilding.Org's global database. It supports region-based searching
-     for improved performance and can automatically detect the appropriate region based on
-     coordinates.
- 
-     The function performs the following steps:
-     1. Determines which regional KML files to scan based on coordinates or user input
-     2. Downloads and parses KML files to extract weather station metadata
-     3. Calculates distances to find the nearest station
-     4. Downloads the EPW file from the nearest station
-     5. Optionally processes the EPW data into a pandas DataFrame
- 
-     Args:
-         longitude (float): Longitude of the location (-180 to 180)
-         latitude (float): Latitude of the location (-90 to 90)
-         output_dir (str): Directory to save the EPW file (defaults to current directory)
-         max_distance (float, optional): Maximum distance in kilometers to search for stations.
-             If no stations within this distance, uses closest available.
-         extract_zip (bool): Whether to extract the ZIP file (default True)
-         load_data (bool): Whether to load the EPW data into a DataFrame (default True)
-         region (str or List[str], optional): Specific region(s) or dataset(s) to scan for stations.
-             Regions: "Africa", "Asia", "South_America",
-             "North_and_Central_America", "Southwest_Pacific",
-             "Europe", "Antarctica".
-             Sub-datasets (can be used alone or auto-included by region):
-             "Japan", "India", "CSWD", "CityUHK", "PHIKO",
-             "Argentina", "INMET_TRY", "AMTUes", "BrazFuture",
-             plus legacy "Canada", "USA", "Caribbean" (Region 4).
-             Use "all" to scan every dataset.
-             If None, will auto-detect region based on coordinates.
-         allow_insecure_ssl (bool): If True, on SSL errors retry with certificate verification disabled.
-         allow_http_fallback (bool): If True, on SSL/network errors, also try HTTP (insecure) fallback.
-         ssl_verify (bool|str): Passed to requests as 'verify' parameter for HTTPS; can be False or CA bundle path.
- 
-     Returns:
-         Tuple containing:
-             - Path to the EPW file (or None if download fails)
-             - DataFrame with hourly weather data (if load_data=True, else None)
-             - Dictionary with EPW header metadata (if load_data=True, else None)
- 
-     Raises:
-         ValueError: If invalid region specified or no weather stations found
-         requests.exceptions.RequestException: If network requests fail
-     """
- 
-     # Regional KML sources from Climate.OneBuilding.Org (2024+ TMYx structure)
-     # Each WMO region maintains a primary KML in /sources with the naming pattern:
-     # Region{N}_{Name}_TMYx_EPW_Processing_locations.kml
-     # Keep sub-region keys for backward compatibility (mapping to the Region KML where applicable)
-     KML_SOURCES = {
-         # WMO Region 1
-         "Africa": "https://climate.onebuilding.org/sources/Region1_Africa_TMYx_EPW_Processing_locations.kml",
-         # WMO Region 2
-         "Asia": "https://climate.onebuilding.org/sources/Region2_Asia_TMYx_EPW_Processing_locations.kml",
-         # Subsets/datasets within Asia that still publish dedicated KMLs
-         "Japan": "https://climate.onebuilding.org/sources/JGMY_EPW_Processing_locations.kml",
-         "India": "https://climate.onebuilding.org/sources/ITMY_EPW_Processing_locations.kml",
-         "CSWD": "https://climate.onebuilding.org/sources/CSWD_EPW_Processing_locations.kml",
-         "CityUHK": "https://climate.onebuilding.org/sources/CityUHK_EPW_Processing_locations.kml",
-         "PHIKO": "https://climate.onebuilding.org/sources/PHIKO_EPW_Processing_locations.kml",
-         # WMO Region 3
-         "South_America": "https://climate.onebuilding.org/sources/Region3_South_America_TMYx_EPW_Processing_locations.kml",
-         # Historical/legacy dataset for Argentina maintained separately
-         "Argentina": "https://climate.onebuilding.org/sources/ArgTMY_EPW_Processing_locations.kml",
-         "INMET_TRY": "https://climate.onebuilding.org/sources/INMET_TRY_EPW_Processing_locations.kml",
-         "AMTUes": "https://climate.onebuilding.org/sources/AMTUes_EPW_Processing_locations.kml",
-         "BrazFuture": "https://climate.onebuilding.org/sources/BrazFuture_EPW_Processing_locations.kml",
-         # WMO Region 4 (use subregion KMLs; umbrella selection expands to these)
-         # Note: There is no single unified Region 4 KML in /sources as of 2024.
-         # Use these three subregion KMLs instead.
-         "Canada": "https://climate.onebuilding.org/sources/Region4_Canada_TMYx_EPW_Processing_locations.kml",
-         "USA": "https://climate.onebuilding.org/sources/Region4_USA_TMYx_EPW_Processing_locations.kml",
-         "Caribbean": "https://climate.onebuilding.org/sources/Region4_NA_CA_Caribbean_TMYx_EPW_Processing_locations.kml",
-         # WMO Region 5
-         "Southwest_Pacific": "https://climate.onebuilding.org/sources/Region5_Southwest_Pacific_TMYx_EPW_Processing_locations.kml",
-         # WMO Region 6
-         "Europe": "https://climate.onebuilding.org/sources/Region6_Europe_TMYx_EPW_Processing_locations.kml",
-         # WMO Region 7
-         "Antarctica": "https://climate.onebuilding.org/sources/Region7_Antarctica_TMYx_EPW_Processing_locations.kml",
-     }
- 
-     # Group region selections to include relevant sub-datasets automatically
-     REGION_DATASET_GROUPS = {
-         "Africa": ["Africa"],
-         "Asia": ["Asia", "Japan", "India", "CSWD", "CityUHK", "PHIKO"],
-         "South_America": ["South_America", "Argentina", "INMET_TRY", "AMTUes", "BrazFuture"],
-         "North_and_Central_America": ["North_and_Central_America", "Canada", "USA", "Caribbean"],
-         "Southwest_Pacific": ["Southwest_Pacific"],
-         "Europe": ["Europe"],
-         "Antarctica": ["Antarctica"],
-     }
- 
-     # Define approximate geographical boundaries for automatic region detection
-     # These bounds help determine which regional KML files to scan based on coordinates
-     REGION_BOUNDS = {
-         # WMO Region 1 - Africa (includes islands in Indian Ocean and Spanish territories off N. Africa)
-         "Africa": {"lon_min": -25, "lon_max": 80, "lat_min": -55, "lat_max": 45},
-         # WMO Region 2 - Asia (includes SE Asia, West Asia, Asian Russia, and BIOT)
-         "Asia": {"lon_min": 20, "lon_max": 180, "lat_min": -10, "lat_max": 80},
-         # Subsets
-         "Japan": {"lon_min": 127, "lon_max": 146, "lat_min": 24, "lat_max": 46},
-         "India": {"lon_min": 68, "lon_max": 97, "lat_min": 6, "lat_max": 36},
-         # WMO Region 3 - South America (includes Falklands, South Georgia/Sandwich, Galapagos)
-         "South_America": {"lon_min": -92, "lon_max": -20, "lat_min": -60, "lat_max": 15},
-         # Legacy/compatibility subset
-         "Argentina": {"lon_min": -75, "lon_max": -53, "lat_min": -55, "lat_max": -22},
-         # WMO Region 4 - North and Central America (includes Greenland and Caribbean)
-         "North_and_Central_America": {"lon_min": -180, "lon_max": 20, "lat_min": -10, "lat_max": 85},
-         # Backward-compatible subsets mapped to Region 4 KML
-         "Canada": {"lon_min": -141, "lon_max": -52, "lat_min": 42, "lat_max": 83},
-         "USA": {"lon_min": -170, "lon_max": -65, "lat_min": 20, "lat_max": 72},
-         "Caribbean": {"lon_min": -90, "lon_max": -59, "lat_min": 10, "lat_max": 27},
-         # WMO Region 5 - Southwest Pacific (covers SE Asia + Pacific islands + Hawaii via antimeridian)
-         "Southwest_Pacific": {
-             "boxes": [
-                 {"lon_min": 90, "lon_max": 180, "lat_min": -50, "lat_max": 25},
-                 {"lon_min": -180, "lon_max": -140, "lat_min": -50, "lat_max": 25},
-             ]
-         },
-         # WMO Region 6 - Europe (includes Middle East countries listed and Greenland)
-         "Europe": {"lon_min": -75, "lon_max": 60, "lat_min": 25, "lat_max": 85},
-         # WMO Region 7 - Antarctica
-         "Antarctica": {"lon_min": -180, "lon_max": 180, "lat_min": -90, "lat_max": -60}
-     }
- 
-     def detect_regions(lon: float, lat: float) -> List[str]:
-         """
-         Detect which region(s) the coordinates belong to.
- 
-         Uses the REGION_BOUNDS to determine appropriate regions to search.
-         If coordinates don't fall within any region, returns the 3 closest regions.
- 
-         Args:
-             lon: Longitude coordinate
-             lat: Latitude coordinate
- 
-         Returns:
-             List of region names to search
-         """
-         matching_regions = []
- 
-         # Handle special case of longitude wrap around 180/-180
-         # Normalize longitude to standard -180 to 180 range
-         lon_adjusted = lon
-         if lon < -180:
-             lon_adjusted = lon + 360
-         elif lon > 180:
-             lon_adjusted = lon - 360
- 
-         # Helper to test point within a single box
-         def _in_box(bx: Dict[str, float], lon_v: float, lat_v: float) -> bool:
-             return (bx["lon_min"] <= lon_v <= bx["lon_max"] and
-                     bx["lat_min"] <= lat_v <= bx["lat_max"])
- 
-         # Check if coordinates fall within any region bounds (support multi-box)
-         for region_name, bounds in REGION_BOUNDS.items():
-             if "boxes" in bounds:
-                 for bx in bounds["boxes"]:
-                     if _in_box(bx, lon_adjusted, lat):
-                         matching_regions.append(region_name)
-                         break
-             else:
-                 if _in_box(bounds, lon_adjusted, lat):
-                     matching_regions.append(region_name)
- 
-         # If no regions matched, find the closest regions by boundary distance
-         if not matching_regions:
-             # Calculate "distance" to each region's boundary (simplified metric)
-             region_distances = []
-             for region_name, bounds in REGION_BOUNDS.items():
-                 def _box_distance(bx: Dict[str, float]) -> float:
-                     lon_dist = 0
-                     if lon_adjusted < bx["lon_min"]:
-                         lon_dist = bx["lon_min"] - lon_adjusted
-                     elif lon_adjusted > bx["lon_max"]:
-                         lon_dist = lon_adjusted - bx["lon_max"]
-                     lat_dist = 0
-                     if lat < bx["lat_min"]:
-                         lat_dist = bx["lat_min"] - lat
-                     elif lat > bx["lat_max"]:
-                         lat_dist = lat - bx["lat_max"]
-                     return (lon_dist**2 + lat_dist**2)**0.5
- 
-                 if "boxes" in bounds:
-                     d = min(_box_distance(bx) for bx in bounds["boxes"])
-                 else:
-                     d = _box_distance(bounds)
-                 region_distances.append((region_name, d))
- 
-             # Get 3 closest regions to ensure we find stations
-             closest_regions = sorted(region_distances, key=lambda x: x[1])[:3]
-             matching_regions = [r[0] for r in closest_regions]
- 
-         return matching_regions
- 
-     def try_decode(content: bytes) -> str:
-         """
-         Try different encodings to decode content.
- 
-         KML files from different regions may use various text encodings.
-         This function tries common encodings to successfully decode the content.
- 
-         Args:
-             content: Raw bytes content
- 
-         Returns:
-             Decoded string content
-         """
-         # Try common encodings in order of preference
-         encodings = ['utf-8', 'latin1', 'iso-8859-1', 'cp1252']
-         for encoding in encodings:
-             try:
-                 return content.decode(encoding)
-             except UnicodeDecodeError:
-                 continue
- 
-         # If all else fails, try to decode with replacement characters
-         return content.decode('utf-8', errors='replace')
- 
-     def clean_xml(content: str) -> str:
-         """
-         Clean XML content of invalid characters.
- 
-         Some KML files contain characters that cause XML parsing issues.
-         This function replaces or removes problematic characters to ensure
-         successful XML parsing.
- 
-         Args:
-             content: Raw XML content string
- 
-         Returns:
-             Cleaned XML content string
-         """
-         # Replace problematic Spanish characters that cause XML parsing issues
-         content = content.replace('&ntilde;', 'n')
-         content = content.replace('&Ntilde;', 'N')
-         content = content.replace('ñ', 'n')
-         content = content.replace('Ñ', 'N')
- 
-         # Remove other invalid XML characters using regex
-         # Keep only valid XML characters: tab, newline, carriage return, printable ASCII, and extended Latin
-         content = re.sub(r'[^\x09\x0A\x0D\x20-\x7E\x85\xA0-\xFF]', '', content)
-         return content
- 
-     def haversine_distance(lon1: float, lat1: float, lon2: float, lat2: float) -> float:
-         """
-         Calculate the great circle distance between two points on Earth.
- 
-         Uses the Haversine formula to calculate the shortest distance between
-         two points on a sphere (Earth) given their latitude and longitude.
- 
-         Args:
-             lon1, lat1: Coordinates of first point
-             lon2, lat2: Coordinates of second point
- 
-         Returns:
-             Distance in kilometers
-         """
-         R = 6371  # Earth's radius in kilometers
- 
-         # Convert coordinates to radians
-         lat1, lon1, lat2, lon2 = map(radians, [lat1, lon1, lat2, lon2])
-         dlat = lat2 - lat1
-         dlon = lon2 - lon1
- 
-         # Haversine formula calculation
-         a = sin(dlat/2)**2 + cos(lat1) * cos(lat2) * sin(dlon/2)**2
-         c = 2 * atan2(sqrt(a), sqrt(1-a))
-         return R * c
- 
-     def parse_coordinates(point_text: str) -> Tuple[float, float, float]:
-         """
-         Parse coordinates from KML Point text.
- 
-         KML Point elements contain coordinates in the format "longitude,latitude,elevation".
-         This function extracts and converts these values to float.
- 
-         Args:
-             point_text: Raw coordinate text from KML Point element
- 
-         Returns:
-             Tuple of (latitude, longitude, elevation) or None if parsing fails
-         """
-         try:
-             coords = point_text.strip().split(',')
-             if len(coords) >= 2:
-                 lon, lat = map(float, coords[:2])
-                 elevation = float(coords[2]) if len(coords) > 2 else 0
-                 return lat, lon, elevation
-         except (ValueError, IndexError):
-             pass
-         return None
- 
-     def parse_station_from_description(desc: str, point_coords: Optional[Tuple[float, float, float]] = None) -> Dict:
-         """
-         Parse station metadata from KML description.
- 
-         KML description fields contain detailed station information including:
-         - Download URL for EPW file
-         - Coordinates in degrees/minutes format
-         - Station metadata (WMO code, climate zone, etc.)
-         - Design conditions and climate statistics
- 
-         Args:
-             desc: KML description text containing station metadata
-             point_coords: Fallback coordinates from KML Point element
- 
-         Returns:
-             Dictionary with parsed station metadata or None if parsing fails
-         """
-         if not desc:
-             return None
- 
-         # Extract download URL - this is required for station to be valid
-         url_match = re.search(r'URL (https://.*?\.zip)', desc)
-         if not url_match:
-             return None
- 
-         url = url_match.group(1)
- 
-         # First try to parse coordinates in degrees/minutes format from description
-         # Format: N XX°YY.YY' W ZZ°AA.AA'
-         coord_match = re.search(r'([NS]) (\d+)&deg;\s*(\d+\.\d+)\'.*?([EW]) (\d+)&deg;\s*(\d+\.\d+)\'', desc)
- 
-         if coord_match:
-             # Convert degrees/minutes to decimal degrees
-             ns, lat_deg, lat_min, ew, lon_deg, lon_min = coord_match.groups()
-             lat = float(lat_deg) + float(lat_min)/60
-             if ns == 'S':
-                 lat = -lat
-             lon = float(lon_deg) + float(lon_min)/60
-             if ew == 'W':
-                 lon = -lon
-         elif point_coords:
-             # Fall back to coordinates from KML Point element
-             lat, lon, _ = point_coords
-         else:
-             # No coordinates available - station is not usable
-             return None
- 
-         # Extract metadata with error handling using helper function
-         def extract_value(pattern: str, default: str = None) -> str:
-             """Extract value using regex pattern, return default if not found."""
-             match = re.search(pattern, desc)
-             return match.group(1) if match else default
- 
-         # Build comprehensive station metadata dictionary
-         metadata = {
-             'url': url,
-             'longitude': lon,
-             'latitude': lat,
-             'elevation': int(extract_value(r'Elevation <b>(-?\d+)</b>', '0')),
-             'name': extract_value(r'<b>(.*?)</b>'),
-             'wmo': extract_value(r'WMO <b>(\d+)</b>'),
-             'climate_zone': extract_value(r'Climate Zone <b>(.*?)</b>'),
-             'period': extract_value(r'Period of Record=(\d{4}-\d{4})'),
-             'heating_db': extract_value(r'99% Heating DB <b>(.*?)</b>'),
-             'cooling_db': extract_value(r'1% Cooling DB <b>(.*?)</b>'),
-             'hdd18': extract_value(r'HDD18 <b>(\d+)</b>'),
-             'cdd10': extract_value(r'CDD10 <b>(\d+)</b>'),
-             'time_zone': extract_value(r'Time Zone {GMT <b>([-+]?\d+\.\d+)</b>')
-         }
- 
-         return metadata
- 
-     def try_download_station_zip(original_url: str, timeout_s: int = 30) -> Optional[bytes]:
-         """
-         Try downloading station archive; on 404s, attempt smart fallbacks.
- 
-         Fallback strategies:
-         - Country rename: /TUR_Turkey/ -> /TUR_Turkiye/ (per Oct 2024 site update)
-         - TMYx period variants: .2009-2023.zip, .2007-2021.zip, .zip, .2004-2018.zip
- 
-         Args:
-             original_url: URL extracted from KML
-             timeout_s: request timeout seconds
-         Returns:
-             Bytes of the downloaded zip on success, otherwise None
-         """
-         def candidate_urls(url: str) -> List[str]:
-             urls = []
-             urls.append(url)
-             # Country rename variants
-             if "/TUR_Turkey/" in url:
-                 urls.append(url.replace("/TUR_Turkey/", "/TUR_Turkiye/"))
-             if "/TUR_Turkiye/" in url:
-                 urls.append(url.replace("/TUR_Turkiye/", "/TUR_Turkey/"))
-             # TMYx period variants
-             m = re.search(r"(.*_TMYx)(?:\.(\d{4}-\d{4}))?\.zip$", url)
-             if m:
-                 base = m.group(1)
-                 suffix = m.group(2)
-                 variants = [
-                     f"{base}.2009-2023.zip",
-                     f"{base}.2007-2021.zip",
-                     f"{base}.zip",
-                     f"{base}.2004-2018.zip",
-                 ]
-                 for v in variants:
-                     if v not in urls:
-                         urls.append(v)
-                 # Also apply country rename to each variant
-                 extra = []
-                 for v in variants:
-                     if "/TUR_Turkey/" in url:
-                         extra.append(v.replace("/TUR_Turkey/", "/TUR_Turkiye/"))
-                     if "/TUR_Turkiye/" in url:
-                         extra.append(v.replace("/TUR_Turkiye/", "/TUR_Turkey/"))
-                 for v in extra:
-                     if v not in urls:
-                         urls.append(v)
-             return urls
- 
-         tried = set()
-         for u in candidate_urls(original_url):
-             if u in tried:
-                 continue
-             tried.add(u)
-             try:
-                 resp = requests.get(u, timeout=timeout_s, verify=ssl_verify)
-                 resp.raise_for_status()
-                 return resp.content
-             except requests.exceptions.SSLError:
-                 # Retry with user-controlled insecure SSL
-                 if allow_insecure_ssl:
-                     try:
-                         resp = requests.get(u, timeout=timeout_s, verify=False)
-                         resp.raise_for_status()
-                         return resp.content
-                     except requests.exceptions.RequestException:
-                         if allow_http_fallback and u.lower().startswith("https://"):
-                             insecure_url = "http://" + u.split("://", 1)[1]
-                             try:
-                                 resp = requests.get(insecure_url, timeout=timeout_s)
-                                 resp.raise_for_status()
-                                 return resp.content
-                             except requests.exceptions.RequestException:
-                                 pass
-                         continue
-                 else:
-                     if allow_http_fallback and u.lower().startswith("https://"):
-                         insecure_url = "http://" + u.split("://", 1)[1]
-                         try:
-                             resp = requests.get(insecure_url, timeout=timeout_s)
-                             resp.raise_for_status()
-                             return resp.content
-                         except requests.exceptions.RequestException:
-                             pass
-                     continue
-             except requests.exceptions.HTTPError as he:
-                 # Only continue on 404; raise on other HTTP errors
-                 if getattr(he.response, "status_code", None) == 404:
-                     continue
-                 else:
-                     raise
-             except requests.exceptions.RequestException:
-                 # On network errors, try next candidate
-                 continue
-         return None
- 
-     def get_stations_from_kml(kml_url: str) -> List[Dict]:
-         """
-         Get weather stations from a KML file.
- 
-         Downloads and parses a KML file containing weather station information.
-         Each Placemark in the KML represents a weather station with metadata
-         in the description field and coordinates in Point elements.
- 
-         Args:
-             kml_url: URL to the KML file
- 
-         Returns:
-             List of dictionaries containing station metadata
-         """
-         try:
-             # Download KML file with timeout (secure first)
-             try:
-                 response = requests.get(kml_url, timeout=30, verify=ssl_verify)
-                 response.raise_for_status()
-             except requests.exceptions.SSLError:
-                 if allow_insecure_ssl:
-                     # Retry with certificate verification disabled (last resort)
-                     try:
-                         response = requests.get(kml_url, timeout=30, verify=False)
-                         response.raise_for_status()
-                     except requests.exceptions.RequestException:
-                         # Try HTTP fallback if original was HTTPS and allowed
-                         if allow_http_fallback and kml_url.lower().startswith("https://"):
-                             insecure_url = "http://" + kml_url.split("://", 1)[1]
-                             response = requests.get(insecure_url, timeout=30)
-                             response.raise_for_status()
-                         else:
-                             raise
-                 else:
-                     # Try HTTP fallback only if allowed and original was HTTPS
-                     if allow_http_fallback and kml_url.lower().startswith("https://"):
-                         insecure_url = "http://" + kml_url.split("://", 1)[1]
-                         response = requests.get(insecure_url, timeout=30)
-                         response.raise_for_status()
-                     else:
-                         raise
- 
-             # Try to decode content with multiple encodings
-             content = try_decode(response.content)
-             content = clean_xml(content)
- 
-             # Parse XML content
-             try:
-                 root = ET.fromstring(content.encode('utf-8'))
-             except ET.ParseError as e:
-                 print(f"Error parsing KML file {kml_url}: {e}")
-                 return []
- 
-             # Define KML namespace for element searching
-             ns = {'kml': 'http://earth.google.com/kml/2.1'}
- 
-             stations = []
- 
-             # Find all Placemark elements (each represents a weather station)
-             for placemark in root.findall('.//kml:Placemark', ns):
-                 name = placemark.find('kml:name', ns)
-                 desc = placemark.find('kml:description', ns)
-                 point = placemark.find('.//kml:Point/kml:coordinates', ns)
- 
-                 # Skip placemarks without description or that don't contain weather data
-                 if desc is None or not desc.text or "Data Source" not in desc.text:
-                     continue
- 
-                 # Get coordinates from Point element if available
-                 point_coords = None
-                 if point is not None and point.text:
-                     point_coords = parse_coordinates(point.text)
- 
-                 # Parse comprehensive station data from description
-                 station_data = parse_station_from_description(desc.text, point_coords)
-                 if station_data:
-                     # Add station name and source information
-                     station_data['name'] = name.text if name is not None else "Unknown"
-                     station_data['kml_source'] = kml_url
-                     stations.append(station_data)
- 
-             return stations
- 
-         except requests.exceptions.RequestException as e:
-             print(f"Error accessing KML file {kml_url}: {e}")
-             return []
-         except Exception as e:
-             print(f"Error processing KML file {kml_url}: {e}")
-             return []
- 
-     try:
-         # Create output directory if it doesn't exist
-         Path(output_dir).mkdir(parents=True, exist_ok=True)
- 
-         # Determine which regions to scan based on user input or auto-detection
-         regions_to_scan = {}
-         def _add_selection(selection_name: str, mapping: Dict[str, str], out: Dict[str, str]):
-             """Expand a region or dataset selection into concrete KML URLs."""
-             if selection_name in REGION_DATASET_GROUPS:
-                 for key in REGION_DATASET_GROUPS[selection_name]:
-                     if key in KML_SOURCES:
-                         out[key] = KML_SOURCES[key]
-             elif selection_name in KML_SOURCES:
-                 out[selection_name] = KML_SOURCES[selection_name]
-             else:
-                 valid = sorted(list(REGION_DATASET_GROUPS.keys()) + list(KML_SOURCES.keys()))
-                 raise ValueError(f"Invalid region/dataset: '{selection_name}'. Valid options include: {', '.join(valid)}")
- 
-         if region is None:
-             # Auto-detect regions based on coordinates
-             detected_regions = detect_regions(longitude, latitude)
- 
-             if detected_regions:
-                 print(f"Auto-detected regions: {', '.join(detected_regions)}")
-                 for r in detected_regions:
-                     _add_selection(r, KML_SOURCES, regions_to_scan)
-             else:
-                 # Fallback to all regions if detection fails
-                 print("Could not determine region from coordinates. Scanning all regions.")
-                 regions_to_scan = dict(KML_SOURCES)
-         elif isinstance(region, str):
-             # Handle string input for region selection
-             if region.lower() == "all":
-                 regions_to_scan = dict(KML_SOURCES)
-             else:
-                 _add_selection(region, KML_SOURCES, regions_to_scan)
-         else:
-             # Handle list input for multiple regions
-             for r in region:
-                 _add_selection(r, KML_SOURCES, regions_to_scan)
- 
-         # Get stations from selected KML sources
-         print("Fetching weather station data from Climate.OneBuilding.Org...")
-         all_stations = []
- 
-         # Process each selected region
-         scanned_urls = set()
-         for region_name, url in regions_to_scan.items():
-             if url in scanned_urls:
-                 continue
-             scanned_urls.add(url)
-             print(f"Scanning {region_name}...")
-             stations = get_stations_from_kml(url)
-             all_stations.extend(stations)
-             print(f"Found {len(stations)} stations in {region_name}")
- 
-         print(f"\nTotal stations found: {len(all_stations)}")
- 
-         if not all_stations:
-             # Fallback: if no stations found, try scanning all available datasets
-             if not (isinstance(region, str) and region.lower() == "all"):
-                 print("No stations found from detected/selected regions. Falling back to global scan...")
-                 regions_to_scan = dict(KML_SOURCES)
-                 all_stations = []
-                 scanned_urls = set()
-                 for region_name, url in regions_to_scan.items():
-                     if url in scanned_urls:
-                         continue
-                     scanned_urls.add(url)
-                     print(f"Scanning {region_name}...")
-                     stations = get_stations_from_kml(url)
-                     all_stations.extend(stations)
-                     print(f"Found {len(stations)} stations in {region_name}")
-                 print(f"\nTotal stations found after global scan: {len(all_stations)}")
-             if not all_stations:
-                 raise ValueError("No weather stations found")
- 
-         # Calculate distances from target coordinates to all stations
-         stations_with_distances = [
-             (station, haversine_distance(longitude, latitude, station['longitude'], station['latitude']))
-             for station in all_stations
-         ]
- 
-         # Filter by maximum distance if specified
-         if max_distance is not None:
-             close_stations = [
-                 (station, distance)
-                 for station, distance in stations_with_distances
-                 if distance <= max_distance
-             ]
-             if not close_stations:
-                 # If no stations within max_distance, find the closest one anyway
-                 closest_station, min_distance = min(stations_with_distances, key=lambda x: x[1])
-                 print(f"\nNo stations found within {max_distance} km. Closest station is {min_distance:.1f} km away.")
-                 print("Using closest available station.")
-                 stations_with_distances = [(closest_station, min_distance)]
-             else:
-                 stations_with_distances = close_stations
- 
-         # Find the nearest weather station
-         nearest_station, distance = min(stations_with_distances, key=lambda x: x[1])
- 
-         # Download the EPW archive from the nearest station with fallbacks
-         print(f"\nDownloading EPW file for {nearest_station['name']}...")
-         archive_bytes = try_download_station_zip(nearest_station['url'], timeout_s=30)
-         if archive_bytes is None:
-             raise ValueError(f"Failed to download EPW archive from station URL and fallbacks: {nearest_station['url']}")
- 
-         # Create a temporary directory for zip extraction
-         temp_dir = Path(output_dir) / "temp"
-         temp_dir.mkdir(parents=True, exist_ok=True)
- 
-         # Save the downloaded zip file temporarily
-         zip_file = temp_dir / "weather_data.zip"
-         with open(zip_file, 'wb') as f:
-             f.write(archive_bytes)
- 
-         final_epw = None
-         try:
-             # Extract the EPW file from the zip archive
-             if extract_zip:
-                 with zipfile.ZipFile(zip_file, 'r') as zip_ref:
-                     # Find the EPW file in the archive (should be exactly one)
-                     epw_files = [f for f in zip_ref.namelist() if f.lower().endswith('.epw')]
-                     if not epw_files:
-                         raise ValueError("No EPW file found in the downloaded archive")
- 
-                     # Extract the EPW file
-                     epw_filename = epw_files[0]
-                     extracted_epw = safe_extract(zip_ref, epw_filename, temp_dir)
- 
-                     # Move the EPW file to the final location with cleaned filename
-                     final_epw = Path(output_dir) / f"{nearest_station['name'].replace(' ', '_').replace(',', '').lower()}.epw"
-                     final_epw = safe_rename(extracted_epw, final_epw)
-         finally:
-             # Clean up temporary files regardless of success or failure
-             try:
-                 if zip_file.exists():
-                     zip_file.unlink()
-                 if temp_dir.exists() and not any(temp_dir.iterdir()):
-                     temp_dir.rmdir()
-             except Exception as e:
-                 print(f"Warning: Could not clean up temporary files: {e}")
- 
-         if final_epw is None:
-             raise ValueError("Failed to extract EPW file")
- 
-         # Save station metadata alongside the EPW file
-         metadata_file = final_epw.with_suffix('.json')
-         with open(metadata_file, 'w') as f:
-             json.dump(nearest_station, f, indent=2)
- 
-         # Print comprehensive station information
-         print(f"\nDownloaded EPW file for {nearest_station['name']}")
-         print(f"Distance: {distance:.2f} km")
-         print(f"Station coordinates: {nearest_station['longitude']}, {nearest_station['latitude']}")
-         if nearest_station['wmo']:
-             print(f"WMO: {nearest_station['wmo']}")
-         if nearest_station['climate_zone']:
-             print(f"Climate zone: {nearest_station['climate_zone']}")
-         if nearest_station['period']:
-             print(f"Data period: {nearest_station['period']}")
-         print(f"Files saved:")
-         print(f"- EPW: {final_epw}")
-         print(f"- Metadata: {metadata_file}")
- 
-         # Load the EPW data into DataFrame if requested
-         df = None
-         headers = None
-         if load_data:
-             print("\nLoading EPW data...")
-             df, headers = process_epw(final_epw)
-             print(f"Loaded {len(df)} hourly records")
- 
-         return str(final_epw), df, headers
- 
-     except Exception as e:
-         print(f"Error processing data: {e}")
-         return None, None, None
- 
- # =============================================================================
- # SOLAR SIMULATION UTILITIES
- # =============================================================================
- 
- def read_epw_for_solar_simulation(epw_file_path):
-     """
-     Read EPW file specifically for solar simulation purposes.
- 
-     This function extracts essential solar radiation data and location metadata
-     from an EPW file for use in solar energy calculations. It focuses on the
-     Direct Normal Irradiance (DNI) and Diffuse Horizontal Irradiance (DHI)
-     which are the primary inputs for solar simulation models.
- 
-     Args:
-         epw_file_path: Path to the EPW weather file
- 
-     Returns:
-         Tuple containing:
-             - DataFrame with time-indexed DNI and DHI data
-             - Longitude (degrees)
-             - Latitude (degrees)
-             - Time zone offset (hours from UTC)
-             - Elevation (meters above sea level)
- 
-     Raises:
-         ValueError: If LOCATION line not found or data parsing fails
-     """
-     # Validate input path
-     if epw_file_path is None:
-         raise TypeError("EPW file path is None. Provide a valid path or ensure download succeeded.")
-     epw_path_obj = Path(epw_file_path)
-     if not epw_path_obj.exists() or not epw_path_obj.is_file():
-         raise FileNotFoundError(f"EPW file not found: {epw_file_path}")
- 
-     # Read the entire EPW file
-     with open(epw_path_obj, 'r', encoding='utf-8') as f:
-         lines = f.readlines()
- 
-     # Find the LOCATION line (first line in EPW format)
-     location_line = None
-     for line in lines:
-         if line.startswith("LOCATION"):
-             location_line = line.strip().split(',')
-             break
- 
-     if location_line is None:
-         raise ValueError("Could not find LOCATION line in EPW file.")
- 
-     # Parse LOCATION line format:
-     # LOCATION,City,State/Country,Country,DataSource,WMO,Latitude,Longitude,Time Zone,Elevation
-     # Example: LOCATION,Marina.Muni.AP,CA,USA,SRC-TMYx,690070,36.68300,-121.7670,-8.0,43.0
-     lat = float(location_line[6])
-     lon = float(location_line[7])
-     tz = float(location_line[8])  # local standard time offset from UTC
-     elevation_m = float(location_line[9])
- 
-     # Find start of weather data (after 8 header lines)
-     data_start_index = None
-     for i, line in enumerate(lines):
-         vals = line.strip().split(',')
-         # Weather data lines have more than 30 columns and start after line 8
-         if i >= 8 and len(vals) > 30:
-             data_start_index = i
-             break
- 
-     if data_start_index is None:
-         raise ValueError("Could not find start of weather data lines in EPW file.")
- 
-     # Parse weather data focusing on solar radiation components
-     data = []
-     for l in lines[data_start_index:]:
-         vals = l.strip().split(',')
-         if len(vals) < 15:  # Skip malformed lines
-             continue
-         # Extract time components and solar radiation data
-         year = int(vals[0])
-         month = int(vals[1])
-         day = int(vals[2])
-         hour = int(vals[3]) - 1  # Convert EPW 1-24 hours to 0-23
-         dni = float(vals[14])  # Direct Normal Irradiance (Wh/m²)
-         dhi = float(vals[15])  # Diffuse Horizontal Irradiance (Wh/m²)
- 
-         # Create pandas timestamp for time series indexing
-         timestamp = pd.Timestamp(year, month, day, hour)
-         data.append([timestamp, dni, dhi])
- 
-     # Create DataFrame with time index for efficient time series operations
-     df = pd.DataFrame(data, columns=['time', 'DNI', 'DHI']).set_index('time')
-     df = df.sort_index()
- 
-     return df, lon, lat, tz, elevation_m
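For reference, a minimal usage sketch of the removed module as it stood in 0.6.26, based solely on the signatures shown above; the coordinates are illustrative values, not taken from the package:

    # Download the nearest EPW file, then read it back for a solar simulation.
    from voxcity.utils.weather import (
        get_nearest_epw_from_climate_onebuilding,
        read_epw_for_solar_simulation,
    )

    # Example coordinates (central Tokyo); any lon/lat pair works.
    epw_path, df, headers = get_nearest_epw_from_climate_onebuilding(
        longitude=139.76, latitude=35.68,
        output_dir="./weather", max_distance=100.0,
    )
    if epw_path is not None:
        # headers['LOCATION'] is parsed into a dict when the header is well-formed
        print(headers['LOCATION'])
        print(df['Dry Bulb Temperature'].mean())

        # Hourly DNI/DHI plus site metadata, the inputs to the solar simulator
        solar_df, lon, lat, tz, elevation_m = read_epw_for_solar_simulation(epw_path)
        print(solar_df[['DNI', 'DHI']].head())

In 1.0.2 this functionality moves into the voxcity/utils/weather/ package (epw.py, files.py, onebuilding.py) per the file list at the top.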