hspf-2.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
hspf/wdm.py ADDED
@@ -0,0 +1,355 @@
1
+ ''' Copyright (c) 2020 by RESPEC, INC.
2
+ Author: Robert Heaphy, Ph.D.
3
+
4
+ Based on MATLAB program by Seth Kenner, RESPEC
5
+ License: LGPL2
6
+ '''
7
+
8
+ import numpy as np
9
+ import pandas as pd
10
+ #from numba import jit, njit
11
+ import datetime
12
+ from pathlib import Path
13
+ # look up attribute name, data type ('I' integer, 'R' real, 'S' string) and data length by attribute number
14
+ attrinfo = {1:('TSTYPE','S',4), 2:('STAID','S',16), 11:('DAREA','R',1),
15
+ 17:('TCODE','I',1), 27:('TSBYR','I',1), 28:('TSBMO','I',1),
16
+ 29:('TSBDY','I',1), 30:('TSBHR','I',1), 32:('TFILL', 'R',1),
17
+ 33:('TSSTEP','I',1), 34:('TGROUP','I',1), 45:('STNAM','S',48),
18
+ 83:('COMPFG','I',1), 84:('TSFORM','I',1), 85:('VBTIME','I',1),
19
+ 444:('DATMOD','S',12), 443:('DATCRE','S',12), 22:('DCODE','I',1),
20
+ 10:('DESCRP','S', 80), 7:('ELEV','R',1), 8:('LATDEG','R',1),
21
+ 9:('LNGDEG','R',1), 288:('SCENARIO','S',8), 289:('CONSTITUENT','S',8),
22
+ 290:('LOCATION','S',8)}
23
+
24
+ freq = {7:'100YS', 6:'YS', 5:'MS', 4:'D', 3:'H', 2:'min', 1:'S'} # pandas date_range() frequency by TCODE, TGROUP
25
+
26
+
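# Illustrative sketch, not part of the published module: how an entry in the
# attrinfo table above is read. Attribute id 1 is TSTYPE, stored as a
# 4-character string; attribute id 17 is TCODE, stored as a single integer.
def _example_attrinfo_lookup():
    name, atype, length = attrinfo[1]     # ('TSTYPE', 'S', 4)
    assert (name, atype, length) == ('TSTYPE', 'S', 4)
    name, atype, length = attrinfo[17]    # ('TCODE', 'I', 1)
    assert atype == 'I' and length == 1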
27
+ class wdmInterface():
28
+ def __init__(self,file_paths:list):
29
+ #self.names = [file_path for file_path in file_paths]
30
+ self.wdms = {Path(file_path).name:hdf5WDM(Path(file_path).with_suffix('.hdf5')) for file_path in file_paths}
31
+ self.filepaths = {Path(file_path).name:Path(file_path) for file_path in file_paths}
32
+
33
+ def series(self, wdm_file,dsn):
34
+ return self.wdms[wdm_file].series(dsn)
35
+
36
+
37
+
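# Illustrative usage sketch, not part of the published module; the file names
# and DSN below are hypothetical. wdmInterface keys its readers by the original
# file name and expects a pre-converted companion .hdf5 file next to each .wdm
# path (see hdf5WDM below).
def _example_wdm_interface():
    interface = wdmInterface(['met_data.wdm', 'flow_data.wdm'])
    ts = interface.series('met_data.wdm', 39)   # pandas Series for DSN 39
    return ts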
38
+ class hdf5WDM():
39
+ def __init__(self, wdm_path):
40
+ self.wdm_path = Path(wdm_path)
41
+
42
+ df = pd.read_hdf(wdm_path, '/TIMESERIES/SUMMARY')
43
+ df = df.reset_index(drop=False,names='hdf5_name')
44
+ df.index = df['hdf5_name'].str[2:].astype(int)
45
+ self.summary = df
46
+
47
+ def series(self,dsn):
48
+ hdf5_name = self.summary.loc[dsn,'hdf5_name']
49
+ return pd.read_hdf(self.wdm_path,f'/TIMESERIES/{hdf5_name}')
50
+
51
+
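# Illustrative sketch, not part of the published module; the file name and DSN
# are hypothetical. hdf5WDM assumes the HDF5 file holds a '/TIMESERIES/SUMMARY'
# table whose index values carry the data-set number after a two-character
# prefix (e.g. 'TS039'), plus one '/TIMESERIES/<name>' series per data set.
def _example_hdf5_wdm():
    reader = hdf5WDM('met_data.hdf5')
    print(reader.summary.head())   # one row per data set, indexed by DSN
    return reader.series(39)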
52
+ class WDM():
53
+ def __init__(self,wdmfile):
54
+ self.name = wdmfile
55
+ self._iarray = np.fromfile(wdmfile, dtype=np.int32)
56
+ self._farray = np.fromfile(wdmfile, dtype=np.float32)
57
+
58
+ if self._iarray[0] != -998:
59
+ raise ValueError('Provided file does not match WDM format. First int32 should be -998.')
60
+ self.nrecords = self._iarray[28] # first record is File Definition Record
61
+ self.ntimeseries = self._iarray[31]
62
+
63
+ dsnlist = {}
64
+ for index in range(512, self.nrecords * 512, 512):
65
+ if not (self._iarray[index]==0 and self._iarray[index+1]==0 and self._iarray[index+2]==0 and self._iarray[index+3]==0) and self._iarray[index+5]==1:
66
+ dsnlist[self._iarray[index+4]] = index
67
+ #dsnlist.append(index)
68
+ if len(dsnlist.keys()) != self.ntimeseries:
69
+ print(f'Warning: wrong number of time series records found; expected {self.ntimeseries}, found {len(dsnlist)}')
70
+
71
+ self.dsnlist = dsnlist
72
+ self.dsns = list(self.dsnlist.keys())
73
+ self.columns = check_columns(self.dsnlist.values(),self._iarray,self._farray)
74
+ self.summary = None #pd.DataFrame(columns = self.columns)
75
+ self.data = {}
76
+
77
+ def series(self,dsn):
78
+ if dsn in self.data:
79
+ return self.data[dsn]
80
+ else:
81
+ summary,series = get_series(self.dsnlist[dsn],self._iarray,self._farray,self.columns)
82
+ self.summary = pd.concat([self.summary,summary])
83
+ self.data[dsn] = series
84
+ return self.data[dsn]
85
+
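# Illustrative usage sketch, not part of the published module; the file name is
# hypothetical. WDM reads the binary .wdm file directly and caches each decoded
# series, so repeated calls to series() for the same DSN are cheap.
def _example_wdm_binary():
    wdm = WDM('met_data.wdm')           # raises ValueError if not a WDM file
    first_dsn = wdm.dsns[0]             # data-set numbers found in the file
    ts = wdm.series(first_dsn)          # pandas Series indexed by timestamp
    print(wdm.summary.loc[first_dsn])   # Start, Stop, Freq, TSTYPE, ...
    return ts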
86
+ def check_columns(dsnlist,iarray,farray):
87
+ # determine which optional attributes are present on every dsn; only those are added as summary columns
88
+ columns_to_add = []
89
+ search = ['STAID', 'STNAM', 'SCENARIO', 'CONSTITUENT', 'LOCATION']
90
+ for att in search:
91
+ found_in_all = True
92
+ for index in dsnlist:
93
+ dattr = {}
94
+ psa = iarray[index + 9]
95
+ if psa > 0:
96
+ sacnt = iarray[index + psa - 1]
97
+ for i in range(psa + 1, psa + 1 + 2 * sacnt, 2):
98
+ id = iarray[index + i]
99
+ ptr = iarray[index + i + 1] - 1 + index
100
+ if id not in attrinfo:
101
+ continue
102
+ name, atype, length = attrinfo[id]
103
+ if atype == 'I':
104
+ dattr[name] = iarray[ptr]
105
+ elif atype == 'R':
106
+ dattr[name] = farray[ptr]
107
+ else:
108
+ dattr[name] = ''.join([_inttostr(iarray[k]) for k in range(ptr, ptr + length // 4)]).strip()
109
+ if att not in dattr:
110
+ found_in_all = False
111
+ if found_in_all:
112
+ columns_to_add.append(att)
113
+ return columns_to_add
114
+
115
+
116
+
117
+
118
+
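# Illustrative sketch, not part of the published module: check_columns() keeps
# only the optional attributes present on every DSN, so the summary table gets
# a consistent set of columns. The same idea with plain Python sets:
def _example_common_attributes():
    per_dsn_attrs = [{'STAID', 'STNAM', 'LOCATION'}, {'STAID', 'STNAM'}]
    search = ['STAID', 'STNAM', 'SCENARIO', 'CONSTITUENT', 'LOCATION']
    common = [a for a in search if all(a in attrs for attrs in per_dsn_attrs)]
    assert common == ['STAID', 'STNAM']
    return common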
119
+ def get_series(dsn_index,iarray,farray,columns_to_add):
120
+
121
+ date_epoch = np.datetime64(0,'Y')
122
+ dt_year = np.timedelta64(1, 'Y')
123
+ dt_month = np.timedelta64(1, 'M')
124
+ dt_day = np.timedelta64(1, 'D')
125
+ dt_hour = np.timedelta64(1, 'h')
126
+ dt_minute = np.timedelta64(1, 'm')
127
+ dt_second = np.timedelta64(1, 's')
128
+
129
+ index = dsn_index
130
+ # get layout information for TimeSeries Dataset frame
131
+ dsn = iarray[index+4]
132
+ psa = iarray[index+9]
133
+ if psa > 0:
134
+ sacnt = iarray[index+psa-1]
135
+ pdat = iarray[index+10]
136
+ pdatv = iarray[index+11]
137
+
138
+ print(f'reading dsn {dsn} from wdm')
139
+ # get attributes
140
+ dattr = {'TSBDY':1, 'TSBHR':1, 'TSBMO':1, 'TSBYR':1900, 'TFILL':-999.} # preset defaults
141
+ for i in range(psa+1, psa+1 + 2*sacnt, 2):
142
+ id = iarray[index + i]
143
+ ptr = iarray[index + i + 1] - 1 + index
144
+ if id not in attrinfo:
145
+ # print('PROGRAM ERROR: ATTRIBUTE INDEX not found', id, 'Attribute pointer', iarray[index + i+1])
146
+ continue
147
+
148
+ name, atype, length = attrinfo[id]
149
+ if atype == 'I':
150
+ dattr[name] = iarray[ptr]
151
+ elif atype == 'R':
152
+ dattr[name] = farray[ptr]
153
+ else:
154
+ dattr[name] = ''.join([_inttostr(iarray[k]) for k in range(ptr, ptr + length//4)]).strip()
155
+
156
+ # Get timeseries timebase data
157
+ records = []
158
+ offsets = []
159
+ for i in range(pdat+1, pdatv-1):
160
+ a = iarray[index+i]
161
+ if a != 0:
162
+ record, offset = _splitposition(a)
163
+ records.append(record)
164
+ offsets.append(offset)
165
+ # if len(records) == 0:
166
+ # continue
167
+
168
+ # calculate number of data points in each group, tindex is final index for storage
169
+ tgroup = dattr['TGROUP']
170
+ tstep = dattr['TSSTEP']
171
+ tcode = dattr['TCODE']
172
+
173
+ records = np.asarray(records)
174
+ offsets = np.asarray(offsets)
175
+
176
+ dates, values, stop_datetime = _process_groups(iarray, farray, records, offsets, tgroup)
177
+ stop_datetime = datetime.datetime(*_bits_to_date(stop_datetime))
178
+ dates = np.array(dates)
179
+ dates_converted = _date_convert(dates, date_epoch, dt_year, dt_month, dt_day, dt_hour, dt_minute, dt_second)
180
+ series = pd.Series(values, index=dates_converted)
181
+
182
+ try:
183
+ series.index.freq = str(tstep) + freq[tcode]
184
+ except ValueError:
185
+ series.index.freq = None
186
+
187
+ data = [
188
+ str(series.index[0]), str(stop_datetime), str(tstep) + freq[tcode],
189
+ len(series), dattr['TSTYPE'], dattr['TFILL']
190
+ ]
191
+ columns = ['Start', 'Stop', 'Freq','Length', 'TSTYPE', 'TFILL']
192
+ for x in columns_to_add:
193
+ if x in dattr:
194
+ data.append(dattr[x])
195
+ columns.append(x)
196
+
197
+ summary = pd.DataFrame({k:[v] for k,v in zip(columns,data)},index = [dsn])
198
+ return summary,series
199
+
200
+
201
+
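# Illustrative sketch, not part of the published module: the shape of the
# objects returned by get_series(). The summary is a one-row DataFrame indexed
# by DSN; the series is a pandas Series indexed by timestamps. The wdm argument
# is assumed to be a WDM instance (see the class above).
def _example_get_series_result(wdm):
    dsn = wdm.dsns[0]
    summary, series = get_series(wdm.dsnlist[dsn], wdm._iarray, wdm._farray, wdm.columns)
    assert list(summary.index) == [dsn]
    assert summary.loc[dsn, 'Length'] == len(series)
    return summary, series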
202
+ #@njit
203
+ def _splitdate(x):
204
+ year = np.int64(x >> 14)
205
+ month = np.int64(x >> 10 & 0xF)
206
+ day = np.int64(x >> 5 & 0x1F)
207
+ hour = np.int64(x & 0x1F)
208
+ return _correct_date(year, month, day, hour, 0,0)
209
+
210
+ #@njit
211
+ def _splitcontrol(x):
212
+ nval = x >> 16
213
+ ltstep = x >> 10 & 0x3f
214
+ ltcode = x >> 7 & 0x7
215
+ comp = x >> 5 & 0x3
216
+ qual = x & 0x1f
217
+ return nval, ltstep, ltcode, comp, qual
218
+
219
+ #@njit
220
+ def _splitposition(x):
221
+ return (x >> 9) - 1, (x & 0x1FF) - 1  # zero-based (record, offset)
222
+
223
+ #@njit
224
+ def _inttostr(i):
225
+ return chr(i & 0xFF) + chr(i>>8 & 0xFF) + chr(i>>16 & 0xFF) + chr(i>>24 & 0xFF)
226
+
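# Illustrative sketch, not part of the published module: the packing that
# _splitposition() and _inttostr() undo. A block pointer stores a 1-based
# record number in the high bits and a 1-based word offset in the low 9 bits;
# strings are stored 4 characters per 32-bit word, least significant byte first.
def _example_bit_packing():
    packed = (3 + 1) << 9 | (10 + 1)   # record 3, offset 10 (zero-based)
    assert _splitposition(packed) == (3, 10)
    word = ord('F') | ord('L') << 8 | ord('O') << 16 | ord('W') << 24
    assert _inttostr(word) == 'FLOW'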
227
+ #@njit
228
+ def _bits_to_date(x):
229
+ year = x >> 26
230
+ month = x >> 22 & 0xf
231
+ day = x >> 17 & 0x1f
232
+ hour = x >> 12 & 0x1f
233
+ minute = x >> 6 & 0x3f
234
+ second = x & 0x3f
235
+ return year, month, day, hour, minute, second
236
+
237
+ #@njit
238
+ def _date_to_bits(year, month, day, hour, minute, second):
239
+ x = year << 26 | month << 22 | day << 17 | hour << 12 | minute << 6 | second
240
+ return x
241
+
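# Illustrative sketch, not part of the published module: _date_to_bits() and
# _bits_to_date() are exact inverses, packing a timestamp into one integer with
# 6 bits each for seconds and minutes, 5 for hours and days, 4 for months and
# the remaining high bits for the year.
def _example_date_bits_roundtrip():
    packed = _date_to_bits(1995, 7, 16, 23, 30, 15)
    assert _bits_to_date(packed) == (1995, 7, 16, 23, 30, 15)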
242
+ #@njit
243
+ def _increment_date(date, timecode, timestep):
244
+ year, month, day, hour, minute, second = _bits_to_date(date)
245
+
246
+ if timecode == 7: year += 100 * timestep
247
+ elif timecode == 6 : year += timestep
248
+ elif timecode == 5 : month += timestep
249
+ elif timecode == 4 : day += timestep
250
+ elif timecode == 3 : hour += timestep
251
+ elif timecode == 2 : minute += timestep
252
+ elif timecode == 1 : second += timestep
253
+
254
+ return _correct_date(year, month, day, hour, minute, second)
255
+
256
+ #@njit
257
+ def _correct_date(year, month, day, hour, minute, second):
258
+ while second >= 60:
259
+ second -= 60
260
+ minute += 1
261
+ while minute >= 60:
262
+ minute -= 60
263
+ hour += 1
264
+ while hour >= 24:
265
+ hour -= 24
266
+ day += 1
267
+ while day > _days_in_month(year, month):
268
+ day -= _days_in_month(year, month)
269
+ month += 1
270
+ while month > 12:
271
+ month -= 12
272
+ year += 1
273
+ return _date_to_bits(year, month, day, hour, minute, second)
274
+
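# Illustrative sketch, not part of the published module: _correct_date()
# normalises overflowed fields, cascading seconds into minutes, hours, days,
# months and years so that incremented dates stay valid.
def _example_correct_date():
    packed = _correct_date(2020, 12, 31, 23, 59, 61)   # rolls into the new year
    assert _bits_to_date(packed) == (2021, 1, 1, 0, 0, 1)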
275
+ #@njit
276
+ def _days_in_month(year, month):
277
+ if month > 12: month = (month - 1) % 12 + 1
278
+
279
+ if month in (1,3,5,7,8,10,12):
280
+ return 31
281
+ elif month in (4,6,9,11):
282
+ return 30
283
+ elif month == 2:
284
+ if _is_leapyear(year): return 29
285
+ else: return 28
286
+
287
+ #@njit
288
+ def _is_leapyear(year):
289
+ if year % 400 == 0:
290
+ return True
291
+ if year % 100 == 0:
292
+ return False
293
+ if year % 4 == 0:
294
+ return True
295
+ else:
296
+ return False
297
+
298
+ #@njit
299
+ def _date_convert(dates, date_epoch, dt_year, dt_month, dt_day, dt_hour, dt_minute, dt_second):
300
+ converted_dates = []
301
+ for x in dates:
302
+ year, month, day, hour, minute, second = _bits_to_date(x)
303
+ date = date_epoch
304
+ date += (year - 1970) * dt_year
305
+ date += (month - 1) * dt_month
306
+ date += (day - 1) * dt_day
307
+ date += hour * dt_hour
308
+ date += minute * dt_minute
309
+ date += second * dt_second
310
+ converted_dates.append(date)
311
+ return converted_dates
312
+
313
+ #@njit
314
+ def _process_groups(iarray, farray, records, offsets, tgroup):
315
+ date_array = [0]  # seed with a typed element so numba can infer the list type; dropped before return
316
+ value_array = [0.0]
317
+
318
+ for i in range(0,len(records)):
319
+ record = records[i]
320
+ offset = offsets[i]
321
+ index = record * 512 + offset
322
+ pscfwr = iarray[record * 512 + 3]  # pointer to the next record; 0 for the last record in the timeseries
323
+ current_date = _splitdate(iarray[index])
324
+ group_enddate = _increment_date(current_date, tgroup, 1)
325
+ offset +=1
326
+ index +=1
327
+
328
+ while current_date < group_enddate:
329
+ nval, ltstep, ltcode, comp, qual = _splitcontrol(iarray[index])
330
+ # compressed block: a single stored value repeated for every one of the nval timesteps
331
+ if comp == 1:
332
+ for i in range(0, nval, 1):
333
+ date_array.append(current_date)
334
+ current_date = _increment_date(current_date, ltcode, ltstep)
335
+ value_array.append(farray[index + 1])
336
+ index += 2
337
+ offset +=2
338
+ else:
339
+ for i in range(0, nval, 1):
340
+ date_array.append(current_date)
341
+ current_date = _increment_date(current_date, ltcode, ltstep)
342
+ value_array.append(farray[index + 1 + i])
343
+ index += 1 + nval
344
+ offset +=1 + nval
345
+
346
+ if offset >= 511:
347
+ offset = 4
348
+ index = (pscfwr - 1) * 512 + offset
349
+ record = pscfwr
350
+ pscfwr = iarray[(record - 1) * 512 + 3]  # pointer to the next record; 0 for the last record in the timeseries
351
+
352
+ date_array = date_array[1:]
353
+ value_array = value_array[1:]
354
+
355
+ return date_array, value_array, group_enddate
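# Illustrative end-to-end sketch, not part of the published module; the file
# name is hypothetical. _process_groups() returns parallel lists of packed
# dates and float values plus the end date of the last group, which
# get_series() above turns into a pandas Series and a reported stop time.
def _example_end_to_end(path='met_data.wdm'):
    wdm = WDM(path)
    return {dsn: wdm.series(dsn) for dsn in wdm.dsns}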