mpcaHydro 2.0.4__py3-none-any.whl → 2.0.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mpcaHydro/data/WISKI_QUALITY_CODES.csv +71 -0
- mpcaHydro/data/outlets.duckdb +0 -0
- mpcaHydro/data/stations_EQUIS.gpkg +0 -0
- mpcaHydro/data/stations_wiski.gpkg +0 -0
- mpcaHydro/data_manager.py +142 -314
- mpcaHydro/equis.py +488 -0
- mpcaHydro/etlSWD.py +4 -5
- mpcaHydro/etlWISKI.py +39 -23
- mpcaHydro/etlWPLMN.py +2 -2
- mpcaHydro/outlets.py +371 -0
- mpcaHydro/pywisk.py +381 -0
- mpcaHydro/reports.py +80 -0
- mpcaHydro/warehouse.py +581 -0
- mpcaHydro/warehouseManager.py +47 -0
- mpcaHydro/wiski.py +308 -0
- mpcaHydro/xref.py +74 -0
- {mpcahydro-2.0.4.dist-info → mpcahydro-2.0.6.dist-info}/METADATA +3 -1
- mpcahydro-2.0.6.dist-info/RECORD +23 -0
- {mpcahydro-2.0.4.dist-info → mpcahydro-2.0.6.dist-info}/WHEEL +1 -1
- mpcaHydro/WISKI.py +0 -352
- mpcaHydro/helpers.py +0 -0
- mpcahydro-2.0.4.dist-info/RECORD +0 -13
mpcaHydro/etlWISKI.py
CHANGED
|
@@ -6,10 +6,9 @@ Created on Tue Oct 3 08:04:49 2023
|
|
|
6
6
|
"""
|
|
7
7
|
|
|
8
8
|
import pandas as pd
|
|
9
|
-
from mpcaHydro
|
|
9
|
+
from mpcaHydro import pywisk
|
|
10
10
|
#from hspf_tools.orm.models import Station
|
|
11
11
|
import time
|
|
12
|
-
wiski = pyWISK()
|
|
13
12
|
|
|
14
13
|
|
|
15
14
|
'''
|
|
@@ -45,8 +44,8 @@ PARAMETERTYPE_MAP ={'11522': 'TP',
|
|
|
45
44
|
'11521': 'TKN',
|
|
46
45
|
'11500' : 'Q',
|
|
47
46
|
'11504': 'WT',
|
|
48
|
-
'11533': 'DO'
|
|
49
|
-
'11507':'WL'}
|
|
47
|
+
'11533': 'DO'}
|
|
48
|
+
# '11507':'WL'}
|
|
50
49
|
#STATIONPARAMETER_NOS = ['262*','450*','451*','863*','866*','5034' ,'5035','5005', '5004','5014' ,'5015','5024' ,'5025','5044' ,'5045']
|
|
51
50
|
STATIONPARAMETER_NOS = ['262*','450*','451*','863*','866*']
|
|
52
51
|
|
|
@@ -115,7 +114,12 @@ TS_NAME_SELECTOR = {'Q':{'Internal':{'daily':'20.Day.Mean.Archive',
|
|
|
115
114
|
'DO':{'Internal':{'daily':'20.Day.Mean',
|
|
116
115
|
'unit': '09.Archive'},
|
|
117
116
|
'External': {'daily': '20.Day.Mean',
|
|
118
|
-
'unit': '08.Provisional.Edited'}}
|
|
117
|
+
'unit': '08.Provisional.Edited'}},
|
|
118
|
+
'TRB':{'Internal':{'daily':'20.Day.Mean',
|
|
119
|
+
'unit': '09.Archive'},
|
|
120
|
+
'External': {'daily': '20.Day.Mean',
|
|
121
|
+
'unit': '08.Provisional.Edited'}},
|
|
122
|
+
}
|
|
119
123
|
|
|
120
124
|
|
|
121
125
|
|
|
@@ -123,9 +127,11 @@ CONSTITUENT_NAME_NO = {'Q' :['262*'],#,'263'],
|
|
|
123
127
|
'WT' :['450*', '451*'], # '450.42','451.42'],
|
|
124
128
|
'OP' :['863*'],
|
|
125
129
|
'DO' :['866*'],
|
|
130
|
+
'TRB': ['811*'],
|
|
131
|
+
'TDS': ['2175*'],
|
|
126
132
|
'TP' :None,
|
|
127
133
|
'TSS':None,
|
|
128
|
-
'N' :
|
|
134
|
+
'N' :['341*'],
|
|
129
135
|
'TKN':None}
|
|
130
136
|
|
|
131
137
|
CONSTITUENT_NAME_NO_WPLMN = {'Q' :['262*'],#,'263'],
|
|
@@ -137,7 +143,7 @@ CONSTITUENT_NAME_NO_WPLMN = {'Q' :['262*'],#,'263'],
|
|
|
137
143
|
'N' :['5024' ,'5025'],
|
|
138
144
|
'TKN':['5044' ,'5045']}
|
|
139
145
|
|
|
140
|
-
VALID_CONSTITUENTS = ['Q','WT','OP','DO','TP','TSS','N','TKN']
|
|
146
|
+
VALID_CONSTITUENTS = ['Q','WT','OP','DO','TP','TSS','N','TKN','TRB']
|
|
141
147
|
|
|
142
148
|
# def _info(station_nos):
|
|
143
149
|
# station_info = info(station_nos)
|
|
@@ -174,7 +180,7 @@ def extract(station_nos, constituent, dbpath, start_year = 1996, end_year = 2030
|
|
|
174
180
|
else:
|
|
175
181
|
constituent_nos = CONSTITUENT_NAME_NO[constituent]
|
|
176
182
|
|
|
177
|
-
ts_ids =
|
|
183
|
+
ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
178
184
|
stationparameter_no = constituent_nos,
|
|
179
185
|
ts_name = ts_names['unit'])
|
|
180
186
|
|
|
@@ -182,6 +188,16 @@ def extract(station_nos, constituent, dbpath, start_year = 1996, end_year = 2030
|
|
|
182
188
|
for ts_id in ts_ids:
|
|
183
189
|
jsons.append(download_chunk(ts_id,start_year,end_year,as_json = True))
|
|
184
190
|
time.sleep(.1)
|
|
191
|
+
|
|
192
|
+
|
|
193
|
+
|
|
194
|
+
|
|
195
|
+
# Connect to DuckDB (in-memory database)
|
|
196
|
+
con = duckdb.connect(database=':memory:')
|
|
197
|
+
|
|
198
|
+
# Register the Python list of dictionaries as a virtual table
|
|
199
|
+
# DuckDB can automatically infer the schema from this list.
|
|
200
|
+
con.register("my_json_table", json_data)
|
|
185
201
|
return jsons
|
|
186
202
|
|
|
187
203
|
|
|
@@ -208,7 +224,7 @@ def extract(station_nos, constituent, dbpath, start_year = 1996, end_year = 2030
|
|
|
208
224
|
|
|
209
225
|
|
|
210
226
|
def info(station_nos):
|
|
211
|
-
ts_ids =
|
|
227
|
+
ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
212
228
|
stationparameter_no = STATIONPARAMETER_NOS)
|
|
213
229
|
ts_ids = ts_ids.drop_duplicates(subset = 'parametertype_name')
|
|
214
230
|
ts_ids['constituent'] = ts_ids['parametertype_id'].map(PARAMETERTYPE_MAP)
|
|
@@ -221,7 +237,7 @@ def download(station_nos,start_year = 1996, end_year = 2030, raw = False,wplmn =
|
|
|
221
237
|
print('Downloading Timeseries Data')
|
|
222
238
|
df = pd.concat([_download(constituent,station_nos,start_year,end_year,raw,wplmn) for constituent in VALID_CONSTITUENTS])
|
|
223
239
|
|
|
224
|
-
station_metadata =
|
|
240
|
+
station_metadata = pywisk.get_stations(station_no = station_nos,returnfields = ['stationgroup_id'])
|
|
225
241
|
if any(station_metadata['stationgroup_id'].isin(['1319204'])):
|
|
226
242
|
df['wplmn_flag'] = 1
|
|
227
243
|
else:
|
|
@@ -254,14 +270,14 @@ def transform(data):
|
|
|
254
270
|
data.loc[:,'unit'] = data['unit'].str.lower()
|
|
255
271
|
data.replace({'unit':'°f'},'degF',inplace = True)
|
|
256
272
|
data['data_type'] = 'continuous'
|
|
257
|
-
data['
|
|
273
|
+
data['station_origin'] = 'wiski'
|
|
258
274
|
data.set_index('datetime',drop=True,inplace=True)
|
|
259
275
|
data.index = data.index.tz_convert('UTC-06:00')
|
|
260
276
|
|
|
261
277
|
|
|
262
278
|
data.index = data.index.round('h').round('h')
|
|
263
279
|
data = data.reset_index()
|
|
264
|
-
data = data.groupby(['datetime','variable','unit','station_id','station_name','constituent','interval_minutes','data_format','data_type','
|
|
280
|
+
data = data.groupby(['datetime','variable','unit','station_id','station_name','constituent','interval_minutes','data_format','data_type','station_origin']).mean()
|
|
265
281
|
data = data.reset_index()
|
|
266
282
|
data = data.set_index('datetime')
|
|
267
283
|
|
|
@@ -287,13 +303,13 @@ def _download(constituent,station_nos,start_year = 1996,end_year = 2030, raw = F
|
|
|
287
303
|
else:
|
|
288
304
|
constituent_nos = CONSTITUENT_NAME_NO[constituent]
|
|
289
305
|
|
|
290
|
-
ts_ids =
|
|
306
|
+
ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
291
307
|
stationparameter_no = constituent_nos,
|
|
292
308
|
ts_name = ts_names['unit'])
|
|
293
309
|
|
|
294
310
|
interval_minutes = 60
|
|
295
311
|
if ts_ids.empty:
|
|
296
|
-
ts_ids =
|
|
312
|
+
ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
297
313
|
stationparameter_no = constituent_nos,
|
|
298
314
|
ts_name = ts_names['daily'])
|
|
299
315
|
interval_minutes = 1440
|
|
@@ -323,7 +339,7 @@ def download_chunk(ts_id,start_year = 1996,end_year = 2030, interval = 5, as_jso
|
|
|
323
339
|
end = int(start + interval-1)
|
|
324
340
|
if end > end_year:
|
|
325
341
|
end = end_year
|
|
326
|
-
df =
|
|
342
|
+
df = pywisk.get_ts(ts_id,start_date = f'{start}-01-01',end_date = f'{end}-12-31',as_json = as_json)
|
|
327
343
|
if not df.empty: frames.append(df)
|
|
328
344
|
df.index = pd.to_datetime(df['Timestamp'])
|
|
329
345
|
time.sleep(.1)
|
|
@@ -380,7 +396,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
380
396
|
# else:
|
|
381
397
|
# ts_names = ['15.Rated']
|
|
382
398
|
|
|
383
|
-
# ts_ids =
|
|
399
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
384
400
|
# stationparameter_no = ['262*'],
|
|
385
401
|
# ts_name = ts_names)
|
|
386
402
|
|
|
@@ -406,7 +422,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
406
422
|
# ts_names = ['09.Archive']
|
|
407
423
|
|
|
408
424
|
|
|
409
|
-
# ts_ids =
|
|
425
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
410
426
|
# stationparameter_no = ['450*','450.42*','451*','451.42*'],
|
|
411
427
|
# ts_name = ts_names)
|
|
412
428
|
|
|
@@ -433,7 +449,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
433
449
|
# else:
|
|
434
450
|
# ts_names = ['09.Archive']
|
|
435
451
|
|
|
436
|
-
# ts_ids =
|
|
452
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
437
453
|
# stationparameter_no = ['866*'],
|
|
438
454
|
# ts_name = ts_names)
|
|
439
455
|
|
|
@@ -450,7 +466,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
450
466
|
|
|
451
467
|
|
|
452
468
|
# def orthophosphate(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
453
|
-
# ts_ids =
|
|
469
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
454
470
|
# stationparameter_no = ['5034','5035'],
|
|
455
471
|
# ts_name = ['20.Day.Mean'])
|
|
456
472
|
|
|
@@ -469,7 +485,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
469
485
|
|
|
470
486
|
# def total_phosphorous(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
471
487
|
|
|
472
|
-
# ts_ids =
|
|
488
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
473
489
|
# stationparameter_no = ['5004','5005'],
|
|
474
490
|
# ts_name = ['20.Day.Mean'])
|
|
475
491
|
# if ts_ids.empty:
|
|
@@ -487,7 +503,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
487
503
|
|
|
488
504
|
# def total_suspended_solids(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
489
505
|
|
|
490
|
-
# ts_ids =
|
|
506
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
491
507
|
# stationparameter_no = ['5014','5015'],
|
|
492
508
|
# ts_name = ['20.Day.Mean'])
|
|
493
509
|
# if ts_ids.empty:
|
|
@@ -505,7 +521,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
505
521
|
|
|
506
522
|
# def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
507
523
|
|
|
508
|
-
# ts_ids =
|
|
524
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
509
525
|
# stationparameter_no = ['5044','5045'],
|
|
510
526
|
# ts_name = ['20.Day.Mean'])
|
|
511
527
|
|
|
@@ -524,7 +540,7 @@ def tkn(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
|
524
540
|
|
|
525
541
|
# def nitrogen(station_nos,start_year = 1996,end_year = 2030,raw=False):
|
|
526
542
|
|
|
527
|
-
# ts_ids =
|
|
543
|
+
# ts_ids = pywisk.get_ts_ids(station_nos = station_nos,
|
|
528
544
|
# stationparameter_no = ['5024','5025'],
|
|
529
545
|
# ts_name = ['20.Day.Mean'])
|
|
530
546
|
|
mpcaHydro/etlWPLMN.py
CHANGED
|
@@ -8,7 +8,7 @@ Created on Tue Oct 3 08:04:49 2023
|
|
|
8
8
|
|
|
9
9
|
|
|
10
10
|
import pandas as pd
|
|
11
|
-
from
|
|
11
|
+
from mpcaHydro.pyWISK import pyWISK
|
|
12
12
|
import time
|
|
13
13
|
|
|
14
14
|
|
|
@@ -83,7 +83,7 @@ def transform(data):
|
|
|
83
83
|
data = data.loc[:,['datetime','value','variable','unit','quality_id','station_id','station_name','constituent']]
|
|
84
84
|
|
|
85
85
|
data['unit'].replace('ft³/s','cfs',inplace=True)
|
|
86
|
-
data['
|
|
86
|
+
data['station_origin'] = 'wplmn'
|
|
87
87
|
return data
|
|
88
88
|
|
|
89
89
|
# data['Timestamp'] = pd.to_datetime(data['Timestamp']).dt.date
|
mpcaHydro/outlets.py
ADDED
|
@@ -0,0 +1,371 @@
|
|
|
1
|
+
# -*- coding: utf-8 -*-
"""
Created on Thu May 1 09:51:51 2025

@author: mfratki
"""
#import sqlite3
from pathlib import Path
import geopandas as gpd
import pandas as pd
import duckdb

# Directory bundled with the package holding the station geopackages and the
# outlets DuckDB database. Built with Path joins (the original used literal
# backslashes, which only worked on Windows).
_DATA_DIR = Path(__file__).resolve().parent / 'data'

# WISKI stations: keep only rows mapped to model operations (opnids).
_stations_wiski = gpd.read_file(str(_DATA_DIR / 'stations_wiski.gpkg'))
stations_wiski = _stations_wiski.dropna(subset='opnids')[['station_id','true_opnid','opnids','comments','modeled','repository_name','wplmn_flag']]
stations_wiski['source'] = 'wiski'

# EQUIS stations: same columns as the WISKI frame; EQUIS has no WPLMN flag.
_stations_equis = gpd.read_file(str(_DATA_DIR / 'stations_EQUIS.gpkg'))
stations_equis = _stations_equis.dropna(subset='opnids')[['station_id','true_opnid','opnids','comments','modeled','repository_name']]
stations_equis['source'] = 'equis'
stations_equis['wplmn_flag'] = 0


DB_PATH = str(_DATA_DIR / 'outlets.duckdb')

# Combined station/model lookup table used by the accessor functions below.
# Blank opnids strings count as missing; one row per (station_id, source).
MODL_DB = pd.concat([stations_wiski, stations_equis])
MODL_DB['opnids'] = MODL_DB['opnids'].str.strip().replace('', pd.NA)
MODL_DB = MODL_DB.dropna(subset='opnids')
MODL_DB = MODL_DB.drop_duplicates(['station_id', 'source']).reset_index(drop=True)
|
|
33
|
+
|
|
34
|
+
def _reload():
    """Re-read the station geopackages from disk and rebuild the module-level
    station frames and MODL_DB lookup table in place.

    Call after editing the bundled .gpkg files so the module globals reflect
    the new contents without re-importing the package.
    """
    global _stations_wiski, stations_wiski, _stations_equis, stations_equis, MODL_DB
    # Use Path joins instead of literal backslashes so the paths also
    # resolve on POSIX systems.
    data_dir = Path(__file__).resolve().parent / 'data'

    _stations_wiski = gpd.read_file(str(data_dir / 'stations_wiski.gpkg'))
    stations_wiski = _stations_wiski.dropna(subset='opnids')[['station_id','true_opnid','opnids','comments','modeled','repository_name','wplmn_flag']]
    stations_wiski['source'] = 'wiski'

    _stations_equis = gpd.read_file(str(data_dir / 'stations_EQUIS.gpkg'))
    stations_equis = _stations_equis.dropna(subset='opnids')[['station_id','true_opnid','opnids','comments','modeled','repository_name']]
    stations_equis['source'] = 'equis'
    stations_equis['wplmn_flag'] = 0

    MODL_DB = pd.concat([stations_wiski, stations_equis])
    MODL_DB['opnids'] = MODL_DB['opnids'].str.strip().replace('', pd.NA)
    MODL_DB = MODL_DB.dropna(subset='opnids')
    MODL_DB = MODL_DB.drop_duplicates(['station_id', 'source']).reset_index(drop=True)
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
def get_model_db(model_name: str):
    """Return the rows of MODL_DB belonging to the given model repository."""
    mask = MODL_DB['repository_name'] == model_name
    return MODL_DB[mask]
|
|
52
|
+
|
|
53
|
+
def split_opnids(opnids: list):
    """Flatten a list of opnid-string lists into absolute integer ids.

    Each element of *opnids* is itself an iterable of numeric strings
    (e.g. '650', '-12.0'); a minus sign marks exclusion elsewhere, so
    only the magnitude is returned here.
    """
    flattened = []
    for group in opnids:
        for token in group:
            flattened.append(abs(int(float(token))))
    return flattened
|
|
55
|
+
|
|
56
|
+
def valid_models():
    """List the distinct model repository names present in MODL_DB."""
    return list(MODL_DB['repository_name'].unique())
|
|
58
|
+
|
|
59
|
+
def wplmn_station_opnids(model_name):
    """Absolute reach ids for WPLMN-flagged WISKI stations of *model_name*."""
    selected = MODL_DB.query('repository_name == @model_name and wplmn_flag == 1 and source == "wiski"')
    return split_opnids(selected['opnids'].str.split(',').to_list())
|
|
62
|
+
|
|
63
|
+
def wiski_station_opnids(model_name):
    """Absolute reach ids for all WISKI-sourced stations of *model_name*."""
    selected = MODL_DB.query('repository_name == @model_name and source == "wiski"')
    return split_opnids(selected['opnids'].str.split(',').to_list())
|
|
66
|
+
|
|
67
|
+
def equis_station_opnids(model_name):
    """Absolute reach ids for all EQUIS-sourced stations of *model_name*."""
    selected = MODL_DB.query('repository_name == @model_name and source == "equis"')
    return split_opnids(selected['opnids'].str.split(',').to_list())
|
|
70
|
+
|
|
71
|
+
def station_opnids(model_name):
    """Absolute reach ids for every station of *model_name*, any source."""
    selected = MODL_DB.query('repository_name == @model_name')
    return split_opnids(selected['opnids'].str.split(',').to_list())
|
|
74
|
+
|
|
75
|
+
def equis_stations(model_name):
    """Station ids sourced from EQUIS for the given model."""
    subset = MODL_DB.query('repository_name == @model_name and source == "equis"')
    return subset['station_id'].tolist()
|
|
77
|
+
|
|
78
|
+
def wiski_stations(model_name):
    """Station ids sourced from WISKI for the given model."""
    subset = MODL_DB.query('repository_name == @model_name and source == "wiski"')
    return subset['station_id'].tolist()
|
|
80
|
+
|
|
81
|
+
def wplmn_stations(model_name):
    """WPLMN-flagged WISKI station ids for the given model."""
    subset = MODL_DB.query('repository_name == @model_name and wplmn_flag == 1 and source == "wiski"')
    return subset['station_id'].tolist()
|
|
83
|
+
|
|
84
|
+
def outlets(model_name):
    """Group the model's rows by (opnids, repository_name): one group per outlet."""
    grouped = MODL_DB.query('repository_name == @model_name').groupby(by = ['opnids','repository_name'])
    return [frame for _, frame in grouped]
|
|
86
|
+
|
|
87
|
+
def outlet_stations(model_name):
    """Station-id lists, one list per outlet grouping of the model."""
    grouped = MODL_DB.query('repository_name == @model_name').groupby(by = ['opnids','repository_name'])
    return [frame['station_id'].to_list() for _, frame in grouped]
|
|
89
|
+
|
|
90
|
+
def _split_opnids(opnids: list):
|
|
91
|
+
return [int(float(j)) for i in opnids for j in i]
|
|
92
|
+
|
|
93
|
+
def connect(db_path, read_only=True):
    """Open a DuckDB connection to *db_path*, creating parent dirs as needed.

    NOTE(review): the default is read-only — writers must pass
    read_only=False explicitly.
    """
    parent = Path(db_path).parent
    parent.mkdir(parents=True, exist_ok=True)
    return duckdb.connect(db_path, read_only=read_only)
|
|
96
|
+
|
|
97
|
+
|
|
98
|
+
def init_db(db_path: str, reset: bool = False):
    """
    Initialize the DuckDB database: create the outlets tables and views.

    Parameters
    ----------
    db_path : str
        Path to the DuckDB file; parent directories are created if missing.
    reset : bool
        When True, delete any existing database file first.
    """
    db_path = Path(db_path)
    if reset and db_path.exists():
        db_path.unlink()

    # Must open writable: connect() defaults to read_only=True, which can
    # neither create a new database file nor execute DDL.
    with connect(db_path.as_posix(), read_only=False) as con:
        con.execute(OUTLETS_SCHEMA)
|
|
108
|
+
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
# Accessors:
|
|
112
|
+
def get_outlets_by_model(model_name: str):
    """Fetch every station/reach pair recorded for *model_name*."""
    sql = """
            SELECT r.*
            FROM outlets.station_reach_pairs r
            WHERE r.repository_name = ?
            """
    with connect(DB_PATH) as con:
        return con.execute(sql, [model_name]).fetchdf()
|
|
123
|
+
|
|
124
|
+
def get_outlets_by_reach(reach_id: int, model_name: str):
    """
    Return all outlet rows for outlets that include the given reach_id in the given model_name.
    """
    sql = """
            SELECT r.*
            FROM outlets.station_reach_pairs r
            WHERE r.reach_id = ? AND r.repository_name = ?
            """
    with connect(DB_PATH) as con:
        return con.execute(sql, [reach_id, model_name]).fetchdf()
|
|
137
|
+
|
|
138
|
+
def get_outlets_by_station(station_id: str, station_origin: str):
    """
    Return all station/reach pair rows for outlets containing the given
    station_id from the given origin (e.g. 'wiski' or 'equis').

    (Docstring fixed: the original was copy-pasted from
    get_outlets_by_reach and described a reach_id filter.)
    """
    with connect(DB_PATH) as con:
        df = con.execute(
            """
            SELECT r.*
            FROM outlets.station_reach_pairs r
            WHERE r.station_id = ? AND r.station_origin = ?
            """,
            [station_id, station_origin]).fetchdf()
    return df
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
|
|
155
|
+
class OutletGateway:
    """Facade over the outlets database for a single model repository.

    Wraps the module-level accessor functions so callers don't have to
    pass model_name repeatedly.
    """

    def __init__(self, model_name: str):
        self.model_name = model_name
        self.db_path = DB_PATH
        self.modl_db = get_model_db(model_name)

    # Legacy methods to access functions
    def wplmn_station_opnids(self):
        return wplmn_station_opnids(self.model_name)

    def wiski_station_opnids(self):
        return wiski_station_opnids(self.model_name)

    def equis_station_opnids(self):
        return equis_station_opnids(self.model_name)

    def station_opnids(self):
        return station_opnids(self.model_name)

    def equis_stations(self):
        return equis_stations(self.model_name)

    def wiski_stations(self):
        return wiski_stations(self.model_name)

    def wplmn_stations(self):
        return wplmn_stations(self.model_name)

    def outlets(self):
        return outlets(self.model_name)

    def outlet_stations(self):
        return outlet_stations(self.model_name)

    # Accessors for outlets
    def get_outlets(self):
        return get_outlets_by_model(self.model_name)

    def get_outlets_by_reach(self, reach_id: int):
        return get_outlets_by_reach(reach_id, self.model_name)

    def get_outlets_by_station(self, station_id: str, station_origin: str):
        # Validate with a real exception: the original used `assert`,
        # which is silently stripped under `python -O`.
        if station_id not in self.wiski_stations() + self.equis_stations():
            raise ValueError(f"Station ID {station_id} not found in model {self.model_name}")
        return get_outlets_by_station(station_id, station_origin)
|
|
199
|
+
|
|
200
|
+
# constructors:
|
|
201
|
+
def build_outlet_db(db_path: str = None):
    """Create (or recreate) the outlets database and populate it from MODL_DB.

    Parameters
    ----------
    db_path : str, optional
        Target DuckDB file; defaults to the packaged DB_PATH.
    """
    if db_path is None:
        db_path = DB_PATH
    init_db(db_path, reset=True)
    # A writable connection is required for the INSERTs in build_outlets;
    # connect() defaults to read-only.
    with connect(db_path, read_only=False) as con:
        build_outlets(con)
|
|
207
|
+
|
|
208
|
+
|
|
209
|
+
def build_outlets(con, model_name: str = None):
    # Populate outlets, outlet_reaches and outlet_stations from MODL_DB
    # (or from a single model's rows when model_name is given).
    # The outlet_id is simply the enumeration index of each
    # (opnids, repository_name) group.
    if model_name is not None:
        modl_db = get_model_db(model_name)
    else:
        modl_db = MODL_DB

    for index, (_, group) in enumerate(modl_db.drop_duplicates(['station_id','source']).groupby(by = ['opnids','repository_name'])):
        repo_name = group['repository_name'].iloc[0]
        add_outlet(con, outlet_id = index, outlet_name = None, repository_name = repo_name, notes = None)

        # 'opnids' is a comma-separated string; _split_opnids keeps the
        # sign, and a negative id marks a reach to exclude.
        opnids = set(_split_opnids(group['opnids'].str.split(',').to_list()))

        for opnid in opnids:
            if opnid < 0:
                exclude = 1
            else:
                exclude = 0
            add_reach(con, outlet_id = index, reach_id = abs(opnid),exclude = exclude, repository_name = repo_name)

        # One membership row per unique (station_id, source) in the group.
        for _, row in group.drop_duplicates(subset=['station_id', 'source']).iterrows():
            add_station(con, outlet_id = index, station_id = row['station_id'], station_origin = row['source'], true_opnid = row['true_opnid'], repository_name= repo_name, comments = row['comments'])
|
|
230
|
+
|
|
231
|
+
|
|
232
|
+
def create_outlet_schema(con, model_name : str):
    """Populate the outlet tables for a single model.

    Bug fix: the original body referenced an undefined name ``modl_db``
    (a leftover module alias) and raised NameError on every call; it
    duplicated build_outlets line-for-line, so delegate to it instead.
    """
    build_outlets(con, model_name)
|
|
248
|
+
|
|
249
|
+
|
|
250
|
+
def add_outlet(con,
               outlet_id: str,
               repository_name: str,
               outlet_name = None,
               notes = None):
    """
    Insert an outlet. repository_name is required.
    """
    sql = "INSERT INTO outlets.outlets (outlet_id, repository_name, outlet_name, notes) VALUES (?, ?, ?, ?)"
    params = [outlet_id, repository_name, outlet_name, notes]
    con.execute(sql, params)
|
|
262
|
+
|
|
263
|
+
def add_station(con,
                outlet_id: str,
                station_id: str,
                station_origin: str,
                true_opnid: str,
                repository_name: str,
                comments = None):
    """
    Insert a station membership for an outlet.
    Constraints:
    - UNIQUE (station_id, station_origin): unique per origin across all outlets.
    - true_opnid and repository_name are required per schema.
    """
    sql = """INSERT INTO outlets.outlet_stations
        (outlet_id, station_id, station_origin, true_opnid, repository_name, comments)
        VALUES (?, ?, ?, ?, ?, ?)"""
    params = [outlet_id, station_id, station_origin, true_opnid, repository_name, comments]
    con.execute(sql, params)
|
|
282
|
+
|
|
283
|
+
def add_reach(con,
              outlet_id: str,
              reach_id: str,
              repository_name: str,
              exclude: int = 0):
    """
    Insert a reach membership for an outlet.
    - repository_name is required and participates in the PK (reach_id, repository_name).
    - exclude = 1 to mark a reach as excluded from association views.
    """
    sql = """INSERT INTO outlets.outlet_reaches (outlet_id, reach_id, repository_name, exclude)
        VALUES (?, ?, ?, ?)"""
    params = [outlet_id, reach_id, repository_name, int(exclude)]
    con.execute(sql, params)
|
|
298
|
+
|
|
299
|
+
|
|
300
|
+
# DDL for the outlets database. Bug fix: the station_reach_pairs view had a
# trailing comma after the last selected column (r.repository_name,) before
# FROM — accepted by DuckDB but a syntax error in SQLite, contradicting the
# "Compatible with DuckDB and SQLite" note below.
OUTLETS_SCHEMA = """-- schema.sql
-- Simple 3-table design to manage associations between model reaches and observation stations via outlets.
-- Compatible with DuckDB and SQLite.

-- Table 1: outlets
-- Represents a logical grouping that ties stations and reaches together.
CREATE TABLE IF NOT EXISTS outlets (
    outlet_id TEXT PRIMARY KEY,
    repository_name TEXT NOT NULL,
    outlet_name TEXT,
    notes TEXT -- optional: general notes about the outlet grouping
);

-- Table 2: outlet_stations
-- One-to-many: outlet -> stations
CREATE TABLE IF NOT EXISTS outlet_stations (
    outlet_id TEXT NOT NULL,
    station_id TEXT NOT NULL,
    station_origin TEXT NOT NULL, -- e.g., 'wiski', 'equis'
    repository_name TEXT NOT NULL, -- repository model the station is physically located in
    true_opnid TEXT NOT NULL, -- The specific reach the station physically sits on (optional)
    comments TEXT, -- Per-station comments, issues, etc.
    CONSTRAINT uq_station_origin UNIQUE (station_id, station_origin),
    FOREIGN KEY (outlet_id) REFERENCES outlets(outlet_id)
);

-- Table 3: outlet_reaches
-- One-to-many: outlet -> reaches
-- A reach can appear in multiple outlets, enabling many-to-many overall.
CREATE TABLE IF NOT EXISTS outlet_reaches (
    outlet_id TEXT NOT NULL,
    reach_id TEXT NOT NULL, -- model reach identifier (aka opind)
    repository_name TEXT NOT NULL, -- optional: where the mapping comes from
    exclude INTEGER DEFAULT 0, -- flag to indicate if this reach should be excluded (1) or included (0)
    FOREIGN KEY (outlet_id) REFERENCES outlets(outlet_id)
);

-- Useful views:

-- View: station_reach_pairs
-- Derives the implicit many-to-many station <-> reach relationship via shared outlet_id
CREATE VIEW IF NOT EXISTS station_reach_pairs AS
SELECT
    s.outlet_id,
    s.station_id,
    s.station_origin,
    r.reach_id,
    r.exclude,
    r.repository_name
FROM outlet_stations s
JOIN outlet_reaches r
    ON s.outlet_id = r.outlet_id;

"""
|
|
354
|
+
|
|
355
|
+
#row = modl_db.MODL_DB.iloc[0]
|
|
356
|
+
|
|
357
|
+
#info = etlWISKI.info(row['station_id'])
|
|
358
|
+
|
|
359
|
+
#modl_db.MODL_DB.query('source == "equis"')
|
|
360
|
+
|
|
361
|
+
# outlet_dict = {'stations': {'wiski': ['E66050001'],
|
|
362
|
+
# 'equis': ['S002-118']},
|
|
363
|
+
# 'reaches': {'Clearwater': [650]}
|
|
364
|
+
|
|
365
|
+
|
|
366
|
+
|
|
367
|
+
|
|
368
|
+
# station_ids = ['S002-118']
|
|
369
|
+
# #station_ids = ['E66050001']
|
|
370
|
+
# reach_ids = [650]
|
|
371
|
+
# flow_station_ids = ['E66050001']
|