tsp 1.8.1__py3-none-any.whl → 1.10.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (127)
  1. tsp/__init__.py +11 -11
  2. tsp/__meta__.py +1 -1
  3. tsp/concatenation.py +159 -153
  4. tsp/core.py +1306 -1162
  5. tsp/data/2023-01-06_755-test-Dataset_2031-Constant_Over_Interval-Hourly-Ground_Temperature-Thermistor_Automated.timeserie.csv +4 -4
  6. tsp/data/2023-01-06_755-test.metadata.txt +208 -208
  7. tsp/data/NTGS_example_csv.csv +6 -6
  8. tsp/data/NTGS_example_slash_dates.csv +6 -6
  9. tsp/data/NTGS_gtr_example_excel.xlsx +0 -0
  10. tsp/data/example_geotop.csv +5240 -5240
  11. tsp/data/example_gtnp.csv +1298 -1298
  12. tsp/data/example_permos.csv +7 -7
  13. tsp/data/ntgs-db-multi.txt +3872 -0
  14. tsp/data/ntgs-db-single.txt +2251 -0
  15. tsp/data/test_geotop_has_space.txt +5 -5
  16. tsp/data/tsp_format_long.csv +10 -0
  17. tsp/data/tsp_format_wide_1.csv +7 -0
  18. tsp/data/tsp_format_wide_2.csv +7 -0
  19. tsp/dataloggers/AbstractReader.py +43 -43
  20. tsp/dataloggers/FG2.py +110 -110
  21. tsp/dataloggers/GP5W.py +114 -114
  22. tsp/dataloggers/Geoprecision.py +34 -34
  23. tsp/dataloggers/HOBO.py +930 -914
  24. tsp/dataloggers/RBRXL800.py +190 -190
  25. tsp/dataloggers/RBRXR420.py +371 -308
  26. tsp/dataloggers/Vemco.py +84 -0
  27. tsp/dataloggers/__init__.py +15 -15
  28. tsp/dataloggers/logr.py +196 -115
  29. tsp/dataloggers/test_files/004448.DAT +2543 -2543
  30. tsp/dataloggers/test_files/004531.DAT +17106 -17106
  31. tsp/dataloggers/test_files/004531.HEX +3587 -3587
  32. tsp/dataloggers/test_files/004534.HEX +3587 -3587
  33. tsp/dataloggers/test_files/010252.dat +1731 -1731
  34. tsp/dataloggers/test_files/010252.hex +1739 -1739
  35. tsp/dataloggers/test_files/010274.hex +1291 -1291
  36. tsp/dataloggers/test_files/010278.hex +3544 -3544
  37. tsp/dataloggers/test_files/012064.dat +1286 -1286
  38. tsp/dataloggers/test_files/012064.hex +1294 -1294
  39. tsp/dataloggers/test_files/012064_modified_start.hex +1294 -0
  40. tsp/dataloggers/test_files/012081.hex +3532 -3532
  41. tsp/dataloggers/test_files/013138_recovery_stamp.hex +1123 -0
  42. tsp/dataloggers/test_files/014037-2007.hex +95 -0
  43. tsp/dataloggers/test_files/019360_20160918_1146_SlumpIslandTopofHill.hex +11253 -0
  44. tsp/dataloggers/test_files/019360_20160918_1146_SlumpIslandTopofHill.xls +0 -0
  45. tsp/dataloggers/test_files/07B1592.DAT +1483 -1483
  46. tsp/dataloggers/test_files/07B1592.HEX +1806 -1806
  47. tsp/dataloggers/test_files/07B4450.DAT +2234 -2234
  48. tsp/dataloggers/test_files/07B4450.HEX +2559 -2559
  49. tsp/dataloggers/test_files/2022018_2025-09-18T22-16-16.txt +36 -0
  50. tsp/dataloggers/test_files/2022018_2025-09-18T22-16-16_raw.csv +2074 -0
  51. tsp/dataloggers/test_files/2022018_2025-09-18T22-16-16_temp.csv +2074 -0
  52. tsp/dataloggers/test_files/2025004_2025-12-02T17-07-28_cfg.txt +30 -0
  53. tsp/dataloggers/test_files/2025004_2025-12-02T17-07-28_raw.csv +35 -0
  54. tsp/dataloggers/test_files/2025004_2025-12-02T17-07-28_temp.csv +35 -0
  55. tsp/dataloggers/test_files/204087.xlsx +0 -0
  56. tsp/dataloggers/test_files/Asc-1455As02.000 +2982 -0
  57. tsp/dataloggers/test_files/Asc-1456As02.000 +2992 -0
  58. tsp/dataloggers/test_files/Asc-1457As02.000 +2917 -0
  59. tsp/dataloggers/test_files/BGC_BH15_019362_20140610_1253.hex +1729 -0
  60. tsp/dataloggers/test_files/Bin2944.csv +759 -0
  61. tsp/dataloggers/test_files/Bin5494.csv +2972 -0
  62. tsp/dataloggers/test_files/Bin6786.csv +272 -0
  63. tsp/dataloggers/test_files/FG2_399.csv +9881 -9881
  64. tsp/dataloggers/test_files/GP5W.csv +1121 -1121
  65. tsp/dataloggers/test_files/GP5W_260.csv +1884 -1884
  66. tsp/dataloggers/test_files/GP5W_270.csv +2210 -2210
  67. tsp/dataloggers/test_files/H08-030-08_HOBOware.csv +998 -998
  68. tsp/dataloggers/test_files/Minilog-II-T_350763_20190711_1.csv +2075 -0
  69. tsp/dataloggers/test_files/Minilog-II-T_350769_20190921_1.csv +6384 -0
  70. tsp/dataloggers/test_files/Minilog-II-T_354284_20190921_1.csv +4712 -0
  71. tsp/dataloggers/test_files/Minilog-T_7943_20140920_1.csv +5826 -0
  72. tsp/dataloggers/test_files/Minilog-T_8979_20140806_1.csv +2954 -0
  73. tsp/dataloggers/test_files/Minilog-T_975_20110824_1.csv +4343 -0
  74. tsp/dataloggers/test_files/RBR_01.dat +1046 -1046
  75. tsp/dataloggers/test_files/RBR_02.dat +2426 -2426
  76. tsp/dataloggers/test_files/RI03b_062831_20240905_1801.rsk +0 -0
  77. tsp/dataloggers/test_files/RI03b_062831_20240905_1801.xlsx +0 -0
  78. tsp/dataloggers/test_files/RSTDT2055.csv +2152 -2152
  79. tsp/dataloggers/test_files/U23-001_HOBOware.csv +1001 -1001
  80. tsp/dataloggers/test_files/hobo-negative-2.txt +6396 -6396
  81. tsp/dataloggers/test_files/hobo-negative-3.txt +5593 -5593
  82. tsp/dataloggers/test_files/hobo-positive-number-1.txt +1000 -1000
  83. tsp/dataloggers/test_files/hobo-positive-number-2.csv +1003 -1003
  84. tsp/dataloggers/test_files/hobo-positive-number-3.csv +1133 -1133
  85. tsp/dataloggers/test_files/hobo-positive-number-4.csv +1209 -1209
  86. tsp/dataloggers/test_files/hobo2.csv +8702 -8702
  87. tsp/dataloggers/test_files/hobo_1_AB.csv +21732 -21732
  88. tsp/dataloggers/test_files/hobo_1_AB_Details.txt +133 -133
  89. tsp/dataloggers/test_files/hobo_1_AB_classic.csv +4373 -4373
  90. tsp/dataloggers/test_files/hobo_1_AB_defaults.csv +21732 -21732
  91. tsp/dataloggers/test_files/hobo_1_AB_minimal.txt +1358 -1358
  92. tsp/dataloggers/test_files/hobo_1_AB_var2.csv +3189 -3189
  93. tsp/dataloggers/test_files/hobo_1_AB_var3.csv +2458 -2458
  94. tsp/dataloggers/test_files/logR_ULogC16-32_1.csv +106 -106
  95. tsp/dataloggers/test_files/logR_ULogC16-32_2.csv +100 -100
  96. tsp/dataloggers/test_files/mon_3_Ta_2010-08-18_2013-02-08.txt +21724 -21724
  97. tsp/dataloggers/test_files/rbr_001.dat +1133 -1133
  98. tsp/dataloggers/test_files/rbr_001.hex +1139 -1139
  99. tsp/dataloggers/test_files/rbr_001_no_comment.dat +1132 -1132
  100. tsp/dataloggers/test_files/rbr_001_no_comment.hex +1138 -1138
  101. tsp/dataloggers/test_files/rbr_002.dat +1179 -1179
  102. tsp/dataloggers/test_files/rbr_002.hex +1185 -1185
  103. tsp/dataloggers/test_files/rbr_003.hex +1292 -1292
  104. tsp/dataloggers/test_files/rbr_xl_001.DAT +1105 -1105
  105. tsp/dataloggers/test_files/rbr_xl_002.DAT +1126 -1126
  106. tsp/dataloggers/test_files/rbr_xl_003.DAT +4622 -4622
  107. tsp/dataloggers/test_files/rbr_xl_003.HEX +3587 -3587
  108. tsp/gtnp.py +148 -148
  109. tsp/labels.py +3 -3
  110. tsp/misc.py +90 -90
  111. tsp/physics.py +101 -101
  112. tsp/plots/static.py +388 -374
  113. tsp/readers.py +829 -548
  114. tsp/standardization/__init__.py +0 -0
  115. tsp/standardization/metadata.py +95 -0
  116. tsp/standardization/metadata_ref.py +0 -0
  117. tsp/standardization/validator.py +535 -0
  118. tsp/time.py +45 -45
  119. tsp/tspwarnings.py +27 -15
  120. tsp/utils.py +131 -101
  121. tsp/version.py +1 -1
  122. {tsp-1.8.1.dist-info → tsp-1.10.2.dist-info}/METADATA +95 -86
  123. tsp-1.10.2.dist-info/RECORD +132 -0
  124. {tsp-1.8.1.dist-info → tsp-1.10.2.dist-info}/licenses/LICENSE +674 -674
  125. {tsp-1.8.1.dist-info → tsp-1.10.2.dist-info}/top_level.txt +1 -0
  126. tsp-1.8.1.dist-info/RECORD +0 -94
  127. {tsp-1.8.1.dist-info → tsp-1.10.2.dist-info}/WHEEL +0 -0
tsp/dataloggers/Vemco.py ADDED
@@ -0,0 +1,84 @@
+ # -*- coding: utf-8 -*-
+ """
+ *DESCRIPTION*
+
+ Author: rparker
+ Created: 2024-01-10
+ """
+ import os
+ import pathlib
+ import pandas as pd
+ import datetime as dt
+
+ from .AbstractReader import AbstractReader
+
+
+ class Vemco(AbstractReader):
+     def __init__(self):
+         self.META = {}
+
+     def read(self, file_path: str):
+         file_extention = pathlib.Path(file_path).suffix.lower()
+         if file_extention == ".000":
+             try:
+                 with open(file_path, "r", encoding="cp1252") as file:
+                     first_line = file.readline()
+                 if first_line.startswith("*"):
+                     self._read_old_000_logger_file(file_path)
+                 else:
+                     raise IOError(f"{os.path.basename(file_path)} unreadable. Try opening this file in Logger VUE and "
+                                   f"exporting it as a .csv")
+             except UnicodeDecodeError as e:
+                 raise IOError(f"{os.path.basename(file_path)} unreadable. Try opening this file in Logger VUE and "
+                               f"exporting it as a .csv")
+         elif file_extention == ".csv":
+             self._read_logger_vue_csv(file_path)
+         else:
+             raise ValueError("File is not a .csv or .000")
+         return self.DATA
+
+     def _read_old_000_logger_file(self, file_path):
+         with open(file_path, "r", encoding="cp1252") as file:
+             lines = file.readlines()
+         header_lines = lines[:6]
+         data_lines = [l.strip().split(",") for l in lines[6:]]
+         self.META["logger_model"] = header_lines[0].split("=")[-1].strip()
+         self.META["logger_sn"] = header_lines[1].split("=")[-1].strip()
+         self.META["study_id"] = header_lines[2].split("=")[-1].strip()
+         self.META["logging_start"] = dt.datetime.strptime(header_lines[3].split("=")[-1].strip(), "%d/%m/%Y %H:%M:%S")
+         self.META["download_date"] = dt.datetime.strptime(header_lines[4].split("=")[-1].strip(), "%d/%m/%Y %H:%M:%S")
+         sample_interval = dt.datetime.strptime(header_lines[5].split("=")[-1].strip(), "%H:%M:%S")
+         self.META["sample_interval"] = dt.timedelta(hours=sample_interval.hour, minutes=sample_interval.minute,
+                                                     seconds=sample_interval.second)
+         self.META['raw'] = "".join(header_lines)
+         self.DATA = pd.DataFrame(data_lines[1:], columns=["TIME", "TEMPERATURE"])
+         self.DATA["TIME"] = pd.to_datetime(self.DATA["TIME"], format="%d/%m/%Y %H:%M:%S")
+         self.DATA["TEMPERATURE"] = pd.to_numeric(self.DATA["TEMPERATURE"], errors='coerce')
+         return
+
+     def _read_logger_vue_csv(self, file_path):
+         with open(file_path, "r", encoding="cp1252") as file:
+             lines = file.readlines()
+
+         header_lines = lines[:7]
+         data_lines = [l.strip().split(",") for l in lines[7:]]
+         model_and_sn = header_lines[1][15:-1]
+         self.META["logger_sn"] = model_and_sn.split("-")[-1]
+         self.META["logger_model"] = "-".join(model_and_sn.split("-")[:-1])
+         self.META["study_id"] = header_lines[2].split(":")[-1].strip()
+         self.META["logging_start"] = dt.datetime.strptime(header_lines[4][18:-1], "%Y-%m-%d %H:%M:%S")
+         self.META["download_date"] = dt.datetime.strptime(header_lines[5][17:-1], "%Y-%m-%d %H:%M:%S")
+         if header_lines[3].endswith(")"):
+             data_tz = dt.timezone(dt.timedelta(hours=int(header_lines[3][45:-2])))
+             self.META["logging_start"] = self.META["logging_start"].replace(tzinfo=data_tz)
+             self.META["download_date"] = self.META["download_date"].replace(tzinfo=data_tz)
+             self.META["utc_offset"] = data_tz
+         sample_interval = dt.datetime.strptime(header_lines[6][17:-1], "%H:%M:%S")
+         self.META["sample_interval"] = dt.timedelta(hours=sample_interval.hour, minutes=sample_interval.minute,
+                                                     seconds=sample_interval.second)
+         self.META['raw'] = "".join(header_lines)
+         self.DATA = pd.DataFrame(data_lines[1:], columns=["date", "time", "TEMPERATURE"])
+         self.DATA["TIME"] = pd.to_datetime(self.DATA["date"] + " " + self.DATA["time"], format="%Y-%m-%d %H:%M:%S")
+         self.DATA["TEMPERATURE"] = pd.to_numeric(self.DATA["TEMPERATURE"], errors='coerce')
+         self.DATA.drop(columns=["date", "time"], inplace=True)
+         return
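The new `Vemco` reader follows the same `AbstractReader` pattern as the package's other datalogger modules: `read()` dispatches on the file extension, parses the header block into the `META` dict, and returns a `DATA` frame with `TIME` and `TEMPERATURE` columns. A minimal usage sketch, assuming the class is imported directly from its submodule (the `tsp/dataloggers/__init__.py` diff below shows it is not re-exported there), using one of the Minilog test files added in this release:

```python
from tsp.dataloggers.Vemco import Vemco

reader = Vemco()
# Accepts Logger VUE .csv exports or legacy .000 files; anything else
# raises ValueError, and undecodable .000 files raise IOError.
data = reader.read("tsp/dataloggers/test_files/Minilog-II-T_350763_20190711_1.csv")

print(reader.META["logger_model"], reader.META["logger_sn"])
print(data.head())  # columns: TIME, TEMPERATURE
```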
tsp/dataloggers/__init__.py CHANGED
@@ -1,15 +1,15 @@
- from .HOBO import HOBO, HOBOProperties
- from .FG2 import FG2
- from .GP5W import GP5W
- from .Geoprecision import detect_geoprecision_type
- from .logr import LogR
-
- HOBO.__module__ = __name__
- HOBOProperties.__module__ = __name__
- FG2.__module__ =__name__
- GP5W.__module__ = __name__
- LogR.__module__ = __name__
-
- __all__ = ['HOBO','HOBOProperties',
-            'FG2','GP5W', 'detect_geoprecision_type',
-            'LogR']
+ from .HOBO import HOBO, HOBOProperties
+ from .FG2 import FG2
+ from .GP5W import GP5W
+ from .Geoprecision import detect_geoprecision_type
+ from .logr import LogR
+
+ HOBO.__module__ = __name__
+ HOBOProperties.__module__ = __name__
+ FG2.__module__ =__name__
+ GP5W.__module__ = __name__
+ LogR.__module__ = __name__
+
+ __all__ = ['HOBO','HOBOProperties',
+            'FG2','GP5W', 'detect_geoprecision_type',
+            'LogR']
tsp/dataloggers/logr.py CHANGED
@@ -1,115 +1,196 @@
- import pandas as pd
- import regex as re
- import numpy as np
-
-
- class LogR:
-
-     SEP = ","
-
-     def __init__(self):
-         pass
-
-     def read(self, file):
-         headers = read_logr_header(file)
-
-         columns = [line.strip().split(',') for line in headers if is_columns_row(line)][0]
-         labels = [line.strip().split(',') for line in headers if is_label_row(line)][0]
-         data = pd.read_csv(file, skiprows=len(headers))
-
-         data.columns = ["TIME" if c == 'timestamp' else c for c in columns]
-         data['TIME'] = pd.to_datetime(data['TIME'], format=dateformat())
-
-         channels = pd.Series(data.columns).str.match("^CH")
-
-         self.DATA = data
-         self.META = {
-             'label': labels,
-             'guessed_depths': guess_depths(labels)[-sum(channels):]
-         }
-
-         return self.DATA
-
-
- def read_logr_header(file: str) -> "list":
-     """ Read metadata / header lines from LogR file
-
-     Parameters
-     ----------
-     file : str
-         path to a LogR file
-
-     Returns
-     -------
-     list
-         list of lines in the header block
-
-     Raises
-     ------
-     ValueError
-         _description_
-     """
-     found_data = False
-     max_rows = 50
-     header_lines = []
-
-     with open(file) as f:
-         while not found_data and max_rows:
-             max_rows -= 1
-
-             line = f.readline()
-
-             if is_data_row(line):
-                 found_data = True
-                 break
-
-             else:
-                 header_lines.append(line)
-
-     if not found_data:
-         raise ValueError("Could not find start of data")
-
-     return header_lines
-
-
- def guess_depths(labels: "list[str]") -> "list[float]":
-     pattern = re.compile(r"(-?[\d\.]+)")
-
-     matches = [pattern.search(l) for l in labels]
-     depths = [float(d.group(1)) if d else None for d in matches]
-
-     return depths
-
-
- def guessed_depths_ok(depths, n_channel) -> bool:
-     """ Evaluate whether the guessed depths are valid """
-     d = np.array(depths, dtype='float64')
-
-     # monotonic (by convention)
-     if not (np.diff(d) > 0).all() or (np.diff(d) < 0).all():
-         return False
-
-     # equal to number of channels
-     if not sum(~np.isnan(d)) == n_channel:
-         return False
-
-     return True
-
-
- def dateformat():
-     return "%Y/%m/%d %H:%M:%S"
-
-
- def is_data_row(line: str) -> bool:
-     pattern = re.compile(r"^,\d{4}/\d{2}/\d{2}\s\d{2}:")
-     return bool(pattern.match(line))
-
-
- def is_columns_row(line:str) -> bool:
-     pattern = re.compile(r"^SensorId")
-     return bool(pattern.match(line))
-
-
- def is_label_row(line: str) -> bool:
-     pattern = re.compile(r"^Label")
-     return bool(pattern.match(line))
+ import pandas as pd
+ import regex as re
+ import numpy as np
+ import datetime as dt
+
+
+ class LogR:
+     SEP = ","
+
+     def __init__(self):
+         self.DATA = None
+         self.META = None
+         pass
+
+     def read(self, file: str, cfg_txt: str = None):
+         raw = is_raw_data(file)
+         if raw and cfg_txt is None:
+             raise ValueError("cfg_txt must be specified if providing raw data.")
+
+         if cfg_txt is not None:
+             config_params = read_cfg_file(cfg_txt)
+         else:
+             config_params = None
+
+         header_rows = read_logr_header(file)
+         columns = [line.strip().split(',') for line in header_rows if is_columns_row(line)][0]
+         labels = [line.strip().split(',') for line in header_rows if is_label_row(line)][0]
+         data = pd.read_csv(file, header=len(header_rows) - 1,
+                            names=["TIME" if c == 'timestamp' else c for c in columns])
+         if raw:
+             data = convert_raw_to_temperatures(data=data, channel_metadata=config_params["channel_metadata"])
+         else:
+             data['TIME'] = pd.to_datetime(data['TIME'], format=dateformat())
+             if config_params is not None and "UTC Offset" in config_params.keys():
+                 pattern = re.compile(r"-?\+?\d{2}:?\d{0,2}")
+                 match = pattern.search(config_params["UTC Offset"])
+                 if match is None:
+                     raise ValueError("Could not parse UTC offset")
+                 offset = [int(ele) for ele in match.group().split(":")]
+                 if len(offset) == 1:
+                     tz = dt.timezone(dt.timedelta(hours=offset[0]))
+                 elif len(offset) == 2:
+                     tz = dt.timezone(dt.timedelta(hours=offset[0], minutes=offset[1]))
+                 else:
+                     raise ValueError("Could not parse UTC offset")
+                 data['TIME'] = data['TIME'].dt.tz_localize(tz)
+
+         channels = pd.Series(data.columns).str.match("^CH")
+
+         self.DATA = data
+         self.META = {'label': labels,
+                      'guessed_depths': guess_depths(labels)[-sum(channels):]}
+         if config_params is not None:
+             self.META = self.META | config_params
+
+         return self.DATA
+
+
+ def read_cfg_file(file_path: str):
+     metadata = dict()
+     with open(file_path, "r") as f:
+         for i in range(50):
+             line = f.readline()
+             if line.startswith("ChannelID"):
+                 break
+             if line != "\n":
+                 line = line.split(":")
+                 metadata[line[0].strip()] = line[1].strip()
+     if "Serial Number" in metadata.keys():
+         metadata["logger_sn"] = metadata["Serial Number"]
+         del metadata["Serial Number"]
+     metadata["channel_metadata"] = pd.read_csv(file_path, delimiter="\t", header=len(metadata.keys()),
+                                                index_col="ChannelID")
+     return metadata
+
+
+ def convert_raw_to_temperatures(data: pd.DataFrame, channel_metadata: pd.DataFrame):
+     data["TIME"] = pd.to_datetime(data["TIME"], unit="s", utc=True)
+     voltage_ref = 2.5
+     r_fixed = 7500
+     r_correction = 100
+     for channel in channel_metadata.index:
+         if channel in data.columns:
+             coefficents = {letter: channel_metadata.loc[channel, letter] for letter in ["A", "B", "C", "D", "E"]}
+             resistances = r_fixed / (voltage_ref / data[channel] - 1) - r_correction
+             data[channel] = 1 / (coefficents["A"] + coefficents["B"] * np.log(resistances)
+                                  + coefficents["C"] * np.power(np.log(resistances), 3)
+                                  + coefficents["D"] * np.power(np.log(resistances), 5)) - 273.15
+     return data
+
+
+ def read_logr_header(file: str) -> list:
+     """ Read metadata / header lines from LogR file
+
+     Parameters
+     ----------
+     file : str
+         path to a LogR file
+
+     Returns
+     -------
+     list
+         list of lines in the header block
+
+     Raises
+     ------
+     ValueError
+         _description_
+     """
+     found_data = False
+     max_rows = 50
+     header_lines = list()
+
+     with open(file) as f:
+         while not found_data and max_rows:
+             max_rows -= 1
+             line = f.readline()
+             if is_data_row(line):
+                 found_data = True
+                 break
+             else:
+                 header_lines.append(line)
+     if not found_data:
+         raise ValueError("Could not find start of data")
+     return header_lines
+
+
+ def guess_depths(labels: list[str]) -> list[float]:
+     pattern = re.compile(r"(-?[\d\.]+)")
+
+     matches = [pattern.search(l) for l in labels]
+     depths = [float(d.group(1)) if d else None for d in matches]
+
+     return depths
+
+
+ def guessed_depths_ok(depths, n_channel) -> bool:
+     """ Evaluate whether the guessed depths are valid """
+     d = np.array(depths, dtype='float64')
+
+     # monotonic (by convention)
+     if not (np.diff(d) > 0).all() or (np.diff(d) < 0).all():
+         return False
+
+     # equal to number of channels
+     if not sum(~np.isnan(d)) == n_channel:
+         return False
+
+     return True
+
+
+ def dateformat():
+     return "%Y/%m/%d %H:%M:%S"
+
+
+ def is_data_row(line: str) -> bool:
+     if line == "":
+         return False
+     second_element = line.split(",")[1]
+     try:
+         if second_element.isnumeric():
+             dt.datetime.fromtimestamp(float(second_element))
+         else:
+             dt.datetime.strptime(second_element, dateformat())
+         return True
+     except:
+         return False
+
+
+ def is_raw_data(file: str) -> bool:
+     with open(file) as f:
+         for i in range(50):
+             line = f.readline()
+             if line == "":
+                 continue
+             second_element = line.split(",")[1]
+             try:
+                 if second_element.isnumeric():
+                     dt.datetime.fromtimestamp(float(second_element))
+                     return True
+                 else:
+                     dt.datetime.strptime(second_element, dateformat())
+                     return False
+             except:
+                 pass
+     raise RuntimeError("Could not determine if raw data")
+
+
+ def is_columns_row(line: str) -> bool:
+     pattern = re.compile(r"^SensorId")
+     return bool(pattern.match(line))
+
+
+ def is_label_row(line: str) -> bool:
+     pattern = re.compile(r"^Label")
+     return bool(pattern.match(line))
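The headline change in the rewritten `logr.py` is support for raw (uncalibrated) LogR exports: `is_raw_data()` checks whether the second CSV field is a Unix timestamp rather than a formatted date, `read_cfg_file()` pulls the logger metadata and per-channel calibration table from the companion `*_cfg.txt` file, and `convert_raw_to_temperatures()` recovers each thermistor's resistance from a voltage divider and applies a Steinhart-Hart-style polynomial to get temperature. A worked sketch of that conversion for a single reading; the coefficients here are hypothetical placeholders in the range typical of a 10 kΩ NTC thermistor, not real calibration data:

```python
import math

# Divider constants hard-coded in convert_raw_to_temperatures() above
V_REF = 2.5          # reference voltage (V)
R_FIXED = 7500       # fixed divider resistor (ohm)
R_CORRECTION = 100   # series-resistance correction (ohm)

# Hypothetical calibration coefficients (placeholders only; real values
# come from the ChannelID table in the *_cfg.txt file)
A, B, C, D = 1.129e-3, 2.341e-4, 8.775e-8, 0.0

v = 1.25  # one raw channel sample, read as a voltage

# Thermistor resistance from the voltage divider: 7400 ohm for v = 1.25
r = R_FIXED / (V_REF / v - 1) - R_CORRECTION

# Steinhart-Hart-style expansion: 1/T = A + B*ln(R) + C*ln(R)^3 + D*ln(R)^5
ln_r = math.log(r)
t_kelvin = 1.0 / (A + B * ln_r + C * ln_r ** 3 + D * ln_r ** 5)
print(f"{t_kelvin - 273.15:.2f} °C")  # about 32 °C for these placeholders
```

At the API level this pairs with the raw/cfg test files added above: a raw export is read as `LogR().read("2025004_2025-12-02T17-07-28_raw.csv", cfg_txt="2025004_2025-12-02T17-07-28_cfg.txt")`, and `read()` raises `ValueError` if a raw file is supplied without `cfg_txt`.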