PyPI - geo-explorer - Versions diffs - 0.9.8__tar.gz → 0.9.10__tar.gz - Mend

geo-explorer 0.9.8__tar.gz → 0.9.10__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

{geo_explorer-0.9.8 → geo_explorer-0.9.10}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: geo-explorer
-Version: 0.9.8
+Version: 0.9.10
 Summary: Explore geodata interactively.
 License: MIT
 Author: Morten Letnes
@@ -20,7 +20,7 @@ Requires-Dist: fsspec (>=2024.10.1)
 Requires-Dist: geopandas (>=0.14.0)
 Requires-Dist: jenkspy (>=0.3.2)
 Requires-Dist: matplotlib (>=3.7.0)
-Requires-Dist: msgspec (>=0.19.0,<0.20.0)
+Requires-Dist: msgspec (>=0.19.0)
 Requires-Dist: numpy (>=1.26.4)
 Requires-Dist: pandas (>=2.2.1)
 Requires-Dist: polars (>=1.32.0)

{geo_explorer-0.9.8 → geo_explorer-0.9.10}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "geo-explorer"
-version = "0.9.8"
+version = "0.9.10"
 description = "Explore geodata interactively."
 authors = ["Morten Letnes <morten.letnes@ssb.no>"]
 license = "MIT"
@@ -36,7 +36,8 @@ fsspec = ">=2024.10.1"
 polars = ">=1.32.0"
 dash = ">=2.0.0"
 tzlocal = ">=5.3.1"
-msgspec = "^0.19.0"
+msgspec = ">=0.19.0"
+xarray = { version = ">=2024.3.0", optional = true }
 [tool.poetry.group.dev.dependencies]
 pygments = ">=2.10.0"

{geo_explorer-0.9.8 → geo_explorer-0.9.10}/src/geo_explorer/file_browser.py RENAMED Viewed

@@ -2,6 +2,7 @@ import datetime
 import time
 from concurrent.futures import ThreadPoolExecutor
 from pathlib import Path
+from typing import ClassVar
 import dash
 import dash_bootstrap_components as dbc
@@ -21,6 +22,8 @@ from .utils import get_button_with_tooltip
 class FileBrowser:
+    file_formats: ClassVar[list[str]] = [".parquet", ".tif", ".tiff", ".nc"]
     def __init__(
         self,
         start_dir: str,
@@ -313,7 +316,7 @@ class FileBrowser:
                 ]
                 alert = None
             else:
-                file_data_dict, file_list, alert = _list_dir(
+                file_data_dict, file_list, alert = self._list_dir(
                     path, search_word, case_sensitive, recursive, self.file_system
                 )
                 if sum(sort_by_clicks):
@@ -347,143 +350,162 @@ class FileBrowser:
             return (file_data_dict, file_list, alert, sort_by_clicks, self._history[1:])
-def _list_dir(
-    path: str, containing: str, case_sensitive: bool, recursive: bool, file_system
-):
-    containing = containing or ""
-    containing = [txt.strip() for txt in containing.split(",") if txt.strip()]
-    if (case_sensitive or 0) % 2 == 0:
-        def _contains(path):
-            if not containing:
-                return True
-            return all(
-                any(
-                    txt.strip().lower() in path.lower()
-                    for txt in x.split("|")
-                    if txt.strip()
+    def _list_dir(
+        self,
+        path: str,
+        containing: str,
+        case_sensitive: bool,
+        recursive: bool,
+        file_system,
+    ):
+        containing = containing or ""
+        containing = [txt.strip() for txt in containing.split(",") if txt.strip()]
+        if (case_sensitive or 0) % 2 == 0:
+            def _contains(path):
+                if not containing:
+                    return True
+                return all(
+                    any(
+                        txt.strip().lower() in path.lower()
+                        for txt in x.split("|")
+                        if txt.strip()
+                    )
+                    for x in containing
                 )
-                for x in containing
-            )
-    else:
+        else:
-        def _contains(path):
-            if not containing:
-                return True
-            return all(
-                any(txt.strip() in path for txt in x.split("|") if txt.strip())
-                for x in containing
-            )
+            def _contains(path):
+                if not containing:
+                    return True
+                return all(
+                    any(txt.strip() in path for txt in x.split("|") if txt.strip())
+                    for x in containing
+                )
-    if (recursive or 0) % 2 == 0:
+        if (recursive or 0) % 2 == 0:
-        def _ls(path):
-            return file_system.ls(path, detail=True)
+            def _ls(path):
+                return file_system.ls(path, detail=True)
-    else:
+        else:
-        def _ls(path):
-            path = str(Path(path) / "**")
-            return _try_glob(path, file_system)
+            def _ls(path):
+                path = str(Path(path) / "**")
+                return _try_glob(path, file_system)
-    try:
-        paths = _ls(path)
-    except Exception as e:
         try:
-            paths = _try_glob(path, file_system)
-        except Exception:
-            return (
-                [],
-                [],
-                dbc.Alert(
-                    f"Couldn't list files in {path}. {type(e)}: {e}",
-                    color="warning",
-                    dismissable=True,
-                ),
-            )
-    if not paths:
-        paths = _try_glob(path, file_system)
+            paths = _ls(path)
+        except Exception as e:
+            try:
+                paths = _try_glob(path, file_system)
+            except Exception:
+                return (
+                    [],
+                    [],
+                    dbc.Alert(
+                        f"Couldn't list files in {path}. {type(e)}: {e}",
+                        color="warning",
+                        dismissable=True,
+                    ),
+                )
-    if isinstance(paths, dict):
-        paths = list(paths.values())
+        if not paths:
+            paths = _try_glob(path, file_system)
-    def is_dir_or_is_partitioned_parquet(x) -> bool:
-        return x["type"] == "directory" or any(
-            x["name"].endswith(txt) for txt in [".parquet"]
-        )
+        if isinstance(paths, dict):
+            paths = list(paths.values())
-    paths = [
-        x
-        for x in paths
-        if isinstance(x, dict)
-        and _contains(x["name"])
-        and is_dir_or_is_partitioned_parquet(x)
-        and Path(path).parts != Path(x["name"]).parts
-    ]
-    paths.sort(key=lambda x: x["name"])
-    isdir_list = [x["type"] == "directory" for x in paths]
-    partitioned = {
-        i: x
-        for i, x in enumerate(paths)
-        if x["type"] == "directory"
-        and any(
-            str(x).endswith(".parquet") for x in (x["name"], *Path(x["name"]).parents)
-        )
-    }
+        def is_dir_or_is_partitioned_parquet(x) -> bool:
+            return x["type"] == "directory" or any(
+                x["name"].endswith(txt) for txt in self.file_formats
+            )
-    def get_summed_size_and_latest_timestamp_in_subdirs(
-        x,
-    ) -> tuple[float, datetime.datetime]:
-        file_info = _try_glob(str(Path(x["name"]) / "**/*.parquet"), file_system)
+        paths = [
+            x
+            for x in paths
+            if isinstance(x, dict)
+            and _contains(x["name"])
+            and is_dir_or_is_partitioned_parquet(x)
+            and Path(path).parts != Path(x["name"]).parts
+        ]
-        if isinstance(file_info, dict):
-            file_info = list(file_info.values())
+        paths.sort(key=lambda x: x["name"])
+        isdir_list = [x["type"] == "directory" for x in paths]
-        file_info = [
-            x for x in file_info if isinstance(x, dict) and x["type"] != "directory"
-        ]
-        if not file_info:
-            return 0, str(datetime.datetime.fromtimestamp(0))
-        return sum(x["size"] for x in file_info), max(x["updated"] for x in file_info)
-    with ThreadPoolExecutor() as executor:
-        summed_size_ant_time = list(
-            executor.map(
-                get_summed_size_and_latest_timestamp_in_subdirs, partitioned.values()
+        partitioned = {
+            i: x
+            for i, x in enumerate(paths)
+            if x["type"] == "directory"
+            and any(
+                str(x).endswith(".parquet")
+                for x in (x["name"], *Path(x["name"]).parents)
+            )
+        }
+        def get_summed_size_and_latest_timestamp_in_subdirs(
+            x,
+        ) -> tuple[float, datetime.datetime]:
+            file_info = _try_glob(str(Path(x["name"]) / "**/*.parquet"), file_system)
+            if isinstance(file_info, dict):
+                file_info = list(file_info.values())
+            file_info = [
+                x for x in file_info if isinstance(x, dict) and x["type"] != "directory"
+            ]
+            if not file_info:
+                return 0, str(datetime.datetime.fromtimestamp(0))
+            return sum(x["size"] for x in file_info), max(
+                x["updated"] for x in file_info
             )
-        )
-        for i, (size, timestamp) in zip(partitioned, summed_size_ant_time, strict=True):
-            paths[i]["size"] = size
-            paths[i]["updated"] = timestamp
-    return (
-        paths,
-        [
-            _get_file_list_row(
-                x["name"], x.get("updated", None), x["size"], isdir, path, file_system
+        with ThreadPoolExecutor() as executor:
+            summed_size_ant_time = list(
+                executor.map(
+                    get_summed_size_and_latest_timestamp_in_subdirs,
+                    partitioned.values(),
+                )
             )
-            for x, isdir in zip(paths, isdir_list, strict=True)
-            if isinstance(x, dict)
-        ],
-        None,
-    )
+            for i, (size, timestamp) in zip(
+                partitioned, summed_size_ant_time, strict=True
+            ):
+                paths[i]["size"] = size
+                paths[i]["updated"] = timestamp
+        return (
+            paths,
+            [
+                _get_file_list_row(
+                    x["name"],
+                    x.get("updated", None),
+                    x["size"],
+                    isdir,
+                    path,
+                    self.file_formats,
+                    file_system,
+                )
+                for x, isdir in zip(paths, isdir_list, strict=True)
+                if isinstance(x, dict)
+            ],
+            None,
+        )
-def _get_file_list_row(path, timestamp, size, isdir: bool, current_path, file_system):
+def _get_file_list_row(
+    path, timestamp, size, isdir: bool, current_path, file_formats, file_system
+):
     path = _standardize_path(path)
     timestamp = str(timestamp)[:19]
     mb = str(round(size / 1_000_000, 2))
-    is_loadable = not isdir or (
-        path.endswith(".parquet")
+    is_loadable = not isdir or any(
+        path.endswith(file_format)
         or all(
-            x.endswith(".parquet") or _standardize_path(x) == path
+            x.endswith(file_format) or _standardize_path(x) == path
             for x in file_system.ls(path)
         )
+        for file_format in file_formats
     )
     if is_loadable:
         button = html.Button(

geo-explorer 0.9.8__tar.gz → 0.9.10__tar.gz

geo-explorer 0.9.8__tar.gz → 0.9.10__tar.gz