lamindb_setup 1.18.2__py3-none-any.whl → 1.19.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- lamindb_setup/__init__.py +4 -19
- lamindb_setup/_cache.py +87 -87
- lamindb_setup/_check.py +7 -7
- lamindb_setup/_check_setup.py +131 -131
- lamindb_setup/_connect_instance.py +443 -438
- lamindb_setup/_delete.py +155 -151
- lamindb_setup/_disconnect.py +38 -38
- lamindb_setup/_django.py +39 -39
- lamindb_setup/_entry_points.py +19 -19
- lamindb_setup/_init_instance.py +423 -429
- lamindb_setup/_migrate.py +331 -327
- lamindb_setup/_register_instance.py +32 -32
- lamindb_setup/_schema.py +27 -27
- lamindb_setup/_schema_metadata.py +451 -451
- lamindb_setup/_set_managed_storage.py +81 -80
- lamindb_setup/_setup_user.py +198 -198
- lamindb_setup/_silence_loggers.py +46 -46
- lamindb_setup/core/__init__.py +25 -34
- lamindb_setup/core/_aws_options.py +276 -266
- lamindb_setup/core/_aws_storage.py +57 -55
- lamindb_setup/core/_clone.py +50 -50
- lamindb_setup/core/_deprecated.py +62 -62
- lamindb_setup/core/_docs.py +14 -14
- lamindb_setup/core/_hub_client.py +288 -294
- lamindb_setup/core/_hub_core.py +0 -2
- lamindb_setup/core/_hub_crud.py +247 -247
- lamindb_setup/core/_hub_utils.py +100 -100
- lamindb_setup/core/_private_django_api.py +80 -80
- lamindb_setup/core/_settings.py +440 -434
- lamindb_setup/core/_settings_instance.py +32 -7
- lamindb_setup/core/_settings_load.py +162 -159
- lamindb_setup/core/_settings_save.py +108 -96
- lamindb_setup/core/_settings_storage.py +433 -433
- lamindb_setup/core/_settings_store.py +162 -92
- lamindb_setup/core/_settings_user.py +55 -55
- lamindb_setup/core/_setup_bionty_sources.py +44 -44
- lamindb_setup/core/cloud_sqlite_locker.py +240 -240
- lamindb_setup/core/django.py +414 -413
- lamindb_setup/core/exceptions.py +1 -1
- lamindb_setup/core/hashing.py +134 -134
- lamindb_setup/core/types.py +1 -1
- lamindb_setup/core/upath.py +1031 -1028
- lamindb_setup/errors.py +72 -70
- lamindb_setup/io.py +423 -416
- lamindb_setup/types.py +17 -17
- {lamindb_setup-1.18.2.dist-info → lamindb_setup-1.19.1.dist-info}/METADATA +4 -2
- lamindb_setup-1.19.1.dist-info/RECORD +51 -0
- {lamindb_setup-1.18.2.dist-info → lamindb_setup-1.19.1.dist-info}/WHEEL +1 -1
- {lamindb_setup-1.18.2.dist-info → lamindb_setup-1.19.1.dist-info/licenses}/LICENSE +201 -201
- lamindb_setup-1.18.2.dist-info/RECORD +0 -51
lamindb_setup/core/exceptions.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
from lamindb_setup.errors import DefaultMessageException # backwards compatibility
|
|
1
|
+
from lamindb_setup.errors import DefaultMessageException # backwards compatibility
|
lamindb_setup/core/hashing.py
CHANGED
|
@@ -1,134 +1,134 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
"""Hashing.
|
|
4
|
-
|
|
5
|
-
.. autosummary::
|
|
6
|
-
:toctree: .
|
|
7
|
-
|
|
8
|
-
hash_set
|
|
9
|
-
hash_file
|
|
10
|
-
|
|
11
|
-
"""
|
|
12
|
-
|
|
13
|
-
import base64
|
|
14
|
-
import hashlib
|
|
15
|
-
import json
|
|
16
|
-
from concurrent.futures import ThreadPoolExecutor
|
|
17
|
-
from typing import TYPE_CHECKING
|
|
18
|
-
|
|
19
|
-
import psutil
|
|
20
|
-
|
|
21
|
-
HASH_LENGTH = 22
|
|
22
|
-
|
|
23
|
-
if TYPE_CHECKING:
|
|
24
|
-
from collections.abc import Iterable
|
|
25
|
-
|
|
26
|
-
from lamindb_setup.types import Path, UPathStr
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
def hash_and_encode_as_b62(s: str) -> str:
|
|
30
|
-
from lamin_utils._base62 import encodebytes
|
|
31
|
-
|
|
32
|
-
return encodebytes(hashlib.md5(s.encode()).digest())
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
def to_b64_str(bstr: bytes):
|
|
36
|
-
b64 = base64.urlsafe_b64encode(bstr).decode().strip("=")
|
|
37
|
-
return b64
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
def b16_to_b64(s: str):
|
|
41
|
-
return to_b64_str(base64.b16decode(s.strip('"'), casefold=True))
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
# a lot to read about this: lamin-notes/2022/hashing
|
|
45
|
-
def hash_set(s: set[str]) -> str:
|
|
46
|
-
join_s = ":".join(sorted(s))
|
|
47
|
-
return hash_string(join_s)[:HASH_LENGTH]
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
def hash_dict(d: dict) -> str:
|
|
51
|
-
return to_b64_str(hashlib.md5(json.dumps(d, sort_keys=True).encode()).digest())[
|
|
52
|
-
:HASH_LENGTH
|
|
53
|
-
]
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
def hash_from_hashes_list(hashes: Iterable[str]) -> str:
|
|
57
|
-
# need to sort below because we don't want the order of parsing the dir to
|
|
58
|
-
# affect the hash
|
|
59
|
-
digests = b"".join(
|
|
60
|
-
hashlib.md5(hash.encode("utf-8")).digest() for hash in sorted(hashes)
|
|
61
|
-
)
|
|
62
|
-
digest = hashlib.md5(digests).digest()
|
|
63
|
-
return to_b64_str(digest)[:HASH_LENGTH]
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
# below is only used when comparing with git's sha1 hashes
|
|
67
|
-
# we don't use it for our own hashes
|
|
68
|
-
def hash_code(file_path: UPathStr) -> hashlib._Hash:
|
|
69
|
-
with open(file_path, "rb") as fp:
|
|
70
|
-
data = fp.read()
|
|
71
|
-
data_size = len(data)
|
|
72
|
-
header = f"blob {data_size}\0".encode()
|
|
73
|
-
blob = header + data
|
|
74
|
-
return hashlib.sha1(blob)
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
def hash_small_bytes(data: bytes) -> str:
|
|
78
|
-
return to_b64_str(hashlib.md5(data).digest())
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
# this is equivalent with hash_file for small files
|
|
82
|
-
def hash_string(string: str) -> str:
|
|
83
|
-
# as we're truncating (not here) at 22 b64, we choose md5 over sha512
|
|
84
|
-
return to_b64_str(hashlib.md5(string.encode("utf-8")).digest())[:HASH_LENGTH]
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
def hash_file(
|
|
88
|
-
file_path: Path,
|
|
89
|
-
file_size: int | None = None,
|
|
90
|
-
chunk_size: int | None = 50 * 1024 * 1024,
|
|
91
|
-
) -> tuple[int, str, str]:
|
|
92
|
-
with open(file_path, "rb") as fp:
|
|
93
|
-
if file_size is None:
|
|
94
|
-
fp.seek(0, 2)
|
|
95
|
-
file_size = fp.tell()
|
|
96
|
-
fp.seek(0, 0)
|
|
97
|
-
if chunk_size is None:
|
|
98
|
-
chunk_size = file_size
|
|
99
|
-
first_chunk = fp.read(chunk_size)
|
|
100
|
-
if file_size <= chunk_size:
|
|
101
|
-
digest = hashlib.md5(first_chunk).digest()
|
|
102
|
-
hash_type = "md5"
|
|
103
|
-
else:
|
|
104
|
-
fp.seek(-chunk_size, 2)
|
|
105
|
-
last_chunk = fp.read(chunk_size)
|
|
106
|
-
digest = hashlib.sha1(
|
|
107
|
-
hashlib.sha1(first_chunk).digest() + hashlib.sha1(last_chunk).digest()
|
|
108
|
-
).digest()
|
|
109
|
-
hash_type = "sha1-fl"
|
|
110
|
-
return file_size, to_b64_str(digest)[:HASH_LENGTH], hash_type
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
def hash_dir(path: Path) -> tuple[int, str, str, int]:
|
|
114
|
-
files = (subpath for subpath in path.rglob("*") if subpath.is_file())
|
|
115
|
-
|
|
116
|
-
def hash_size(file):
|
|
117
|
-
size, hash, _ = hash_file(file)
|
|
118
|
-
return hash, size
|
|
119
|
-
|
|
120
|
-
try:
|
|
121
|
-
n_workers = len(psutil.Process().cpu_affinity())
|
|
122
|
-
except AttributeError:
|
|
123
|
-
n_workers = psutil.cpu_count()
|
|
124
|
-
if n_workers > 1:
|
|
125
|
-
with ThreadPoolExecutor(n_workers) as pool:
|
|
126
|
-
hashes_sizes = pool.map(hash_size, files)
|
|
127
|
-
else:
|
|
128
|
-
hashes_sizes = map(hash_size, files)
|
|
129
|
-
hashes, sizes = zip(*hashes_sizes, strict=False)
|
|
130
|
-
|
|
131
|
-
hash, hash_type = hash_from_hashes_list(hashes), "md5-d"
|
|
132
|
-
n_files = len(hashes)
|
|
133
|
-
size = sum(sizes)
|
|
134
|
-
return size, hash, hash_type, n_files
|
|
1
|
+
"""Hashing.

.. autosummary::
   :toctree: .

   hash_set
   hash_file

"""

# NOTE: the docstring must come first — previously it followed the
# __future__ import and was therefore a plain string expression, leaving
# the module's ``__doc__`` empty. Future imports may follow a docstring.
from __future__ import annotations

import base64
import hashlib
import json
from concurrent.futures import ThreadPoolExecutor
from typing import TYPE_CHECKING

import psutil

# number of base64 characters kept from each digest (~131 bits)
HASH_LENGTH = 22

if TYPE_CHECKING:
    from collections.abc import Iterable

    from lamindb_setup.types import Path, UPathStr
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
def hash_and_encode_as_b62(s: str) -> str:
    """Return the md5 digest of ``s`` encoded as a base62 string."""
    # deferred import: lamin_utils is only needed by this helper
    from lamin_utils._base62 import encodebytes

    digest = hashlib.md5(s.encode()).digest()
    return encodebytes(digest)
|
|
33
|
+
|
|
34
|
+
|
|
35
|
+
def to_b64_str(bstr: bytes):
    """Return ``bstr`` as URL-safe base64 with the trailing ``=`` padding removed."""
    return base64.urlsafe_b64encode(bstr).decode().strip("=")
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
def b16_to_b64(s: str):
    """Re-encode a hex (base16) digest as unpadded URL-safe base64.

    Surrounding double quotes are stripped first; lowercase hex is accepted.
    """
    raw = base64.b16decode(s.strip('"'), casefold=True)
    return to_b64_str(raw)
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
# a lot to read about this: lamin-notes/2022/hashing
|
|
45
|
+
def hash_set(s: set[str]) -> str:
    """Order-independent hash of a set of strings."""
    members = sorted(s)  # canonical order so the hash is deterministic
    # hash_string already truncates to HASH_LENGTH; slicing again is a no-op
    return hash_string(":".join(members))[:HASH_LENGTH]
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
def hash_dict(d: dict) -> str:
    """Hash a JSON-serializable dict via its canonical JSON form."""
    # sort_keys makes the serialization independent of key insertion order
    canonical = json.dumps(d, sort_keys=True).encode()
    digest = hashlib.md5(canonical).digest()
    return to_b64_str(digest)[:HASH_LENGTH]
|
|
54
|
+
|
|
55
|
+
|
|
56
|
+
def hash_from_hashes_list(hashes: Iterable[str]) -> str:
    """Combine individual content hashes into a single truncated digest.

    The hashes are sorted first so the result does not depend on the order
    in which they were produced (e.g. directory traversal order).
    """
    # loop variable renamed `h` — the previous name `hash` shadowed the builtin
    digests = b"".join(
        hashlib.md5(h.encode("utf-8")).digest() for h in sorted(hashes)
    )
    digest = hashlib.md5(digests).digest()
    return to_b64_str(digest)[:HASH_LENGTH]
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
# below is only used when comparing with git's sha1 hashes
# we don't use it for our own hashes
def hash_code(file_path: UPathStr) -> hashlib._Hash:
    """Return the git blob sha1 object for the file at ``file_path``.

    Matches ``git hash-object``: sha1 over ``b"blob <size>\\0"`` + content.
    """
    with open(file_path, "rb") as fp:
        content = fp.read()
    sha = hashlib.sha1(f"blob {len(content)}\0".encode())
    sha.update(content)  # incremental update avoids concatenating a new blob
    return sha
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
def hash_small_bytes(data: bytes) -> str:
    """md5-based hash of an in-memory bytes payload (not truncated)."""
    digest = hashlib.md5(data).digest()
    return to_b64_str(digest)
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
def hash_string(string: str) -> str:
    """Truncated md5 hash of a UTF-8 encoded string.

    Equivalent to :func:`hash_file` for contents that fit in a single chunk.
    """
    # md5 suffices: the digest is truncated to HASH_LENGTH b64 chars anyway,
    # so a longer digest (sha512) would buy nothing
    digest = hashlib.md5(string.encode("utf-8")).digest()
    return to_b64_str(digest)[:HASH_LENGTH]
|
|
85
|
+
|
|
86
|
+
|
|
87
|
+
def hash_file(
    file_path: Path,
    file_size: int | None = None,
    chunk_size: int | None = 50 * 1024 * 1024,
) -> tuple[int, str, str]:
    """Hash a file's content.

    Small files (at most one chunk) get a plain md5 hash; larger files get a
    sha1 over the sha1 digests of their first and last chunks ("sha1-fl").

    Returns:
        Tuple of (file size in bytes, truncated b64 hash, hash type).
    """
    with open(file_path, "rb") as stream:
        if file_size is None:
            stream.seek(0, 2)  # seek to end to measure the size
            file_size = stream.tell()
            stream.seek(0, 0)
        if chunk_size is None:
            chunk_size = file_size  # read the whole file in one go
        head = stream.read(chunk_size)
        if file_size <= chunk_size:
            # whole file fits in one chunk: plain md5
            hash_type = "md5"
            digest = hashlib.md5(head).digest()
        else:
            # large file: hash only the first and last chunks ("fl")
            stream.seek(-chunk_size, 2)
            tail = stream.read(chunk_size)
            hash_type = "sha1-fl"
            digest = hashlib.sha1(
                hashlib.sha1(head).digest() + hashlib.sha1(tail).digest()
            ).digest()
    return file_size, to_b64_str(digest)[:HASH_LENGTH], hash_type
|
|
111
|
+
|
|
112
|
+
|
|
113
|
+
def hash_dir(path: Path) -> tuple[int, str, str, int]:
    """Hash a directory tree.

    Hashes every file under ``path`` (in parallel when more than one CPU is
    available) and combines the per-file hashes order-independently.

    Returns:
        Tuple of (total size in bytes, hash, hash type ``"md5-d"``, file count).
    """
    files = (subpath for subpath in path.rglob("*") if subpath.is_file())

    def hash_size(file):
        # per-file (hash, size) pair
        size, file_hash, _ = hash_file(file)
        return file_hash, size

    try:
        # restrict to the CPUs this process may actually run on
        n_workers = len(psutil.Process().cpu_affinity())
    except AttributeError:  # cpu_affinity is unavailable on e.g. macOS
        # cpu_count() may return None; fall back to sequential hashing then
        n_workers = psutil.cpu_count() or 1
    if n_workers > 1:
        with ThreadPoolExecutor(n_workers) as pool:
            hashes_sizes = list(pool.map(hash_size, files))
    else:
        hashes_sizes = list(map(hash_size, files))
    if not hashes_sizes:
        # empty directory: previously crashed with ValueError when unpacking
        # an empty zip; return the hash of an empty hash list instead
        return 0, hash_from_hashes_list([]), "md5-d", 0
    hashes, sizes = zip(*hashes_sizes, strict=False)

    digest, hash_type = hash_from_hashes_list(hashes), "md5-d"
    n_files = len(hashes)
    size = sum(sizes)
    return size, digest, hash_type, n_files
|
lamindb_setup/core/types.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
from lamindb_setup.types import UPathStr # backward compatibility
|
|
1
|
+
from lamindb_setup.types import UPathStr # backward compatibility
|