PyPI - datachain - Versions diffs - 0.14.2__py3-none-any.whl → 0.39.0__py3-none-any.whl - Mend

datachain 0.14.2__py3-none-any.whl → 0.39.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (137)

datachain/__init__.py +20 -0
datachain/asyn.py +11 -12
datachain/cache.py +7 -7
datachain/catalog/__init__.py +2 -2
datachain/catalog/catalog.py +621 -507
datachain/catalog/dependency.py +164 -0
datachain/catalog/loader.py +28 -18
datachain/checkpoint.py +43 -0
datachain/cli/__init__.py +24 -33
datachain/cli/commands/__init__.py +1 -8
datachain/cli/commands/datasets.py +83 -52
datachain/cli/commands/ls.py +17 -17
datachain/cli/commands/show.py +4 -4
datachain/cli/parser/__init__.py +8 -74
datachain/cli/parser/job.py +95 -3
datachain/cli/parser/studio.py +11 -4
datachain/cli/parser/utils.py +1 -2
datachain/cli/utils.py +2 -15
datachain/client/azure.py +4 -4
datachain/client/fsspec.py +45 -28
datachain/client/gcs.py +6 -6
datachain/client/hf.py +29 -2
datachain/client/http.py +157 -0
datachain/client/local.py +15 -11
datachain/client/s3.py +17 -9
datachain/config.py +4 -8
datachain/data_storage/db_engine.py +12 -6
datachain/data_storage/job.py +5 -1
datachain/data_storage/metastore.py +1252 -186
datachain/data_storage/schema.py +58 -45
datachain/data_storage/serializer.py +105 -15
datachain/data_storage/sqlite.py +286 -127
datachain/data_storage/warehouse.py +250 -113
datachain/dataset.py +353 -148
datachain/delta.py +391 -0
datachain/diff/__init__.py +27 -29
datachain/error.py +60 -0
datachain/func/__init__.py +2 -1
datachain/func/aggregate.py +66 -42
datachain/func/array.py +242 -38
datachain/func/base.py +7 -4
datachain/func/conditional.py +110 -60
datachain/func/func.py +96 -45
datachain/func/numeric.py +55 -38
datachain/func/path.py +32 -20
datachain/func/random.py +2 -2
datachain/func/string.py +67 -37
datachain/func/window.py +7 -8
datachain/hash_utils.py +123 -0
datachain/job.py +11 -7
datachain/json.py +138 -0
datachain/lib/arrow.py +58 -22
datachain/lib/audio.py +245 -0
datachain/lib/clip.py +14 -13
datachain/lib/convert/flatten.py +5 -3
datachain/lib/convert/python_to_sql.py +6 -10
datachain/lib/convert/sql_to_python.py +8 -0
datachain/lib/convert/values_to_tuples.py +156 -51
datachain/lib/data_model.py +42 -20
datachain/lib/dataset_info.py +36 -8
datachain/lib/dc/__init__.py +8 -2
datachain/lib/dc/csv.py +25 -28
datachain/lib/dc/database.py +398 -0
datachain/lib/dc/datachain.py +1289 -425
datachain/lib/dc/datasets.py +320 -38
datachain/lib/dc/hf.py +38 -24
datachain/lib/dc/json.py +29 -32
datachain/lib/dc/listings.py +112 -8
datachain/lib/dc/pandas.py +16 -12
datachain/lib/dc/parquet.py +35 -23
datachain/lib/dc/records.py +31 -23
datachain/lib/dc/storage.py +154 -64
datachain/lib/dc/storage_pattern.py +251 -0
datachain/lib/dc/utils.py +24 -16
datachain/lib/dc/values.py +8 -9
datachain/lib/file.py +622 -89
datachain/lib/hf.py +69 -39
datachain/lib/image.py +14 -14
datachain/lib/listing.py +14 -11
datachain/lib/listing_info.py +1 -2
datachain/lib/meta_formats.py +3 -4
datachain/lib/model_store.py +39 -7
datachain/lib/namespaces.py +125 -0
datachain/lib/projects.py +130 -0
datachain/lib/pytorch.py +32 -21
datachain/lib/settings.py +192 -56
datachain/lib/signal_schema.py +427 -104
datachain/lib/tar.py +1 -2
datachain/lib/text.py +8 -7
datachain/lib/udf.py +164 -76
datachain/lib/udf_signature.py +60 -35
datachain/lib/utils.py +118 -4
datachain/lib/video.py +17 -9
datachain/lib/webdataset.py +61 -56
datachain/lib/webdataset_laion.py +15 -16
datachain/listing.py +22 -10
datachain/model/bbox.py +3 -1
datachain/model/ultralytics/bbox.py +16 -12
datachain/model/ultralytics/pose.py +16 -12
datachain/model/ultralytics/segment.py +16 -12
datachain/namespace.py +84 -0
datachain/node.py +6 -6
datachain/nodes_thread_pool.py +0 -1
datachain/plugins.py +24 -0
datachain/project.py +78 -0
datachain/query/batch.py +40 -41
datachain/query/dataset.py +604 -322
datachain/query/dispatch.py +261 -154
datachain/query/metrics.py +4 -6
datachain/query/params.py +2 -3
datachain/query/queue.py +3 -12
datachain/query/schema.py +11 -6
datachain/query/session.py +200 -33
datachain/query/udf.py +34 -2
datachain/remote/studio.py +171 -69
datachain/script_meta.py +12 -12
datachain/semver.py +68 -0
datachain/sql/__init__.py +2 -0
datachain/sql/functions/array.py +33 -1
datachain/sql/postgresql_dialect.py +9 -0
datachain/sql/postgresql_types.py +21 -0
datachain/sql/sqlite/__init__.py +5 -1
datachain/sql/sqlite/base.py +102 -29
datachain/sql/sqlite/types.py +8 -13
datachain/sql/types.py +70 -15
datachain/studio.py +223 -46
datachain/toolkit/split.py +31 -10
datachain/utils.py +101 -59
{datachain-0.14.2.dist-info → datachain-0.39.0.dist-info}/METADATA +77 -22
datachain-0.39.0.dist-info/RECORD +173 -0
{datachain-0.14.2.dist-info → datachain-0.39.0.dist-info}/WHEEL +1 -1
datachain/cli/commands/query.py +0 -53
datachain/query/utils.py +0 -42
datachain-0.14.2.dist-info/RECORD +0 -158
{datachain-0.14.2.dist-info → datachain-0.39.0.dist-info}/entry_points.txt +0 -0
{datachain-0.14.2.dist-info → datachain-0.39.0.dist-info}/licenses/LICENSE +0 -0
{datachain-0.14.2.dist-info → datachain-0.39.0.dist-info}/top_level.txt +0 -0

datachain/func/path.py CHANGED Viewed

@@ -8,23 +8,26 @@ def parent(col: ColT) -> Func:
     Returns the directory component of a posix-style path.
     Args:
-        col (str | literal | Func): String to compute the path parent of.
+        col (str | Column | Func | literal): String to compute the path parent of.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column object.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the path parent function.
+        Func: A `Func` object that represents the path parent function.
     Example:
         ```py
         dc.mutate(
-            parent=func.path.parent("file.path"),
+            parent1=func.path.parent("file.path"),
+            parent2=func.path.parent(dc.C("file.path")),
+            parent3=func.path.parent(dc.func.literal("/path/to/file.txt")),
         )
         ```
     Note:
-        - Result column will always be of type string.
+        - The result column will always be of type string.
     """
     return Func("parent", inner=path.parent, cols=[col], result_type=str)
@@ -34,23 +37,26 @@ def name(col: ColT) -> Func:
     Returns the final component of a posix-style path.
     Args:
-        col (str | literal): String to compute the path name of.
+        col (str | Column | Func | literal): String to compute the path name of.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column object.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the path name function.
+        Func: A `Func` object that represents the path name function.
     Example:
         ```py
         dc.mutate(
-            file_name=func.path.name("file.path"),
+            filename1=func.path.name("file.path"),
+            filename2=func.path.name(dc.C("file.path")),
+            filename3=func.path.name(dc.func.literal("/path/to/file.txt")
         )
         ```
     Note:
-        - Result column will always be of type string.
+        - The result column will always be of type string.
     """
     return Func("name", inner=path.name, cols=[col], result_type=str)
@@ -61,23 +67,26 @@ def file_stem(col: ColT) -> Func:
     Returns the path without the extension.
     Args:
-        col (str | literal): String to compute the file stem of.
+        col (str | Column | Func | literal): String to compute the file stem of.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column object.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the file stem function.
+        Func: A `Func` object that represents the file stem function.
     Example:
         ```py
         dc.mutate(
-            file_stem=func.path.file_stem("file.path"),
+            filestem1=func.path.file_stem("file.path"),
+            filestem2=func.path.file_stem(dc.C("file.path")),
+            filestem3=func.path.file_stem(dc.func.literal("/path/to/file.txt")
         )
         ```
     Note:
-        - Result column will always be of type string.
+        - The result column will always be of type string.
     """
     return Func("file_stem", inner=path.file_stem, cols=[col], result_type=str)
@@ -88,23 +97,26 @@ def file_ext(col: ColT) -> Func:
     Returns the extension of the given path.
     Args:
-        col (str | literal): String to compute the file extension of.
+        col (str | Column | Func | literal): String to compute the file extension of.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column object.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the file extension function.
+        Func: A `Func` object that represents the file extension function.
     Example:
         ```py
         dc.mutate(
-            file_stem=func.path.file_ext("file.path"),
+            filestem1=func.path.file_ext("file.path"),
+            filestem2=func.path.file_ext(dc.C("file.path")),
+            filestem3=func.path.file_ext(dc.func.literal("/path/to/file.txt")
         )
         ```
     Note:
-        - Result column will always be of type string.
+        - The result column will always be of type string.
     """
     return Func("file_ext", inner=path.file_ext, cols=[col], result_type=str)

datachain/func/random.py CHANGED Viewed

@@ -8,7 +8,7 @@ def rand() -> Func:
     Returns the random integer value.
     Returns:
-        Func: A Func object that represents the rand function.
+        Func: A `Func` object that represents the rand function.
     Example:
         ```py
@@ -18,6 +18,6 @@ def rand() -> Func:
         ```
     Note:
-        - Result column will always be of type integer.
+        - The result column will always be of type integer.
     """
     return Func("rand", inner=random.rand, result_type=int)

datachain/func/string.py CHANGED Viewed

@@ -1,64 +1,76 @@
-from typing import Optional, Union, get_origin
+from typing import get_origin
 from sqlalchemy import literal
 from datachain.sql.functions import string
-from .func import Func
+from .func import ColT, Func
+__all__ = [
+    "byte_hamming_distance",
+    "length",
+    "regexp_replace",
+    "replace",
+    "split",
+]
-def length(col: Union[str, Func]) -> Func:
+def length(col: ColT) -> Func:
     """
     Returns the length of the string.
     Args:
-        col (str | literal | Func): String to compute the length of.
+        col (str | Column | Func | literal): String to compute the length of.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column in the dataset.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the string length function.
+        Func: A `Func` object that represents the string length function.
     Example:
         ```py
         dc.mutate(
             len1=func.string.length("file.path"),
-            len2=func.string.length("Random string"),
+            len2=func.string.length(dc.C("file.path")),
+            len3=func.string.length(dc.func.literal("Random string")),
         )
         ```
-    Note:
-        - Result column will always be of type int.
+    Notes:
+        - The result column will always be of type int.
     """
     return Func("length", inner=string.length, cols=[col], result_type=int)
-def split(col: Union[str, Func], sep: str, limit: Optional[int] = None) -> Func:
+def split(col: ColT, sep: str, limit: int | None = None) -> Func:
     """
     Takes a column and split character and returns an array of the parts.
     Args:
-        col (str | literal): Column to split.
+        col (str | Column | Func | literal): Column to split.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column in the dataset.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
         sep (str): Separator to split the string.
         limit (int, optional): Maximum number of splits to perform.
     Returns:
-        Func: A Func object that represents the split function.
+        Func: A `Func` object that represents the split function.
     Example:
         ```py
         dc.mutate(
             path_parts=func.string.split("file.path", "/"),
-            str_words=func.string.length("Random string", " "),
+            signal_values=func.string.split(dc.C("signal.value"), ","),
+            str_words=func.string.split(dc.func.literal("Random string"), " "),
         )
         ```
-    Note:
-        - Result column will always be of type array of strings.
+    Notes:
+        - The result column will always be of type array of strings.
     """
     def inner(arg):
@@ -76,30 +88,33 @@ def split(col: Union[str, Func], sep: str, limit: Optional[int] = None) -> Func:
     return Func("split", inner=inner, cols=cols, args=args, result_type=list[str])
-def replace(col: Union[str, Func], pattern: str, replacement: str) -> Func:
+def replace(col: ColT, pattern: str, replacement: str) -> Func:
     """
     Replaces substring with another string.
     Args:
-        col (str | literal): Column to split.
+        col (str | Column | Func | literal): Column to perform replacement on.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column in the dataset.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
         pattern (str): Pattern to replace.
         replacement (str): Replacement string.
     Returns:
-        Func: A Func object that represents the replace function.
+        Func: A `Func` object that represents the replace function.
     Example:
         ```py
         dc.mutate(
-            signal=func.string.replace("signal.name", "pattern", "replacement),
+            s1=func.string.replace("signal.name", "pattern", "replacement"),
+            s2=func.string.replace(dc.C("signal.name"), "pattern", "replacement"),
+            s3=func.string.replace(dc.func.literal("Random string"), "Random", "New"),
         )
         ```
-    Note:
-        - Result column will always be of type string.
+    Notes:
+        - The result column will always be of type string.
     """
     def inner(arg):
@@ -115,30 +130,37 @@ def replace(col: Union[str, Func], pattern: str, replacement: str) -> Func:
     return Func("replace", inner=inner, cols=cols, args=args, result_type=str)
-def regexp_replace(col: Union[str, Func], regex: str, replacement: str) -> Func:
+def regexp_replace(col: ColT, regex: str, replacement: str) -> Func:
     r"""
     Replaces substring that match a regular expression.
     Args:
-        col (str | literal): Column to split.
+        col (str | Column | Func | literal): Column to perform replacement on.
             If a string is provided, it is assumed to be the name of the column.
-            If a literal is provided, it is assumed to be a string literal.
+            If a Column is provided, it is assumed to be a column in the dataset.
             If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
         regex (str): Regular expression pattern to replace.
         replacement (str): Replacement string.
     Returns:
-        Func: A Func object that represents the regexp_replace function.
+        Func: A `Func` object that represents the regexp_replace function.
     Example:
         ```py
         dc.mutate(
-            signal=func.string.regexp_replace("signal.name", r"\d+", "X"),
+            s1=func.string.regexp_replace("signal.name", r"\d+", "X"),
+            s2=func.string.regexp_replace(dc.C("signal.name"), r"\d+", "X"),
+            s3=func.string.regexp_replace(
+                dc.func.literal("Random string"),
+                r"\s+",
+                "_",
+            ),
         )
         ```
-    Note:
-        - Result column will always be of type string.
+    Notes:
+        - The result column will always be of type string.
     """
     def inner(arg):
@@ -154,7 +176,7 @@ def regexp_replace(col: Union[str, Func], regex: str, replacement: str) -> Func:
     return Func("regexp_replace", inner=inner, cols=cols, args=args, result_type=str)
-def byte_hamming_distance(*args: Union[str, Func]) -> Func:
+def byte_hamming_distance(*args: ColT) -> Func:
     """
     Computes the Hamming distance between two strings.
@@ -164,22 +186,30 @@ def byte_hamming_distance(*args: Union[str, Func]) -> Func:
     of the strings indicate higher dissimilarity.
     Args:
-        args (str | literal): Two strings to compute the Hamming distance between.
-            If a str is provided, it is assumed to be the name of the column.
-            If a Literal is provided, it is assumed to be a string literal.
+        args (str | Column | Func | literal): Two strings to compute
+            the Hamming distance between.
+            If a string is provided, it is assumed to be the name of the column.
+            If a Column is provided, it is assumed to be a column in the dataset.
+            If a Func is provided, it is assumed to be a function returning a string.
+            If a literal is provided, it is assumed to be a string literal.
     Returns:
-        Func: A Func object that represents the Hamming distance function.
+        Func: A `Func` object that represents the Hamming distance function.
     Example:
         ```py
         dc.mutate(
-            ham_dist=func.byte_hamming_distance("file.phash", literal("hello")),
+            hd1=func.byte_hamming_distance("file.phash", literal("hello")),
+            hd2=func.byte_hamming_distance(dc.C("file.phash"), "hello"),
+            hd3=func.byte_hamming_distance(
+                dc.func.literal("hi"),
+                dc.func.literal("hello"),
+            ),
         )
         ```
     Notes:
-        - Result column will always be of type int.
+        - The result column will always be of type int.
     """
     cols, func_args = [], []
     for arg in args:

datachain/func/window.py CHANGED Viewed

@@ -22,17 +22,16 @@ def window(partition_by: str, order_by: str, desc: bool = False) -> Window:
     Args:
         partition_by (str): The column name by which to partition the result set.
-                            Rows with the same value in the partition column
-                            will be grouped together for the window function.
-        order_by (str): The column name by which to order the rows
-                        within each partition. This determines the sequence in which
-                        the window function is applied.
+            Rows with the same value in the partition column will be grouped together
+            for the window function.
+        order_by (str): The column name by which to order the rows within
+            each partition. This determines the sequence in which the window function
+            is applied.
         desc (bool, optional): If True, the rows will be ordered in descending order.
-                               Defaults to False, which orders the rows
-                               in ascending order.
+            Defaults to False, which orders the rows in ascending order.
     Returns:
-        Window: A Window object representing the window specification.
+        Window: A `Window` object representing the window specification.
     Example:
         ```py

datachain/hash_utils.py ADDED Viewed

@@ -0,0 +1,123 @@
+import hashlib
+import inspect
+import textwrap
+from collections.abc import Sequence
+from typing import TypeAlias, TypeVar
+from sqlalchemy.sql.elements import ClauseElement, ColumnElement
+from datachain import json
+T = TypeVar("T", bound=ColumnElement)
+ColumnLike: TypeAlias = str | T
+def _serialize_value(val):  # noqa: PLR0911
+    """Helper to serialize arbitrary values recursively."""
+    if val is None:
+        return None
+    if isinstance(val, (str, int, float, bool)):
+        return val
+    if isinstance(val, ClauseElement):
+        return serialize_column_element(val)
+    if isinstance(val, dict):
+        # Sort dict keys for deterministic serialization
+        return {k: _serialize_value(v) for k, v in sorted(val.items())}
+    if isinstance(val, (list, tuple)):
+        return [_serialize_value(v) for v in val]
+    if callable(val):
+        return val.__name__ if hasattr(val, "__name__") else str(val)
+    return str(val)
+def serialize_column_element(expr: str | ColumnElement) -> dict:
+    """
+    Recursively serialize a SQLAlchemy ColumnElement into a deterministic structure.
+    Uses SQLAlchemy's _traverse_internals to automatically handle all expression types.
+    """
+    from sqlalchemy.sql.elements import BindParameter
+    # Special case: BindParameter has non-deterministic 'key' attribute, only use value
+    if isinstance(expr, BindParameter):
+        return {"type": "bind", "value": _serialize_value(expr.value)}
+    # Generic handling for all ClauseElement types using SQLAlchemy's internals
+    if isinstance(expr, ClauseElement):
+        # All standard SQLAlchemy types have _traverse_internals
+        if hasattr(expr, "_traverse_internals"):
+            result = {"type": expr.__class__.__name__}
+            for attr_name, _ in expr._traverse_internals:
+                # Skip 'table' attribute - table names can be auto-generated/random
+                # and are not semantically important for hashing
+                if attr_name == "table":
+                    continue
+                if hasattr(expr, attr_name):
+                    val = getattr(expr, attr_name)
+                    result[attr_name] = _serialize_value(val)
+            return result
+        # Rare case: custom user-defined ClauseElement without _traverse_internals
+        # We don't know its structure, so just stringify it
+        return {"type": expr.__class__.__name__, "repr": str(expr)}
+    # Absolute fallback: stringify completely unknown types
+    return {"type": "other", "repr": str(expr)}
+def hash_column_elements(columns: ColumnLike | Sequence[ColumnLike]) -> str:
+    """
+    Hash a list of ColumnElements deterministically, dialect agnostic.
+    Only accepts ordered iterables (like list or tuple).
+    """
+    # Handle case where a single ColumnElement is passed instead of a sequence
+    if isinstance(columns, (ColumnElement, str)):
+        columns = (columns,)
+    serialized = [serialize_column_element(c) for c in columns]
+    json_str = json.dumps(
+        serialized, sort_keys=True, separators=(", ", ": ")
+    )  # stable JSON
+    return hashlib.sha256(json_str.encode("utf-8")).hexdigest()
+def hash_callable(func):
+    """
+    Calculate a hash from a callable.
+    Rules:
+    - Named functions (def) → use source code for stable, cross-version hashing
+    - Lambdas → use bytecode (deterministic in same Python runtime)
+    """
+    if not callable(func):
+        raise TypeError("Expected a callable")
+    # Determine if it is a lambda
+    is_lambda = func.__name__ == "<lambda>"
+    if not is_lambda:
+        # Try to get exact source of named function
+        try:
+            lines, _ = inspect.getsourcelines(func)
+            payload = textwrap.dedent("".join(lines)).strip()
+        except (OSError, TypeError):
+            # Fallback: bytecode if source not available
+            payload = func.__code__.co_code
+    else:
+        # For lambdas, fall back directly to bytecode
+        payload = func.__code__.co_code
+    # Normalize annotations
+    annotations = {
+        k: getattr(v, "__name__", str(v)) for k, v in func.__annotations__.items()
+    }
+    # Extras to distinguish functions with same code but different metadata
+    extras = {
+        "name": func.__name__,
+        "defaults": func.__defaults__,
+        "annotations": annotations,
+    }
+    # Compute SHA256
+    h = hashlib.sha256()
+    h.update(str(payload).encode() if isinstance(payload, str) else payload)
+    h.update(str(extras).encode())
+    return h.hexdigest()

datachain/job.py CHANGED Viewed

@@ -1,8 +1,9 @@
-import json
 import uuid
 from dataclasses import dataclass
 from datetime import datetime
-from typing import Any, Optional, TypeVar, Union
+from typing import Any, TypeVar
+from datachain import json
 J = TypeVar("J", bound="Job")
@@ -18,27 +19,29 @@ class Job:
     workers: int
     params: dict[str, str]
     metrics: dict[str, Any]
-    finished_at: Optional[datetime] = None
-    python_version: Optional[str] = None
+    finished_at: datetime | None = None
+    python_version: str | None = None
     error_message: str = ""
     error_stack: str = ""
+    parent_job_id: str | None = None
     @classmethod
     def parse(
         cls,
-        id: Union[str, uuid.UUID],
+        id: str | uuid.UUID,
         name: str,
         status: int,
         created_at: datetime,
-        finished_at: Optional[datetime],
+        finished_at: datetime | None,
         query: str,
         query_type: int,
         workers: int,
-        python_version: Optional[str],
+        python_version: str | None,
         error_message: str,
         error_stack: str,
         params: str,
         metrics: str,
+        parent_job_id: str | None,
     ) -> "Job":
         return cls(
             str(id),
@@ -54,4 +57,5 @@ class Job:
             python_version,
             error_message,
             error_stack,
+            str(parent_job_id) if parent_job_id else None,
         )

datachain 0.14.2__py3-none-any.whl → 0.39.0__py3-none-any.whl

datachain 0.14.2__py3-none-any.whl → 0.39.0__py3-none-any.whl