datachain-0.13.0-py3-none-any.whl → datachain-0.13.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of datachain might be problematic. Click here for more details.
- datachain/catalog/catalog.py +13 -0
- datachain/diff/__init__.py +8 -5
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info}/METADATA +3 -2
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info}/RECORD +8 -8
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info}/WHEEL +1 -1
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info}/entry_points.txt +0 -0
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info/licenses}/LICENSE +0 -0
- {datachain-0.13.0.dist-info → datachain-0.13.1.dist-info}/top_level.txt +0 -0
datachain/catalog/catalog.py
CHANGED
|
@@ -795,6 +795,19 @@ class Catalog:
|
|
|
795
795
|
try:
|
|
796
796
|
dataset = self.get_dataset(name)
|
|
797
797
|
default_version = dataset.next_version
|
|
798
|
+
|
|
799
|
+
if (description or labels) and (
|
|
800
|
+
dataset.description != description or dataset.labels != labels
|
|
801
|
+
):
|
|
802
|
+
description = description or dataset.description
|
|
803
|
+
labels = labels or dataset.labels
|
|
804
|
+
|
|
805
|
+
self.update_dataset(
|
|
806
|
+
dataset,
|
|
807
|
+
description=description,
|
|
808
|
+
labels=labels,
|
|
809
|
+
)
|
|
810
|
+
|
|
798
811
|
except DatasetNotFoundError:
|
|
799
812
|
schema = {
|
|
800
813
|
c.name: c.type.to_dict() for c in columns if isinstance(c.type, SQLType)
|
datachain/diff/__init__.py
CHANGED
|
@@ -74,6 +74,7 @@ def _compare( # noqa: C901
|
|
|
74
74
|
# all left and right columns
|
|
75
75
|
cols = left.signals_schema.clone_without_sys_signals().db_signals()
|
|
76
76
|
right_cols = right.signals_schema.clone_without_sys_signals().db_signals()
|
|
77
|
+
cols_select = list(left.signals_schema.clone_without_sys_signals().values.keys())
|
|
77
78
|
|
|
78
79
|
# getting correct on and right_on column names
|
|
79
80
|
on = left.signals_schema.resolve(*on).db_signals() # type: ignore[assignment]
|
|
@@ -131,10 +132,12 @@ def _compare( # noqa: C901
|
|
|
131
132
|
# when the row is deleted, we need to take column values from the right chain
|
|
132
133
|
.mutate(
|
|
133
134
|
**{
|
|
134
|
-
f"{
|
|
135
|
-
C(diff_col) == CompareStatus.DELETED,
|
|
135
|
+
f"{l_on}": ifelse(
|
|
136
|
+
C(diff_col) == CompareStatus.DELETED,
|
|
137
|
+
C(f"{rname + l_on if on == right_on else r_on}"),
|
|
138
|
+
C(l_on),
|
|
136
139
|
)
|
|
137
|
-
for
|
|
140
|
+
for l_on, r_on in zip(on, right_on) # type: ignore[arg-type]
|
|
138
141
|
}
|
|
139
142
|
)
|
|
140
143
|
.select_except(ldiff_col, rdiff_col)
|
|
@@ -150,9 +153,9 @@ def _compare( # noqa: C901
|
|
|
150
153
|
dc_diff = dc_diff.filter(C(diff_col) != CompareStatus.DELETED)
|
|
151
154
|
|
|
152
155
|
if status_col:
|
|
153
|
-
|
|
156
|
+
cols_select.append(diff_col)
|
|
154
157
|
|
|
155
|
-
dc_diff = dc_diff.select(*
|
|
158
|
+
dc_diff = dc_diff.select(*cols_select)
|
|
156
159
|
|
|
157
160
|
# final schema is schema from the left chain with status column added if needed
|
|
158
161
|
dc_diff.signals_schema = (
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: datachain
|
|
3
|
-
Version: 0.13.0
|
|
3
|
+
Version: 0.13.1
|
|
4
4
|
Summary: Wrangle unstructured AI data at scale
|
|
5
5
|
Author-email: Dmitry Petrov <support@dvc.org>
|
|
6
6
|
License: Apache-2.0
|
|
@@ -107,6 +107,7 @@ Requires-Dist: accelerate; extra == "examples"
|
|
|
107
107
|
Requires-Dist: huggingface_hub[hf_transfer]; extra == "examples"
|
|
108
108
|
Requires-Dist: ultralytics; extra == "examples"
|
|
109
109
|
Requires-Dist: open_clip_torch; extra == "examples"
|
|
110
|
+
Dynamic: license-file
|
|
110
111
|
|
|
111
112
|
================
|
|
112
113
|
|logo| DataChain
|
|
@@ -17,7 +17,7 @@ datachain/studio.py,sha256=9MEpFPLKI3gG4isKklcfD5BMLeNsSXhtOUboOjW4Fdc,10017
|
|
|
17
17
|
datachain/telemetry.py,sha256=0A4IOPPp9VlP5pyW9eBfaTK3YhHGzHl7dQudQjUAx9A,994
|
|
18
18
|
datachain/utils.py,sha256=CLAYkI7iPbLYw3Pjh5EkWuc2UOs8wEbuXQnqIs4UyV8,14173
|
|
19
19
|
datachain/catalog/__init__.py,sha256=cMZzSz3VoUi-6qXSVaHYN-agxQuAcz2XSqnEPZ55crE,353
|
|
20
|
-
datachain/catalog/catalog.py,sha256=
|
|
20
|
+
datachain/catalog/catalog.py,sha256=C9FmhIDlTePiFZFJ4Yq7pfchNs1nciAVlkijtFLPZy4,60822
|
|
21
21
|
datachain/catalog/datasource.py,sha256=IkGMh0Ttg6Q-9DWfU_H05WUnZepbGa28HYleECi6K7I,1353
|
|
22
22
|
datachain/catalog/loader.py,sha256=AhSQR_-S-9lY3DcXn3PVZv9UtarHOMlDy2x75iDwUjo,6035
|
|
23
23
|
datachain/cli/__init__.py,sha256=YPVkuQ7IezNhtzo5xrfca1hEIiZtFxOlJCOzAOEuxmA,8335
|
|
@@ -50,7 +50,7 @@ datachain/data_storage/schema.py,sha256=qSukry2kINhVw8aj5lQrpe7N90DFeatKIKmDh6jA
|
|
|
50
50
|
datachain/data_storage/serializer.py,sha256=6G2YtOFqqDzJf1KbvZraKGXl2XHZyVml2krunWUum5o,927
|
|
51
51
|
datachain/data_storage/sqlite.py,sha256=KJ8hI0Hrwv9eAA-nLUlw2AYCQxiAAZ12a-ftUBtroNQ,24545
|
|
52
52
|
datachain/data_storage/warehouse.py,sha256=GGtgHcOKjnvHN6CFkGGB8m4CFgPPJBo3f-KHEFEJmDc,30730
|
|
53
|
-
datachain/diff/__init__.py,sha256=
|
|
53
|
+
datachain/diff/__init__.py,sha256=YkGdiDbZIMhAZ2SJ4eSe00HU67VP1P6SL2L_t0ODYMs,9425
|
|
54
54
|
datachain/fs/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
55
55
|
datachain/fs/reference.py,sha256=A8McpXF0CqbXPqanXuvpKu50YLB3a2ZXA3YAPxtBXSM,914
|
|
56
56
|
datachain/fs/utils.py,sha256=s-FkTOCGBk-b6TT3toQH51s9608pofoFjUSTc1yy7oE,825
|
|
@@ -138,9 +138,9 @@ datachain/sql/sqlite/vector.py,sha256=ncW4eu2FlJhrP_CIpsvtkUabZlQdl2D5Lgwy_cbfqR
|
|
|
138
138
|
datachain/toolkit/__init__.py,sha256=eQ58Q5Yf_Fgv1ZG0IO5dpB4jmP90rk8YxUWmPc1M2Bo,68
|
|
139
139
|
datachain/toolkit/split.py,sha256=z3zRJNzjWrpPuRw-zgFbCOBKInyYxJew8ygrYQRQLNc,2930
|
|
140
140
|
datachain/torch/__init__.py,sha256=gIS74PoEPy4TB3X6vx9nLO0Y3sLJzsA8ckn8pRWihJM,579
|
|
141
|
-
datachain-0.13.
|
|
142
|
-
datachain-0.13.
|
|
143
|
-
datachain-0.13.
|
|
144
|
-
datachain-0.13.
|
|
145
|
-
datachain-0.13.
|
|
146
|
-
datachain-0.13.
|
|
141
|
+
datachain-0.13.1.dist-info/licenses/LICENSE,sha256=8DnqK5yoPI_E50bEg_zsHKZHY2HqPy4rYN338BHQaRA,11344
|
|
142
|
+
datachain-0.13.1.dist-info/METADATA,sha256=FUW59zu58aHCBMYTtC_K6DkXYQZXaRQRc1L4wJFcGtc,11373
|
|
143
|
+
datachain-0.13.1.dist-info/WHEEL,sha256=1tXe9gY0PYatrMPMDd6jXqjfpz_B-Wqm32CPfRC58XU,91
|
|
144
|
+
datachain-0.13.1.dist-info/entry_points.txt,sha256=0GMJS6B_KWq0m3VT98vQI2YZodAMkn4uReZ_okga9R4,49
|
|
145
|
+
datachain-0.13.1.dist-info/top_level.txt,sha256=lZPpdU_2jJABLNIg2kvEOBi8PtsYikbN1OdMLHk8bTg,10
|
|
146
|
+
datachain-0.13.1.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|