datachain 0.37.5__py3-none-any.whl → 0.37.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of datachain might be problematic. Click here for more details.

@@ -577,7 +577,8 @@ class DataChain:
577
577
  create=True,
578
578
  )
579
579
  return self._evolve(
580
- query=self._query.save(project=project, feature_schema=schema)
580
+ query=self._query.save(project=project, feature_schema=schema),
581
+ signal_schema=self.signals_schema | SignalSchema({"sys": Sys}),
581
582
  )
582
583
 
583
584
  def _calculate_job_hash(self, job_id: str) -> str:
@@ -630,23 +630,18 @@ class UDFStep(Step, ABC):
630
630
  def apply(
631
631
  self, query_generator: QueryGenerator, temp_tables: list[str]
632
632
  ) -> "StepResult":
633
- _query = query = query_generator.select()
633
+ query, tables = self.process_input_query(query_generator.select())
634
+ _query = query
634
635
 
635
636
  # Apply partitioning if needed.
636
637
  if self.partition_by is not None:
637
- _query = query = self.catalog.warehouse._regenerate_system_columns(
638
- query_generator.select(),
639
- keep_existing_columns=True,
640
- regenerate_columns=["sys__id"],
641
- )
642
638
  partition_tbl = self.create_partitions_table(query)
643
- temp_tables.append(partition_tbl.name)
644
639
  query = query.outerjoin(
645
640
  partition_tbl,
646
641
  partition_tbl.c.sys__id == query.selected_columns.sys__id,
647
642
  ).add_columns(*partition_columns())
643
+ tables = [*tables, partition_tbl]
648
644
 
649
- query, tables = self.process_input_query(query)
650
645
  temp_tables.extend(t.name for t in tables)
651
646
  udf_table = self.create_udf_table(_query)
652
647
  temp_tables.append(udf_table.name)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: datachain
3
- Version: 0.37.5
3
+ Version: 0.37.7
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License-Expression: Apache-2.0
@@ -55,9 +55,9 @@ Provides-Extra: docs
55
55
  Requires-Dist: mkdocs>=1.5.2; extra == "docs"
56
56
  Requires-Dist: mkdocs-gen-files>=0.5.0; extra == "docs"
57
57
  Requires-Dist: mkdocs-material==9.5.22; extra == "docs"
58
- Requires-Dist: mkdocs-section-index>=0.3.6; extra == "docs"
59
58
  Requires-Dist: mkdocstrings-python>=1.6.3; extra == "docs"
60
59
  Requires-Dist: mkdocs-literate-nav>=0.6.1; extra == "docs"
60
+ Requires-Dist: mkdocs-section-index>=0.3.10; extra == "docs"
61
61
  Requires-Dist: eval-type-backport; extra == "docs"
62
62
  Provides-Extra: torch
63
63
  Requires-Dist: torch>=2.1.0; extra == "torch"
@@ -109,7 +109,7 @@ datachain/lib/convert/values_to_tuples.py,sha256=Sxj0ojeMSpAwM_NNoXa1dMR_2L_cQ6X
109
109
  datachain/lib/dc/__init__.py,sha256=UrUzmDH6YyVl8fxM5iXTSFtl5DZTUzEYm1MaazK4vdQ,900
110
110
  datachain/lib/dc/csv.py,sha256=fIfj5-2Ix4z5D5yZueagd5WUWw86pusJ9JJKD-U3KGg,4407
111
111
  datachain/lib/dc/database.py,sha256=Wqob3dQc9Mol_0vagzVEXzteCKS9M0E3U5130KVmQKg,14629
112
- datachain/lib/dc/datachain.py,sha256=RYhinLQ6CMU3tudLpiJGh-vfCL24KDKbKM3Q1EsWoAE,104072
112
+ datachain/lib/dc/datachain.py,sha256=fa7BHEXBCsO_3-zxN0F5zzIdsqDieY6TkcLYx70B11s,104149
113
113
  datachain/lib/dc/datasets.py,sha256=oY1t8QBAaZdhjwR439zZT74hMOspewVCrgdwy6juXng,15321
114
114
  datachain/lib/dc/hf.py,sha256=FeruEO176L2qQ1Mnx0QmK4kV0GuQ4xtj717N8fGJrBI,2849
115
115
  datachain/lib/dc/json.py,sha256=iJ6G0jwTKz8xtfh1eICShnWk_bAMWjF5bFnOXLHaTlw,2683
@@ -132,7 +132,7 @@ datachain/model/ultralytics/pose.py,sha256=pvoXrWWUSWT_UBaMwUb5MBHAY57Co2HFDPigF
132
132
  datachain/model/ultralytics/segment.py,sha256=v9_xDxd5zw_I8rXsbl7yQXgEdTs2T38zyY_Y4XGN8ok,3194
133
133
  datachain/query/__init__.py,sha256=7DhEIjAA8uZJfejruAVMZVcGFmvUpffuZJwgRqNwe-c,263
134
134
  datachain/query/batch.py,sha256=ugTlSFqh_kxMcG6vJ5XrEzG9jBXRdb7KRAEEsFWiPew,4190
135
- datachain/query/dataset.py,sha256=5r7atEt1pTsH8PHKaahKvXEG2zf8L8ZId-rWnbpa6KM,67367
135
+ datachain/query/dataset.py,sha256=kfNh6B6pYSz3batUpwW_6vJ7XRLwLfC08hKOZUMjf3o,67126
136
136
  datachain/query/dispatch.py,sha256=Tg73zB6vDnYYYAvtlS9l7BI3sI1EfRCbDjiasvNxz2s,16385
137
137
  datachain/query/metrics.py,sha256=qOMHiYPTMtVs2zI-mUSy8OPAVwrg4oJtVF85B9tdQyM,810
138
138
  datachain/query/params.py,sha256=JkVz6IKUIpF58JZRkUXFT8DAHX2yfaULbhVaGmHKFLc,826
@@ -165,9 +165,9 @@ datachain/sql/sqlite/vector.py,sha256=ncW4eu2FlJhrP_CIpsvtkUabZlQdl2D5Lgwy_cbfqR
165
165
  datachain/toolkit/__init__.py,sha256=eQ58Q5Yf_Fgv1ZG0IO5dpB4jmP90rk8YxUWmPc1M2Bo,68
166
166
  datachain/toolkit/split.py,sha256=xQzzmvQRKsPteDKbpgOxd4r971BnFaK33mcOl0FuGeI,2883
167
167
  datachain/torch/__init__.py,sha256=gIS74PoEPy4TB3X6vx9nLO0Y3sLJzsA8ckn8pRWihJM,579
168
- datachain-0.37.5.dist-info/licenses/LICENSE,sha256=8DnqK5yoPI_E50bEg_zsHKZHY2HqPy4rYN338BHQaRA,11344
169
- datachain-0.37.5.dist-info/METADATA,sha256=xBtVsgQ5arecWHTP80Cfa2iAIYyaIgMecBIBqv2bH4M,13762
170
- datachain-0.37.5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
171
- datachain-0.37.5.dist-info/entry_points.txt,sha256=0GMJS6B_KWq0m3VT98vQI2YZodAMkn4uReZ_okga9R4,49
172
- datachain-0.37.5.dist-info/top_level.txt,sha256=lZPpdU_2jJABLNIg2kvEOBi8PtsYikbN1OdMLHk8bTg,10
173
- datachain-0.37.5.dist-info/RECORD,,
168
+ datachain-0.37.7.dist-info/licenses/LICENSE,sha256=8DnqK5yoPI_E50bEg_zsHKZHY2HqPy4rYN338BHQaRA,11344
169
+ datachain-0.37.7.dist-info/METADATA,sha256=XAwgoA4w5RvJxX-1AiSoGRFW2_6egaEigJUT-owm77g,13763
170
+ datachain-0.37.7.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
171
+ datachain-0.37.7.dist-info/entry_points.txt,sha256=0GMJS6B_KWq0m3VT98vQI2YZodAMkn4uReZ_okga9R4,49
172
+ datachain-0.37.7.dist-info/top_level.txt,sha256=lZPpdU_2jJABLNIg2kvEOBi8PtsYikbN1OdMLHk8bTg,10
173
+ datachain-0.37.7.dist-info/RECORD,,