datachain 0.6.6__tar.gz → 0.6.7__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of datachain might be problematic. Click here for more details.

Files changed (257):
  1. {datachain-0.6.6 → datachain-0.6.7}/.github/workflows/tests-studio.yml +2 -5
  2. {datachain-0.6.6/src/datachain.egg-info → datachain-0.6.7}/PKG-INFO +1 -1
  3. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/catalog/catalog.py +2 -6
  4. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/schema.py +4 -2
  5. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/types.py +2 -0
  6. {datachain-0.6.6 → datachain-0.6.7/src/datachain.egg-info}/PKG-INFO +1 -1
  7. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_datasets.py +2 -5
  8. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_pull.py +4 -6
  9. {datachain-0.6.6 → datachain-0.6.7}/.cruft.json +0 -0
  10. {datachain-0.6.6 → datachain-0.6.7}/.gitattributes +0 -0
  11. {datachain-0.6.6 → datachain-0.6.7}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
  12. {datachain-0.6.6 → datachain-0.6.7}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
  13. {datachain-0.6.6 → datachain-0.6.7}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
  14. {datachain-0.6.6 → datachain-0.6.7}/.github/codecov.yaml +0 -0
  15. {datachain-0.6.6 → datachain-0.6.7}/.github/dependabot.yml +0 -0
  16. {datachain-0.6.6 → datachain-0.6.7}/.github/workflows/benchmarks.yml +0 -0
  17. {datachain-0.6.6 → datachain-0.6.7}/.github/workflows/release.yml +0 -0
  18. {datachain-0.6.6 → datachain-0.6.7}/.github/workflows/tests.yml +0 -0
  19. {datachain-0.6.6 → datachain-0.6.7}/.github/workflows/update-template.yaml +0 -0
  20. {datachain-0.6.6 → datachain-0.6.7}/.gitignore +0 -0
  21. {datachain-0.6.6 → datachain-0.6.7}/.pre-commit-config.yaml +0 -0
  22. {datachain-0.6.6 → datachain-0.6.7}/CODE_OF_CONDUCT.rst +0 -0
  23. {datachain-0.6.6 → datachain-0.6.7}/CONTRIBUTING.rst +0 -0
  24. {datachain-0.6.6 → datachain-0.6.7}/LICENSE +0 -0
  25. {datachain-0.6.6 → datachain-0.6.7}/README.rst +0 -0
  26. {datachain-0.6.6 → datachain-0.6.7}/docs/assets/captioned_cartoons.png +0 -0
  27. {datachain-0.6.6 → datachain-0.6.7}/docs/assets/datachain-white.svg +0 -0
  28. {datachain-0.6.6 → datachain-0.6.7}/docs/assets/datachain.svg +0 -0
  29. {datachain-0.6.6 → datachain-0.6.7}/docs/assets/flowchart.png +0 -0
  30. {datachain-0.6.6 → datachain-0.6.7}/docs/index.md +0 -0
  31. {datachain-0.6.6 → datachain-0.6.7}/docs/references/datachain.md +0 -0
  32. {datachain-0.6.6 → datachain-0.6.7}/docs/references/datatype.md +0 -0
  33. {datachain-0.6.6 → datachain-0.6.7}/docs/references/file.md +0 -0
  34. {datachain-0.6.6 → datachain-0.6.7}/docs/references/index.md +0 -0
  35. {datachain-0.6.6 → datachain-0.6.7}/docs/references/sql.md +0 -0
  36. {datachain-0.6.6 → datachain-0.6.7}/docs/references/torch.md +0 -0
  37. {datachain-0.6.6 → datachain-0.6.7}/docs/references/udf.md +0 -0
  38. {datachain-0.6.6 → datachain-0.6.7}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
  39. {datachain-0.6.6 → datachain-0.6.7}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
  40. {datachain-0.6.6 → datachain-0.6.7}/examples/computer_vision/openimage-detect.py +0 -0
  41. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/common_sql_functions.py +0 -0
  42. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/json-csv-reader.py +0 -0
  43. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/torch-loader.py +0 -0
  44. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/udfs/parallel.py +0 -0
  45. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/udfs/simple.py +0 -0
  46. {datachain-0.6.6 → datachain-0.6.7}/examples/get_started/udfs/stateful.py +0 -0
  47. {datachain-0.6.6 → datachain-0.6.7}/examples/llm_and_nlp/claude-query.py +0 -0
  48. {datachain-0.6.6 → datachain-0.6.7}/examples/llm_and_nlp/hf-dataset-llm-eval.py +0 -0
  49. {datachain-0.6.6 → datachain-0.6.7}/examples/llm_and_nlp/unstructured-embeddings-gen.py +0 -0
  50. {datachain-0.6.6 → datachain-0.6.7}/examples/llm_and_nlp/unstructured-summary-map.py +0 -0
  51. {datachain-0.6.6 → datachain-0.6.7}/examples/multimodal/clip_inference.py +0 -0
  52. {datachain-0.6.6 → datachain-0.6.7}/examples/multimodal/hf_pipeline.py +0 -0
  53. {datachain-0.6.6 → datachain-0.6.7}/examples/multimodal/openai_image_desc_lib.py +0 -0
  54. {datachain-0.6.6 → datachain-0.6.7}/examples/multimodal/wds.py +0 -0
  55. {datachain-0.6.6 → datachain-0.6.7}/examples/multimodal/wds_filtered.py +0 -0
  56. {datachain-0.6.6 → datachain-0.6.7}/mkdocs.yml +0 -0
  57. {datachain-0.6.6 → datachain-0.6.7}/noxfile.py +0 -0
  58. {datachain-0.6.6 → datachain-0.6.7}/overrides/main.html +0 -0
  59. {datachain-0.6.6 → datachain-0.6.7}/pyproject.toml +0 -0
  60. {datachain-0.6.6 → datachain-0.6.7}/setup.cfg +0 -0
  61. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/__init__.py +0 -0
  62. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/__main__.py +0 -0
  63. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/asyn.py +0 -0
  64. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/cache.py +0 -0
  65. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/catalog/__init__.py +0 -0
  66. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/catalog/datasource.py +0 -0
  67. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/catalog/loader.py +0 -0
  68. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/cli.py +0 -0
  69. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/cli_utils.py +0 -0
  70. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/__init__.py +0 -0
  71. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/azure.py +0 -0
  72. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/fileslice.py +0 -0
  73. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/fsspec.py +0 -0
  74. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/gcs.py +0 -0
  75. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/hf.py +0 -0
  76. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/local.py +0 -0
  77. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/client/s3.py +0 -0
  78. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/config.py +0 -0
  79. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/__init__.py +0 -0
  80. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/db_engine.py +0 -0
  81. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/id_generator.py +0 -0
  82. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/job.py +0 -0
  83. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/metastore.py +0 -0
  84. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/serializer.py +0 -0
  85. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/sqlite.py +0 -0
  86. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/data_storage/warehouse.py +0 -0
  87. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/dataset.py +0 -0
  88. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/error.py +0 -0
  89. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/job.py +0 -0
  90. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/__init__.py +0 -0
  91. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/arrow.py +0 -0
  92. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/clip.py +0 -0
  93. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/__init__.py +0 -0
  94. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/flatten.py +0 -0
  95. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/python_to_sql.py +0 -0
  96. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/sql_to_python.py +0 -0
  97. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/unflatten.py +0 -0
  98. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/convert/values_to_tuples.py +0 -0
  99. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/data_model.py +0 -0
  100. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/dataset_info.py +0 -0
  101. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/dc.py +0 -0
  102. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/file.py +0 -0
  103. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/func/__init__.py +0 -0
  104. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/func/aggregate.py +0 -0
  105. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/func/func.py +0 -0
  106. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/hf.py +0 -0
  107. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/image.py +0 -0
  108. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/listing.py +0 -0
  109. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/listing_info.py +0 -0
  110. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/meta_formats.py +0 -0
  111. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/model_store.py +0 -0
  112. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/pytorch.py +0 -0
  113. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/settings.py +0 -0
  114. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/signal_schema.py +0 -0
  115. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/tar.py +0 -0
  116. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/text.py +0 -0
  117. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/udf.py +0 -0
  118. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/udf_signature.py +0 -0
  119. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/utils.py +0 -0
  120. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/vfile.py +0 -0
  121. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/webdataset.py +0 -0
  122. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/lib/webdataset_laion.py +0 -0
  123. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/listing.py +0 -0
  124. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/node.py +0 -0
  125. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/nodes_fetcher.py +0 -0
  126. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/nodes_thread_pool.py +0 -0
  127. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/progress.py +0 -0
  128. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/py.typed +0 -0
  129. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/__init__.py +0 -0
  130. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/batch.py +0 -0
  131. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/dataset.py +0 -0
  132. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/dispatch.py +0 -0
  133. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/metrics.py +0 -0
  134. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/params.py +0 -0
  135. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/queue.py +0 -0
  136. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/schema.py +0 -0
  137. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/query/session.py +0 -0
  138. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/remote/__init__.py +0 -0
  139. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/remote/studio.py +0 -0
  140. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/__init__.py +0 -0
  141. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/default/__init__.py +0 -0
  142. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/default/base.py +0 -0
  143. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/__init__.py +0 -0
  144. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/aggregate.py +0 -0
  145. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/array.py +0 -0
  146. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/conditional.py +0 -0
  147. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/path.py +0 -0
  148. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/random.py +0 -0
  149. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/functions/string.py +0 -0
  150. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/selectable.py +0 -0
  151. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/sqlite/__init__.py +0 -0
  152. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/sqlite/base.py +0 -0
  153. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/sqlite/types.py +0 -0
  154. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/sqlite/vector.py +0 -0
  155. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/sql/utils.py +0 -0
  156. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/studio.py +0 -0
  157. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/telemetry.py +0 -0
  158. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/torch/__init__.py +0 -0
  159. {datachain-0.6.6 → datachain-0.6.7}/src/datachain/utils.py +0 -0
  160. {datachain-0.6.6 → datachain-0.6.7}/src/datachain.egg-info/SOURCES.txt +0 -0
  161. {datachain-0.6.6 → datachain-0.6.7}/src/datachain.egg-info/dependency_links.txt +0 -0
  162. {datachain-0.6.6 → datachain-0.6.7}/src/datachain.egg-info/entry_points.txt +0 -0
  163. {datachain-0.6.6 → datachain-0.6.7}/src/datachain.egg-info/requires.txt +0 -0
  164. {datachain-0.6.6 → datachain-0.6.7}/src/datachain.egg-info/top_level.txt +0 -0
  165. {datachain-0.6.6 → datachain-0.6.7}/tests/__init__.py +0 -0
  166. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/__init__.py +0 -0
  167. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/conftest.py +0 -0
  168. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
  169. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/datasets/.dvc/config +0 -0
  170. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/datasets/.gitignore +0 -0
  171. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
  172. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/test_datachain.py +0 -0
  173. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/test_ls.py +0 -0
  174. {datachain-0.6.6 → datachain-0.6.7}/tests/benchmarks/test_version.py +0 -0
  175. {datachain-0.6.6 → datachain-0.6.7}/tests/conftest.py +0 -0
  176. {datachain-0.6.6 → datachain-0.6.7}/tests/data.py +0 -0
  177. {datachain-0.6.6 → datachain-0.6.7}/tests/examples/__init__.py +0 -0
  178. {datachain-0.6.6 → datachain-0.6.7}/tests/examples/test_examples.py +0 -0
  179. {datachain-0.6.6 → datachain-0.6.7}/tests/examples/test_wds_e2e.py +0 -0
  180. {datachain-0.6.6 → datachain-0.6.7}/tests/examples/wds_data.py +0 -0
  181. {datachain-0.6.6 → datachain-0.6.7}/tests/func/__init__.py +0 -0
  182. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_catalog.py +0 -0
  183. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_client.py +0 -0
  184. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_datachain.py +0 -0
  185. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_dataset_query.py +0 -0
  186. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_feature_pickling.py +0 -0
  187. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_listing.py +0 -0
  188. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_ls.py +0 -0
  189. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_meta_formats.py +0 -0
  190. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_metrics.py +0 -0
  191. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_pytorch.py +0 -0
  192. {datachain-0.6.6 → datachain-0.6.7}/tests/func/test_query.py +0 -0
  193. {datachain-0.6.6 → datachain-0.6.7}/tests/scripts/feature_class.py +0 -0
  194. {datachain-0.6.6 → datachain-0.6.7}/tests/scripts/feature_class_exception.py +0 -0
  195. {datachain-0.6.6 → datachain-0.6.7}/tests/scripts/feature_class_parallel.py +0 -0
  196. {datachain-0.6.6 → datachain-0.6.7}/tests/scripts/feature_class_parallel_data_model.py +0 -0
  197. {datachain-0.6.6 → datachain-0.6.7}/tests/scripts/name_len_slow.py +0 -0
  198. {datachain-0.6.6 → datachain-0.6.7}/tests/test_atomicity.py +0 -0
  199. {datachain-0.6.6 → datachain-0.6.7}/tests/test_cli_e2e.py +0 -0
  200. {datachain-0.6.6 → datachain-0.6.7}/tests/test_cli_studio.py +0 -0
  201. {datachain-0.6.6 → datachain-0.6.7}/tests/test_query_e2e.py +0 -0
  202. {datachain-0.6.6 → datachain-0.6.7}/tests/test_telemetry.py +0 -0
  203. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/__init__.py +0 -0
  204. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/__init__.py +0 -0
  205. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/conftest.py +0 -0
  206. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_arrow.py +0 -0
  207. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_clip.py +0 -0
  208. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_datachain.py +0 -0
  209. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
  210. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_datachain_merge.py +0 -0
  211. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_feature.py +0 -0
  212. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_feature_utils.py +0 -0
  213. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_file.py +0 -0
  214. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_hf.py +0 -0
  215. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_image.py +0 -0
  216. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_listing_info.py +0 -0
  217. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_schema.py +0 -0
  218. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_signal_schema.py +0 -0
  219. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_sql_to_python.py +0 -0
  220. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_text.py +0 -0
  221. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_udf_signature.py +0 -0
  222. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_utils.py +0 -0
  223. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/lib/test_webdataset.py +0 -0
  224. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/__init__.py +0 -0
  225. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/sqlite/__init__.py +0 -0
  226. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/sqlite/test_utils.py +0 -0
  227. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_array.py +0 -0
  228. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_conditional.py +0 -0
  229. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_path.py +0 -0
  230. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_random.py +0 -0
  231. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_selectable.py +0 -0
  232. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/sql/test_string.py +0 -0
  233. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_asyn.py +0 -0
  234. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_cache.py +0 -0
  235. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_catalog.py +0 -0
  236. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_catalog_loader.py +0 -0
  237. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_cli_parsing.py +0 -0
  238. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_client.py +0 -0
  239. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_client_s3.py +0 -0
  240. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_config.py +0 -0
  241. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_data_storage.py +0 -0
  242. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_database_engine.py +0 -0
  243. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_dataset.py +0 -0
  244. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_dispatch.py +0 -0
  245. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_fileslice.py +0 -0
  246. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_id_generator.py +0 -0
  247. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_listing.py +0 -0
  248. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_metastore.py +0 -0
  249. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_module_exports.py +0 -0
  250. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_query.py +0 -0
  251. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_query_metrics.py +0 -0
  252. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_query_params.py +0 -0
  253. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_serializer.py +0 -0
  254. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_session.py +0 -0
  255. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_utils.py +0 -0
  256. {datachain-0.6.6 → datachain-0.6.7}/tests/unit/test_warehouse.py +0 -0
  257. {datachain-0.6.6 → datachain-0.6.7}/tests/utils.py +0 -0
@@ -52,14 +52,11 @@ jobs:
52
52
  STUDIO_READ_ACCESS_TOKEN: ${{ secrets.ITERATIVE_STUDIO_READ_ACCESS_TOKEN }}
53
53
  run: |
54
54
  echo "DataChain branch: $BRANCH"
55
- if [[ "$BRANCH" == "main" ]]
56
- then
57
- STUDIO_BRANCH=develop
58
- elif git ls-remote --heads https://"$STUDIO_READ_ACCESS_TOKEN"@github.com/iterative/studio.git "$BRANCH" | grep -F "$BRANCH" 2>&1>/dev/null
55
+ if git ls-remote --heads https://"$STUDIO_READ_ACCESS_TOKEN"@github.com/iterative/studio.git "$BRANCH" | grep -F "$BRANCH" 2>&1>/dev/null
59
56
  then
60
57
  STUDIO_BRANCH="$BRANCH"
61
58
  else
62
- STUDIO_BRANCH=develop
59
+ STUDIO_BRANCH=main
63
60
  fi
64
61
  echo "STUDIO_BRANCH=$STUDIO_BRANCH" >> $GITHUB_ENV
65
62
  echo "Studio branch: $STUDIO_BRANCH"
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: datachain
3
- Version: 0.6.6
3
+ Version: 0.6.7
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License: Apache-2.0
@@ -58,7 +58,7 @@ from datachain.listing import Listing
58
58
  from datachain.node import DirType, Node, NodeWithPath
59
59
  from datachain.nodes_thread_pool import NodesThreadPool
60
60
  from datachain.remote.studio import StudioClient
61
- from datachain.sql.types import DateTime, SQLType, String
61
+ from datachain.sql.types import DateTime, SQLType
62
62
  from datachain.utils import (
63
63
  DataChainDir,
64
64
  batched,
@@ -196,11 +196,6 @@ class DatasetRowsFetcher(NodesThreadPool):
196
196
  for c in [c for c, t in self.schema.items() if t == DateTime]:
197
197
  df[c] = pd.to_datetime(df[c], unit="s")
198
198
 
199
- # strings are represented as binaries in parquet export so need to
200
- # decode it back to strings
201
- for c in [c for c, t in self.schema.items() if t == String]:
202
- df[c] = df[c].str.decode("utf-8")
203
-
204
199
  def do_task(self, urls):
205
200
  import lz4.frame
206
201
  import pandas as pd
@@ -1403,6 +1398,7 @@ class Catalog:
1403
1398
  query_script=remote_dataset_version.query_script,
1404
1399
  create_rows=True,
1405
1400
  columns=columns,
1401
+ feature_schema=remote_dataset_version.feature_schema,
1406
1402
  validate_version=False,
1407
1403
  )
1408
1404
 
@@ -145,6 +145,8 @@ class DirExpansion:
145
145
 
146
146
 
147
147
  class DataTable:
148
+ MAX_RANDOM = 2**63 - 1
149
+
148
150
  def __init__(
149
151
  self,
150
152
  name: str,
@@ -269,8 +271,8 @@ class DataTable:
269
271
  def delete(self):
270
272
  return self.apply_conditions(self.table.delete())
271
273
 
272
- @staticmethod
273
- def sys_columns():
274
+ @classmethod
275
+ def sys_columns(cls):
274
276
  return [
275
277
  sa.Column("sys__id", Int, primary_key=True),
276
278
  sa.Column(
@@ -440,6 +440,8 @@ class TypeReadConverter:
440
440
 
441
441
  def json(self, value):
442
442
  if isinstance(value, str):
443
+ if value == "":
444
+ return {}
443
445
  return orjson.loads(value)
444
446
  return value
445
447
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: datachain
3
- Version: 0.6.6
3
+ Version: 0.6.7
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License: Apache-2.0
@@ -5,7 +5,7 @@ from unittest.mock import ANY
5
5
  import pytest
6
6
  import sqlalchemy as sa
7
7
 
8
- from datachain.data_storage.sqlite import SQLiteWarehouse
8
+ from datachain.data_storage.schema import DataTable
9
9
  from datachain.dataset import DatasetDependencyType, DatasetStatus
10
10
  from datachain.error import (
11
11
  DatasetInvalidVersionError,
@@ -827,10 +827,7 @@ def test_row_random(cloud_test_catalog):
827
827
  # Random values are unique
828
828
  assert len(set(random_values)) == len(random_values)
829
829
 
830
- if isinstance(catalog.warehouse, SQLiteWarehouse):
831
- RAND_MAX = 2**63 # noqa: N806
832
- else:
833
- RAND_MAX = 2**64 # noqa: N806
830
+ RAND_MAX = DataTable.MAX_RANDOM # noqa: N806
834
831
 
835
832
  # Values are drawn uniformly from range(2**63)
836
833
  assert 0 <= min(random_values) < 0.4 * RAND_MAX
@@ -49,19 +49,17 @@ def dog_entries_parquet_lz4(dog_entries) -> bytes:
49
49
  """
50
50
  adapted = {}
51
51
  for k, v in row.items():
52
- if isinstance(v, str):
53
- adapted[k] = v.encode("utf-8")
54
- elif isinstance(v, datetime):
52
+ if isinstance(v, datetime):
55
53
  adapted[k] = v.timestamp()
56
54
  elif v is None:
57
- adapted[k] = b""
55
+ adapted[k] = ""
58
56
  else:
59
57
  adapted[k] = v
60
58
 
61
59
  adapted["sys__id"] = 1
62
60
  adapted["sys__rand"] = 1
63
- adapted["file__location"] = b""
64
- adapted["file__source"] = b"s3://dogs"
61
+ adapted["file__location"] = ""
62
+ adapted["file__source"] = "s3://dogs"
65
63
  return adapted
66
64
 
67
65
  dog_entries = [_adapt_row(e) for e in dog_entries]
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes