datachain 0.2.18__tar.gz → 0.3.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of datachain might be problematic. Click here for more details.

Files changed (262)
  1. {datachain-0.2.18 → datachain-0.3.1}/.github/workflows/tests.yml +20 -1
  2. {datachain-0.2.18/src/datachain.egg-info → datachain-0.3.1}/PKG-INFO +1 -1
  3. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/blip2_image_desc_lib.py +2 -4
  4. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/1-quick-start.ipynb +283 -281
  5. datachain-0.3.1/examples/computer_vision/fashion_product_images/2-working-with-image-datachains.ipynb +4103 -0
  6. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/3-train-model.ipynb +46 -45
  7. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/4-inference.ipynb +5 -5
  8. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/scripts/1-quick-start.py +5 -2
  9. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/scripts/2-basic-operations.py +3 -5
  10. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/scripts/3-split-train-test.py +2 -2
  11. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/scripts/3-train-model.py +1 -1
  12. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/iptc_exif_xmp_lib.py +2 -2
  13. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/llava2_image_desc_lib.py +2 -4
  14. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/openimage-detect.py +3 -4
  15. datachain-0.3.1/examples/get_started/common_sql_functions.py +97 -0
  16. {datachain-0.2.18 → datachain-0.3.1}/examples/get_started/json-csv-reader.py +1 -1
  17. datachain-0.3.1/examples/get_started/json-metadata-tutorial.ipynb +2020 -0
  18. {datachain-0.2.18 → datachain-0.3.1}/examples/get_started/torch-loader.py +5 -3
  19. {datachain-0.2.18 → datachain-0.3.1}/examples/get_started/udfs/parallel.py +5 -5
  20. {datachain-0.2.18 → datachain-0.3.1}/examples/get_started/udfs/simple.py +6 -6
  21. {datachain-0.2.18 → datachain-0.3.1}/examples/get_started/udfs/stateful.py +1 -1
  22. {datachain-0.2.18 → datachain-0.3.1}/examples/llm_and_nlp/llm-claude-aggregate-query.py +2 -2
  23. {datachain-0.2.18 → datachain-0.3.1}/examples/llm_and_nlp/llm-claude-simple-query.py +2 -2
  24. {datachain-0.2.18 → datachain-0.3.1}/examples/llm_and_nlp/llm-claude.py +1 -1
  25. {datachain-0.2.18 → datachain-0.3.1}/examples/llm_and_nlp/unstructured-text.py +1 -1
  26. {datachain-0.2.18 → datachain-0.3.1}/examples/multimodal/clip_fine_tuning.ipynb +276 -286
  27. {datachain-0.2.18 → datachain-0.3.1}/examples/multimodal/clip_inference.py +4 -4
  28. {datachain-0.2.18 → datachain-0.3.1}/examples/multimodal/hf_pipeline.py +8 -8
  29. {datachain-0.2.18 → datachain-0.3.1}/examples/multimodal/openai_image_desc_lib.py +2 -2
  30. datachain-0.3.1/examples/multimodal/wds.py +34 -0
  31. {datachain-0.2.18 → datachain-0.3.1}/examples/multimodal/wds_filtered.py +1 -1
  32. {datachain-0.2.18 → datachain-0.3.1}/pyproject.toml +1 -0
  33. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/cache.py +5 -10
  34. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/catalog/catalog.py +10 -20
  35. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/azure.py +5 -12
  36. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/fsspec.py +6 -10
  37. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/gcs.py +4 -14
  38. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/local.py +4 -11
  39. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/s3.py +4 -8
  40. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/schema.py +7 -15
  41. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/warehouse.py +34 -45
  42. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/dc.py +8 -6
  43. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/file.py +19 -18
  44. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/udf.py +21 -14
  45. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/webdataset.py +2 -3
  46. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/listing.py +14 -20
  47. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/node.py +32 -21
  48. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/batch.py +45 -41
  49. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/builtins.py +5 -12
  50. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/dataset.py +15 -8
  51. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/dispatch.py +53 -68
  52. datachain-0.3.1/src/datachain/query/queue.py +120 -0
  53. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/schema.py +3 -7
  54. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/udf.py +23 -8
  55. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/utils.py +17 -2
  56. {datachain-0.2.18 → datachain-0.3.1/src/datachain.egg-info}/PKG-INFO +1 -1
  57. {datachain-0.2.18 → datachain-0.3.1}/src/datachain.egg-info/SOURCES.txt +1 -1
  58. {datachain-0.2.18 → datachain-0.3.1}/tests/conftest.py +3 -1
  59. {datachain-0.2.18 → datachain-0.3.1}/tests/data.py +10 -20
  60. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_catalog.py +1 -1
  61. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_client.py +1 -1
  62. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_datachain.py +2 -3
  63. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_dataset_query.py +542 -601
  64. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_datasets.py +15 -5
  65. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_feature_pickling.py +5 -5
  66. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_pull.py +8 -9
  67. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_query.py +6 -4
  68. {datachain-0.2.18 → datachain-0.3.1}/tests/scripts/feature_class.py +1 -1
  69. {datachain-0.2.18 → datachain-0.3.1}/tests/scripts/feature_class_parallel.py +2 -2
  70. {datachain-0.2.18 → datachain-0.3.1}/tests/scripts/feature_class_parallel_data_model.py +2 -2
  71. {datachain-0.2.18 → datachain-0.3.1}/tests/scripts/name_len_slow.py +5 -5
  72. {datachain-0.2.18 → datachain-0.3.1}/tests/test_query_e2e.py +23 -23
  73. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_arrow.py +2 -2
  74. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_datachain.py +41 -41
  75. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_file.py +35 -41
  76. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_image.py +1 -1
  77. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_signal_schema.py +2 -2
  78. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_text.py +1 -1
  79. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_webdataset.py +7 -7
  80. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_cache.py +3 -5
  81. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_client.py +1 -1
  82. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_client_s3.py +12 -13
  83. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_data_storage.py +30 -34
  84. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_database_engine.py +2 -0
  85. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_dataset.py +2 -4
  86. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_id_generator.py +2 -0
  87. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_listing.py +5 -5
  88. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_storage.py +1 -1
  89. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_udf.py +3 -4
  90. {datachain-0.2.18 → datachain-0.3.1}/tests/utils.py +21 -28
  91. datachain-0.2.18/examples/computer_vision/fashion_product_images/2-working-with-image-datachains.ipynb +0 -4083
  92. datachain-0.2.18/examples/get_started/common_sql_functions.py +0 -93
  93. datachain-0.2.18/examples/get_started/json-metadata-tutorial.ipynb +0 -1949
  94. datachain-0.2.18/examples/multimodal/wds.py +0 -42
  95. datachain-0.2.18/tests/scripts/name_len_normal.py +0 -27
  96. {datachain-0.2.18 → datachain-0.3.1}/.cruft.json +0 -0
  97. {datachain-0.2.18 → datachain-0.3.1}/.gitattributes +0 -0
  98. {datachain-0.2.18 → datachain-0.3.1}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
  99. {datachain-0.2.18 → datachain-0.3.1}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
  100. {datachain-0.2.18 → datachain-0.3.1}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
  101. {datachain-0.2.18 → datachain-0.3.1}/.github/codecov.yaml +0 -0
  102. {datachain-0.2.18 → datachain-0.3.1}/.github/dependabot.yml +0 -0
  103. {datachain-0.2.18 → datachain-0.3.1}/.github/workflows/benchmarks.yml +0 -0
  104. {datachain-0.2.18 → datachain-0.3.1}/.github/workflows/release.yml +0 -0
  105. {datachain-0.2.18 → datachain-0.3.1}/.github/workflows/update-template.yaml +0 -0
  106. {datachain-0.2.18 → datachain-0.3.1}/.gitignore +0 -0
  107. {datachain-0.2.18 → datachain-0.3.1}/.pre-commit-config.yaml +0 -0
  108. {datachain-0.2.18 → datachain-0.3.1}/CODE_OF_CONDUCT.rst +0 -0
  109. {datachain-0.2.18 → datachain-0.3.1}/CONTRIBUTING.rst +0 -0
  110. {datachain-0.2.18 → datachain-0.3.1}/LICENSE +0 -0
  111. {datachain-0.2.18 → datachain-0.3.1}/README.rst +0 -0
  112. {datachain-0.2.18 → datachain-0.3.1}/docs/assets/captioned_cartoons.png +0 -0
  113. {datachain-0.2.18 → datachain-0.3.1}/docs/assets/datachain.png +0 -0
  114. {datachain-0.2.18 → datachain-0.3.1}/docs/assets/flowchart.png +0 -0
  115. {datachain-0.2.18 → datachain-0.3.1}/docs/index.md +0 -0
  116. {datachain-0.2.18 → datachain-0.3.1}/docs/references/datachain.md +0 -0
  117. {datachain-0.2.18 → datachain-0.3.1}/docs/references/datatype.md +0 -0
  118. {datachain-0.2.18 → datachain-0.3.1}/docs/references/file.md +0 -0
  119. {datachain-0.2.18 → datachain-0.3.1}/docs/references/index.md +0 -0
  120. {datachain-0.2.18 → datachain-0.3.1}/docs/references/sql.md +0 -0
  121. {datachain-0.2.18 → datachain-0.3.1}/docs/references/torch.md +0 -0
  122. {datachain-0.2.18 → datachain-0.3.1}/docs/references/udf.md +0 -0
  123. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/.gitignore +0 -0
  124. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/README.md +0 -0
  125. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/requirements.txt +0 -0
  126. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/scripts/2-embeddings.py +0 -0
  127. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/src/clustering.py +0 -0
  128. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/src/train.py +0 -0
  129. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/basic-operations.png +0 -0
  130. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/core-concepts.png +0 -0
  131. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/datachain-logo.png +0 -0
  132. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/datachain-overview.png +0 -0
  133. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/dataset-1.png +0 -0
  134. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/dataset-2.png +0 -0
  135. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/dataset-3.png +0 -0
  136. {datachain-0.2.18 → datachain-0.3.1}/examples/computer_vision/fashion_product_images/static/images/studio.png +0 -0
  137. {datachain-0.2.18 → datachain-0.3.1}/examples/llm/llm_chatbot_evaluation.ipynb +0 -0
  138. {datachain-0.2.18 → datachain-0.3.1}/mkdocs.yml +0 -0
  139. {datachain-0.2.18 → datachain-0.3.1}/noxfile.py +0 -0
  140. {datachain-0.2.18 → datachain-0.3.1}/setup.cfg +0 -0
  141. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/__init__.py +0 -0
  142. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/__main__.py +0 -0
  143. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/asyn.py +0 -0
  144. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/catalog/__init__.py +0 -0
  145. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/catalog/datasource.py +0 -0
  146. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/catalog/loader.py +0 -0
  147. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/catalog/subclass.py +0 -0
  148. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/cli.py +0 -0
  149. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/cli_utils.py +0 -0
  150. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/__init__.py +0 -0
  151. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/client/fileslice.py +0 -0
  152. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/config.py +0 -0
  153. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/__init__.py +0 -0
  154. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/db_engine.py +0 -0
  155. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/id_generator.py +0 -0
  156. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/job.py +0 -0
  157. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/metastore.py +0 -0
  158. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/serializer.py +0 -0
  159. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/data_storage/sqlite.py +0 -0
  160. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/dataset.py +0 -0
  161. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/error.py +0 -0
  162. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/job.py +0 -0
  163. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/__init__.py +0 -0
  164. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/arrow.py +0 -0
  165. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/clip.py +0 -0
  166. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/__init__.py +0 -0
  167. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/flatten.py +0 -0
  168. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/python_to_sql.py +0 -0
  169. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/sql_to_python.py +0 -0
  170. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/unflatten.py +0 -0
  171. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/convert/values_to_tuples.py +0 -0
  172. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/data_model.py +0 -0
  173. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/dataset_info.py +0 -0
  174. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/image.py +0 -0
  175. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/meta_formats.py +0 -0
  176. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/model_store.py +0 -0
  177. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/pytorch.py +0 -0
  178. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/settings.py +0 -0
  179. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/signal_schema.py +0 -0
  180. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/text.py +0 -0
  181. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/udf_signature.py +0 -0
  182. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/utils.py +0 -0
  183. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/vfile.py +0 -0
  184. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/lib/webdataset_laion.py +0 -0
  185. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/nodes_fetcher.py +0 -0
  186. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/nodes_thread_pool.py +0 -0
  187. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/progress.py +0 -0
  188. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/py.typed +0 -0
  189. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/__init__.py +0 -0
  190. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/metrics.py +0 -0
  191. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/params.py +0 -0
  192. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/query/session.py +0 -0
  193. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/remote/__init__.py +0 -0
  194. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/remote/studio.py +0 -0
  195. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/__init__.py +0 -0
  196. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/default/__init__.py +0 -0
  197. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/default/base.py +0 -0
  198. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/__init__.py +0 -0
  199. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/array.py +0 -0
  200. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/conditional.py +0 -0
  201. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/path.py +0 -0
  202. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/random.py +0 -0
  203. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/functions/string.py +0 -0
  204. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/selectable.py +0 -0
  205. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/sqlite/__init__.py +0 -0
  206. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/sqlite/base.py +0 -0
  207. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/sqlite/types.py +0 -0
  208. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/sqlite/vector.py +0 -0
  209. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/types.py +0 -0
  210. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/sql/utils.py +0 -0
  211. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/storage.py +0 -0
  212. {datachain-0.2.18 → datachain-0.3.1}/src/datachain/torch/__init__.py +0 -0
  213. {datachain-0.2.18 → datachain-0.3.1}/src/datachain.egg-info/dependency_links.txt +0 -0
  214. {datachain-0.2.18 → datachain-0.3.1}/src/datachain.egg-info/entry_points.txt +0 -0
  215. {datachain-0.2.18 → datachain-0.3.1}/src/datachain.egg-info/requires.txt +0 -0
  216. {datachain-0.2.18 → datachain-0.3.1}/src/datachain.egg-info/top_level.txt +0 -0
  217. {datachain-0.2.18 → datachain-0.3.1}/tests/__init__.py +0 -0
  218. {datachain-0.2.18 → datachain-0.3.1}/tests/benchmarks/__init__.py +0 -0
  219. {datachain-0.2.18 → datachain-0.3.1}/tests/benchmarks/conftest.py +0 -0
  220. {datachain-0.2.18 → datachain-0.3.1}/tests/benchmarks/test_ls.py +0 -0
  221. {datachain-0.2.18 → datachain-0.3.1}/tests/benchmarks/test_version.py +0 -0
  222. {datachain-0.2.18 → datachain-0.3.1}/tests/examples/__init__.py +0 -0
  223. {datachain-0.2.18 → datachain-0.3.1}/tests/examples/test_wds_e2e.py +0 -0
  224. {datachain-0.2.18 → datachain-0.3.1}/tests/examples/wds_data.py +0 -0
  225. {datachain-0.2.18 → datachain-0.3.1}/tests/func/__init__.py +0 -0
  226. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_ls.py +0 -0
  227. {datachain-0.2.18 → datachain-0.3.1}/tests/func/test_pytorch.py +0 -0
  228. {datachain-0.2.18 → datachain-0.3.1}/tests/test_cli_e2e.py +0 -0
  229. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/__init__.py +0 -0
  230. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/__init__.py +0 -0
  231. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/conftest.py +0 -0
  232. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_clip.py +0 -0
  233. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
  234. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_datachain_merge.py +0 -0
  235. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_feature.py +0 -0
  236. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_feature_utils.py +0 -0
  237. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_sql_to_python.py +0 -0
  238. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_udf_signature.py +0 -0
  239. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/lib/test_utils.py +0 -0
  240. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/__init__.py +0 -0
  241. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/sqlite/__init__.py +0 -0
  242. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/sqlite/test_utils.py +0 -0
  243. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_array.py +0 -0
  244. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_conditional.py +0 -0
  245. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_path.py +0 -0
  246. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_random.py +0 -0
  247. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_selectable.py +0 -0
  248. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/sql/test_string.py +0 -0
  249. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_asyn.py +0 -0
  250. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_catalog.py +0 -0
  251. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_catalog_loader.py +0 -0
  252. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_cli_parsing.py +0 -0
  253. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_dispatch.py +0 -0
  254. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_fileslice.py +0 -0
  255. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_metastore.py +0 -0
  256. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_module_exports.py +0 -0
  257. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_query_metrics.py +0 -0
  258. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_query_params.py +0 -0
  259. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_serializer.py +0 -0
  260. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_session.py +0 -0
  261. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_utils.py +0 -0
  262. {datachain-0.2.18 → datachain-0.3.1}/tests/unit/test_warehouse.py +0 -0
@@ -8,6 +8,7 @@ on:
8
8
 
9
9
  env:
10
10
  FORCE_COLOR: "1"
11
+ BRANCH: ${{ github.head_ref || github.ref_name }}
11
12
 
12
13
  concurrency:
13
14
  group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
@@ -144,12 +145,30 @@ jobs:
144
145
  - 6379:6379
145
146
  steps:
146
147
 
148
+ - name: Studio branch name
149
+ env:
150
+ BRANCH: ${{ env.BRANCH }}
151
+ STUDIO_READ_ACCESS_TOKEN: ${{ secrets.ITERATIVE_STUDIO_READ_ACCESS_TOKEN }}
152
+ run: |
153
+ echo "DataChain branch: $BRANCH"
154
+ if [[ "$BRANCH" == "main" ]]
155
+ then
156
+ STUDIO_BRANCH=develop
157
+ elif git ls-remote --heads https://"$STUDIO_READ_ACCESS_TOKEN"@github.com/iterative/studio.git "$BRANCH" | grep -F "$BRANCH" 2>&1>/dev/null
158
+ then
159
+ STUDIO_BRANCH="$BRANCH"
160
+ else
161
+ STUDIO_BRANCH=develop
162
+ fi
163
+ echo "STUDIO_BRANCH=$STUDIO_BRANCH" >> $GITHUB_ENV
164
+ echo "Studio branch: $STUDIO_BRANCH"
165
+
147
166
  - name: Check out Studio
148
167
  uses: actions/checkout@v4
149
168
  with:
150
169
  fetch-depth: 0
151
170
  repository: iterative/studio
152
- ref: develop
171
+ ref: ${{ env.STUDIO_BRANCH }}
153
172
  token: ${{ secrets.ITERATIVE_STUDIO_READ_ACCESS_TOKEN }}
154
173
 
155
174
  - name: Check out repository
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: datachain
3
- Version: 0.2.18
3
+ Version: 0.3.1
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License: Apache-2.0
@@ -86,7 +86,7 @@ class LLaVADescribe(Mapper):
86
86
  if __name__ == "__main__":
87
87
  (
88
88
  DataChain.from_storage(source, type="image")
89
- .filter(C("file.name").glob("cat*.jpg"))
89
+ .filter(C("file.path").glob("*/cat*.jpg"))
90
90
  .map(
91
91
  desc=BLIP2Describe(
92
92
  # device=device,
@@ -95,8 +95,6 @@ if __name__ == "__main__":
95
95
  params=["file"],
96
96
  output={"description": str, "error": str},
97
97
  )
98
- .select(
99
- "file.source", "file.parent", "file.name", "desc.description", "desc.error"
100
- )
98
+ .select("file.source", "file.path", "desc.description", "desc.error")
101
99
  .show(5)
102
100
  )