datachain 0.19.1__tar.gz → 0.20.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of datachain might be problematic. Click here for more details.

Files changed (397)
  1. {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/tests-studio.yml +1 -0
  2. {datachain-0.19.1 → datachain-0.20.0}/PKG-INFO +2 -2
  3. datachain-0.20.0/docs/commands/auth/team.md +42 -0
  4. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/index.md +2 -0
  5. datachain-0.20.0/docs/commands/job/clusters.md +39 -0
  6. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/run.md +10 -0
  7. datachain-0.20.0/docs/guide/env.md +18 -0
  8. {datachain-0.19.1 → datachain-0.20.0}/docs/guide/index.md +1 -0
  9. {datachain-0.19.1 → datachain-0.20.0}/mkdocs.yml +2 -0
  10. {datachain-0.19.1 → datachain-0.20.0}/pyproject.toml +1 -1
  11. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/__init__.py +3 -0
  12. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/catalog.py +180 -65
  13. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/__init__.py +0 -7
  14. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/datasets.py +43 -28
  15. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/__init__.py +1 -35
  16. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/job.py +25 -0
  17. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/studio.py +11 -4
  18. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/metastore.py +390 -37
  19. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/schema.py +23 -1
  20. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/sqlite.py +139 -7
  21. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/warehouse.py +26 -7
  22. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/dataset.py +125 -12
  23. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/delta.py +9 -5
  24. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/error.py +36 -0
  25. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dataset_info.py +4 -0
  26. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/datachain.py +86 -7
  27. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/datasets.py +62 -12
  28. datachain-0.20.0/src/datachain/lib/dc/listings.py +154 -0
  29. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/records.py +1 -0
  30. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/storage.py +14 -2
  31. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/listing.py +3 -1
  32. datachain-0.20.0/src/datachain/lib/namespaces.py +73 -0
  33. datachain-0.20.0/src/datachain/lib/projects.py +86 -0
  34. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/settings.py +10 -0
  35. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/listing.py +3 -1
  36. datachain-0.20.0/src/datachain/namespace.py +65 -0
  37. datachain-0.20.0/src/datachain/project.py +78 -0
  38. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/dataset.py +71 -46
  39. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/session.py +1 -1
  40. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/remote/studio.py +67 -26
  41. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/studio.py +68 -8
  42. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/PKG-INFO +2 -2
  43. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/SOURCES.txt +8 -0
  44. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/requires.txt +1 -1
  45. {datachain-0.19.1 → datachain-0.20.0}/tests/conftest.py +81 -4
  46. {datachain-0.19.1 → datachain-0.20.0}/tests/examples/test_examples.py +2 -0
  47. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_batching.py +5 -5
  48. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_dataset_query.py +20 -2
  49. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datasets.py +113 -81
  50. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_metastore.py +30 -10
  51. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_pull.py +69 -18
  52. {datachain-0.19.1 → datachain-0.20.0}/tests/test_atomicity.py +4 -0
  53. {datachain-0.19.1 → datachain-0.20.0}/tests/test_cli_e2e.py +43 -10
  54. {datachain-0.19.1 → datachain-0.20.0}/tests/test_cli_studio.py +46 -32
  55. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain.py +107 -4
  56. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_listing_info.py +9 -2
  57. datachain-0.20.0/tests/unit/lib/test_namespace.py +87 -0
  58. datachain-0.20.0/tests/unit/lib/test_project.py +184 -0
  59. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_dataset.py +25 -1
  60. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_listing.py +20 -4
  61. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_metastore.py +35 -3
  62. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_session.py +32 -9
  63. {datachain-0.19.1 → datachain-0.20.0}/tests/utils.py +1 -1
  64. datachain-0.19.1/docs/commands/auth/team.md +0 -36
  65. datachain-0.19.1/src/datachain/lib/dc/listings.py +0 -43
  66. {datachain-0.19.1 → datachain-0.20.0}/.cruft.json +0 -0
  67. {datachain-0.19.1 → datachain-0.20.0}/.gitattributes +0 -0
  68. {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
  69. {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
  70. {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
  71. {datachain-0.19.1 → datachain-0.20.0}/.github/codecov.yaml +0 -0
  72. {datachain-0.19.1 → datachain-0.20.0}/.github/dependabot.yml +0 -0
  73. {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/benchmarks.yml +0 -0
  74. {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/release.yml +0 -0
  75. {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/tests.yml +0 -0
  76. {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/update-template.yaml +0 -0
  77. {datachain-0.19.1 → datachain-0.20.0}/.gitignore +0 -0
  78. {datachain-0.19.1 → datachain-0.20.0}/.pre-commit-config.yaml +0 -0
  79. {datachain-0.19.1 → datachain-0.20.0}/CODE_OF_CONDUCT.rst +0 -0
  80. {datachain-0.19.1 → datachain-0.20.0}/LICENSE +0 -0
  81. {datachain-0.19.1 → datachain-0.20.0}/README.rst +0 -0
  82. {datachain-0.19.1 → datachain-0.20.0}/docs/assets/captioned_cartoons.png +0 -0
  83. {datachain-0.19.1 → datachain-0.20.0}/docs/assets/datachain-white.svg +0 -0
  84. {datachain-0.19.1 → datachain-0.20.0}/docs/assets/datachain.svg +0 -0
  85. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/login.md +0 -0
  86. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/logout.md +0 -0
  87. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/token.md +0 -0
  88. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/cancel.md +0 -0
  89. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/logs.md +0 -0
  90. {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/ls.md +0 -0
  91. {datachain-0.19.1 → datachain-0.20.0}/docs/contributing.md +0 -0
  92. {datachain-0.19.1 → datachain-0.20.0}/docs/css/github-permalink-style.css +0 -0
  93. {datachain-0.19.1 → datachain-0.20.0}/docs/examples.md +0 -0
  94. {datachain-0.19.1 → datachain-0.20.0}/docs/guide/delta.md +0 -0
  95. {datachain-0.19.1 → datachain-0.20.0}/docs/guide/processing.md +0 -0
  96. {datachain-0.19.1 → datachain-0.20.0}/docs/guide/remotes.md +0 -0
  97. {datachain-0.19.1 → datachain-0.20.0}/docs/guide/retry.md +0 -0
  98. {datachain-0.19.1 → datachain-0.20.0}/docs/index.md +0 -0
  99. {datachain-0.19.1 → datachain-0.20.0}/docs/overrides/main.html +0 -0
  100. {datachain-0.19.1 → datachain-0.20.0}/docs/quick-start.md +0 -0
  101. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/arrowrow.md +0 -0
  102. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/bbox.md +0 -0
  103. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/file.md +0 -0
  104. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/imagefile.md +0 -0
  105. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/index.md +0 -0
  106. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/pose.md +0 -0
  107. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/segment.md +0 -0
  108. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/tarvfile.md +0 -0
  109. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/textfile.md +0 -0
  110. {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/videofile.md +0 -0
  111. {datachain-0.19.1 → datachain-0.20.0}/docs/references/datachain.md +0 -0
  112. {datachain-0.19.1 → datachain-0.20.0}/docs/references/func.md +0 -0
  113. {datachain-0.19.1 → datachain-0.20.0}/docs/references/index.md +0 -0
  114. {datachain-0.19.1 → datachain-0.20.0}/docs/references/toolkit.md +0 -0
  115. {datachain-0.19.1 → datachain-0.20.0}/docs/references/torch.md +0 -0
  116. {datachain-0.19.1 → datachain-0.20.0}/docs/references/udf.md +0 -0
  117. {datachain-0.19.1 → datachain-0.20.0}/docs/tutorials.md +0 -0
  118. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
  119. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
  120. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/openimage-detect.py +0 -0
  121. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-bbox.py +0 -0
  122. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-pose.py +0 -0
  123. {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-segment.py +0 -0
  124. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/common_sql_functions.py +0 -0
  125. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/json-csv-reader.py +0 -0
  126. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/torch-loader.py +0 -0
  127. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/parallel.py +0 -0
  128. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/simple.py +0 -0
  129. {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/stateful.py +0 -0
  130. {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/delta.py +0 -0
  131. {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/retry.py +0 -0
  132. {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/utils.py +0 -0
  133. {datachain-0.19.1 → datachain-0.20.0}/examples/llm_and_nlp/claude-query.py +0 -0
  134. {datachain-0.19.1 → datachain-0.20.0}/examples/llm_and_nlp/hf-dataset-llm-eval.py +0 -0
  135. {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/clip_inference.py +0 -0
  136. {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/hf_pipeline.py +0 -0
  137. {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/openai_image_desc_lib.py +0 -0
  138. {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/wds.py +0 -0
  139. {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/wds_filtered.py +0 -0
  140. {datachain-0.19.1 → datachain-0.20.0}/noxfile.py +0 -0
  141. {datachain-0.19.1 → datachain-0.20.0}/setup.cfg +0 -0
  142. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/__main__.py +0 -0
  143. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/asyn.py +0 -0
  144. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cache.py +0 -0
  145. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/__init__.py +0 -0
  146. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/datasource.py +0 -0
  147. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/loader.py +0 -0
  148. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/__init__.py +0 -0
  149. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/du.py +0 -0
  150. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/index.py +0 -0
  151. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/ls.py +0 -0
  152. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/misc.py +0 -0
  153. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/query.py +0 -0
  154. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/show.py +0 -0
  155. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/utils.py +0 -0
  156. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/utils.py +0 -0
  157. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/__init__.py +0 -0
  158. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/azure.py +0 -0
  159. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/fileslice.py +0 -0
  160. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/fsspec.py +0 -0
  161. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/gcs.py +0 -0
  162. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/hf.py +0 -0
  163. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/local.py +0 -0
  164. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/s3.py +0 -0
  165. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/config.py +0 -0
  166. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/__init__.py +0 -0
  167. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/db_engine.py +0 -0
  168. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/job.py +0 -0
  169. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/serializer.py +0 -0
  170. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/diff/__init__.py +0 -0
  171. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/__init__.py +0 -0
  172. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/reference.py +0 -0
  173. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/utils.py +0 -0
  174. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/__init__.py +0 -0
  175. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/aggregate.py +0 -0
  176. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/array.py +0 -0
  177. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/base.py +0 -0
  178. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/conditional.py +0 -0
  179. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/func.py +0 -0
  180. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/numeric.py +0 -0
  181. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/path.py +0 -0
  182. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/random.py +0 -0
  183. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/string.py +0 -0
  184. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/window.py +0 -0
  185. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/job.py +0 -0
  186. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/__init__.py +0 -0
  187. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/arrow.py +0 -0
  188. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/clip.py +0 -0
  189. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/__init__.py +0 -0
  190. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/flatten.py +0 -0
  191. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/python_to_sql.py +0 -0
  192. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/sql_to_python.py +0 -0
  193. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/unflatten.py +0 -0
  194. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/values_to_tuples.py +0 -0
  195. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/data_model.py +0 -0
  196. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/__init__.py +0 -0
  197. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/csv.py +0 -0
  198. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/database.py +0 -0
  199. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/hf.py +0 -0
  200. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/json.py +0 -0
  201. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/pandas.py +0 -0
  202. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/parquet.py +0 -0
  203. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/utils.py +0 -0
  204. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/values.py +0 -0
  205. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/file.py +0 -0
  206. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/hf.py +0 -0
  207. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/image.py +0 -0
  208. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/listing_info.py +0 -0
  209. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/meta_formats.py +0 -0
  210. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/model_store.py +0 -0
  211. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/pytorch.py +0 -0
  212. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/signal_schema.py +0 -0
  213. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/tar.py +0 -0
  214. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/text.py +0 -0
  215. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/udf.py +0 -0
  216. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/udf_signature.py +0 -0
  217. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/utils.py +0 -0
  218. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/video.py +0 -0
  219. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/webdataset.py +0 -0
  220. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/webdataset_laion.py +0 -0
  221. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/__init__.py +0 -0
  222. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/bbox.py +0 -0
  223. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/pose.py +0 -0
  224. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/segment.py +0 -0
  225. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/__init__.py +0 -0
  226. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/bbox.py +0 -0
  227. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/pose.py +0 -0
  228. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/segment.py +0 -0
  229. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/utils.py +0 -0
  230. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/node.py +0 -0
  231. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/nodes_fetcher.py +0 -0
  232. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/nodes_thread_pool.py +0 -0
  233. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/progress.py +0 -0
  234. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/py.typed +0 -0
  235. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/__init__.py +0 -0
  236. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/batch.py +0 -0
  237. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/dispatch.py +0 -0
  238. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/metrics.py +0 -0
  239. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/params.py +0 -0
  240. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/queue.py +0 -0
  241. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/schema.py +0 -0
  242. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/udf.py +0 -0
  243. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/utils.py +0 -0
  244. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/remote/__init__.py +0 -0
  245. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/script_meta.py +0 -0
  246. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/semver.py +0 -0
  247. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/__init__.py +0 -0
  248. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/default/__init__.py +0 -0
  249. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/default/base.py +0 -0
  250. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/__init__.py +0 -0
  251. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/aggregate.py +0 -0
  252. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/array.py +0 -0
  253. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/conditional.py +0 -0
  254. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/numeric.py +0 -0
  255. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/path.py +0 -0
  256. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/random.py +0 -0
  257. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/string.py +0 -0
  258. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/selectable.py +0 -0
  259. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/__init__.py +0 -0
  260. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/base.py +0 -0
  261. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/types.py +0 -0
  262. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/vector.py +0 -0
  263. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/types.py +0 -0
  264. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/utils.py +0 -0
  265. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/telemetry.py +0 -0
  266. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/toolkit/__init__.py +0 -0
  267. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/toolkit/split.py +0 -0
  268. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/torch/__init__.py +0 -0
  269. {datachain-0.19.1 → datachain-0.20.0}/src/datachain/utils.py +0 -0
  270. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/dependency_links.txt +0 -0
  271. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/entry_points.txt +0 -0
  272. {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/top_level.txt +0 -0
  273. {datachain-0.19.1 → datachain-0.20.0}/tests/__init__.py +0 -0
  274. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/__init__.py +0 -0
  275. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/conftest.py +0 -0
  276. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
  277. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.dvc/config +0 -0
  278. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.gitignore +0 -0
  279. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
  280. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_datachain.py +0 -0
  281. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_ls.py +0 -0
  282. {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_version.py +0 -0
  283. {datachain-0.19.1 → datachain-0.20.0}/tests/data.py +0 -0
  284. {datachain-0.19.1 → datachain-0.20.0}/tests/examples/__init__.py +0 -0
  285. {datachain-0.19.1 → datachain-0.20.0}/tests/examples/test_wds_e2e.py +0 -0
  286. {datachain-0.19.1 → datachain-0.20.0}/tests/examples/wds_data.py +0 -0
  287. {datachain-0.19.1 → datachain-0.20.0}/tests/func/__init__.py +0 -0
  288. {datachain-0.19.1 → datachain-0.20.0}/tests/func/data/Big_Buck_Bunny_360_10s_1MB.mp4 +0 -0
  289. {datachain-0.19.1 → datachain-0.20.0}/tests/func/data/lena.jpg +0 -0
  290. {datachain-0.19.1 → datachain-0.20.0}/tests/func/fake-service-account-credentials.json +0 -0
  291. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/__init__.py +0 -0
  292. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_aggregate.py +0 -0
  293. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_array.py +0 -0
  294. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_conditional.py +0 -0
  295. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_numeric.py +0 -0
  296. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_path.py +0 -0
  297. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_random.py +0 -0
  298. {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_string.py +0 -0
  299. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/__init__.py +0 -0
  300. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running-mask0.png +0 -0
  301. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running-mask1.png +0 -0
  302. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running.jpg +0 -0
  303. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/ships.jpg +0 -0
  304. {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/test_yolo.py +0 -0
  305. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_catalog.py +0 -0
  306. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_client.py +0 -0
  307. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_cloud_transfer.py +0 -0
  308. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_data_storage.py +0 -0
  309. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datachain.py +0 -0
  310. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datachain_merge.py +0 -0
  311. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_delta.py +0 -0
  312. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_feature_pickling.py +0 -0
  313. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_file.py +0 -0
  314. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_hf.py +0 -0
  315. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_hidden_field.py +0 -0
  316. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_image.py +0 -0
  317. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_listing.py +0 -0
  318. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_ls.py +0 -0
  319. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_meta_formats.py +0 -0
  320. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_metrics.py +0 -0
  321. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_pytorch.py +0 -0
  322. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_query.py +0 -0
  323. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_read_database.py +0 -0
  324. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_retry.py +0 -0
  325. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_session.py +0 -0
  326. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_toolkit.py +0 -0
  327. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_video.py +0 -0
  328. {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_warehouse.py +0 -0
  329. {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class.py +0 -0
  330. {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_exception.py +0 -0
  331. {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_parallel.py +0 -0
  332. {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_parallel_data_model.py +0 -0
  333. {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/name_len_slow.py +0 -0
  334. {datachain-0.19.1 → datachain-0.20.0}/tests/test_import_time.py +0 -0
  335. {datachain-0.19.1 → datachain-0.20.0}/tests/test_query_e2e.py +0 -0
  336. {datachain-0.19.1 → datachain-0.20.0}/tests/test_telemetry.py +0 -0
  337. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/__init__.py +0 -0
  338. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/__init__.py +0 -0
  339. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/conftest.py +0 -0
  340. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_arrow.py +0 -0
  341. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_clip.py +0 -0
  342. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
  343. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain_merge.py +0 -0
  344. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_diff.py +0 -0
  345. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_feature.py +0 -0
  346. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_feature_utils.py +0 -0
  347. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_file.py +0 -0
  348. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_hf.py +0 -0
  349. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_image.py +0 -0
  350. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_python_to_sql.py +0 -0
  351. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_schema.py +0 -0
  352. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_signal_schema.py +0 -0
  353. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_sql_to_python.py +0 -0
  354. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_text.py +0 -0
  355. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_udf.py +0 -0
  356. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_udf_signature.py +0 -0
  357. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_utils.py +0 -0
  358. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_webdataset.py +0 -0
  359. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/__init__.py +0 -0
  360. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_bbox.py +0 -0
  361. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_pose.py +0 -0
  362. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_segment.py +0 -0
  363. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_utils.py +0 -0
  364. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/__init__.py +0 -0
  365. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/__init__.py +0 -0
  366. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/test_types.py +0 -0
  367. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/test_utils.py +0 -0
  368. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_array.py +0 -0
  369. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_conditional.py +0 -0
  370. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_path.py +0 -0
  371. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_random.py +0 -0
  372. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_selectable.py +0 -0
  373. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_string.py +0 -0
  374. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_asyn.py +0 -0
  375. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_cache.py +0 -0
  376. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_catalog.py +0 -0
  377. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_catalog_loader.py +0 -0
  378. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_cli_parsing.py +0 -0
  379. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client.py +0 -0
  380. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client_gcs.py +0 -0
  381. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client_s3.py +0 -0
  382. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_config.py +0 -0
  383. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_data_storage.py +0 -0
  384. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_database_engine.py +0 -0
  385. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_dispatch.py +0 -0
  386. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_fileslice.py +0 -0
  387. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_func.py +0 -0
  388. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_module_exports.py +0 -0
  389. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_pytorch.py +0 -0
  390. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query.py +0 -0
  391. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query_metrics.py +0 -0
  392. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query_params.py +0 -0
  393. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_script_meta.py +0 -0
  394. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_semver.py +0 -0
  395. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_serializer.py +0 -0
  396. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_utils.py +0 -0
  397. {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_warehouse.py +0 -0
@@ -98,6 +98,7 @@ jobs:
98
98
  - name: Run tests
99
99
  # Generate `.test_durations` file with `pytest --store-durations --durations-path ../.github/.test_durations ...`
100
100
  run: >
101
+ DATACHAIN_METASTORE_ARG_PROJECT=john
101
102
  PYTHONPATH="$(pwd)/..:${PYTHONPATH}"
102
103
  pytest
103
104
  --config-file=pyproject.toml -rs
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: datachain
3
- Version: 0.19.1
3
+ Version: 0.20.0
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License-Expression: Apache-2.0
@@ -94,7 +94,7 @@ Requires-Dist: scipy; extra == "tests"
94
94
  Requires-Dist: ultralytics; extra == "tests"
95
95
  Provides-Extra: dev
96
96
  Requires-Dist: datachain[docs,tests]; extra == "dev"
97
- Requires-Dist: mypy==1.16.0; extra == "dev"
97
+ Requires-Dist: mypy==1.16.1; extra == "dev"
98
98
  Requires-Dist: types-python-dateutil; extra == "dev"
99
99
  Requires-Dist: types-pytz; extra == "dev"
100
100
  Requires-Dist: types-PyYAML; extra == "dev"
@@ -0,0 +1,42 @@
1
+ # auth team
2
+
3
+ Set the default team for Studio operations.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain auth team [-h] [-v] [-q] [--local] [team_name]
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command sets or shows the default team for Studio operations. By default, the team setting is saved globally, but you can use the `--local` option to set it for the current project.
14
+ If `team_name` is not passed, the team currently in use is shown to the user.
15
+
16
+ ## Arguments
17
+
18
+ * `team_name` - Optional. Name of the team to set as default
19
+
20
+ ## Options
21
+
22
+ * `--local` - Set team locally for the current project
23
+ * `-h`, `--help` - Show the help message and exit.
24
+ * `-v`, `--verbose` - Be verbose.
25
+ * `-q`, `--quiet` - Be quiet.
26
+
27
+ ## Examples
28
+
29
+ 1. Set default team for all projects:
30
+ ```bash
31
+ datachain auth team my-team
32
+ ```
33
+
34
+ 2. Set default team locally for the current project:
35
+ ```bash
36
+ datachain auth team --local my-team
37
+ ```
38
+
39
+ 3. Print the default team currently in use:
40
+ ```bash
41
+ datachain auth team
42
+ ```
@@ -31,3 +31,5 @@ DataChain is a command-line tool for wrangling unstructured AI data at scale. Us
31
31
  - Monitor job logs with [`datachain job logs`](job/logs.md)
32
32
 
33
33
  - Cancel running jobs with [`datachain job cancel`](job/cancel.md)
34
+
35
+ - List the clusters available for jobs with [`datachain job clusters`](job/clusters.md)
@@ -0,0 +1,39 @@
1
+ # job clusters
2
+
3
+ List compute clusters in Studio.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain job clusters [-h] [-v] [-q] [--team TEAM]
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command lists compute clusters available in Studio. You can specify a team to list clusters for. The command provides information about the compute resources available for running jobs.
14
+
15
+ ## Options
16
+
17
+ * `--team TEAM` - Team to list clusters for (default: from config)
18
+ * `-h`, `--help` - Show the help message and exit
19
+ * `-v`, `--verbose` - Be verbose
20
+ * `-q`, `--quiet` - Be quiet
21
+
22
+ ## Examples
23
+
24
+ 1. List all clusters for the default team:
25
+ ```bash
26
+ datachain job clusters
27
+ ```
28
+
29
+ 2. List clusters for a specific team:
30
+ ```bash
31
+ datachain job clusters --team my-team
32
+ ```
33
+
34
+
35
+ ## Notes
36
+
37
+ * The command shows all compute clusters available to your team
38
+ * Clusters represent the compute resources where your jobs can run
39
+ * Use the `--team` option to view clusters for a different team
@@ -24,6 +24,7 @@ This command runs a job in Studio using the specified query file. You can config
24
24
  * `--team TEAM` - Team to run job for (default: from config)
25
25
  * `--env-file ENV_FILE` - File with environment variables for the job
26
26
  * `--env ENV` - Environment variables in KEY=VALUE format
27
+ * `--cluster-id CLUSTER_ID` - Compute cluster ID to run the job on
27
28
  * `--workers WORKERS` - Number of workers for the job
28
29
  * `--files FILES` - Additional files to include in the job
29
30
  * `--python-version PYTHON_VERSION` - Python version for the job (e.g., 3.9, 3.10, 3.11)
@@ -71,8 +72,17 @@ datachain job run --repository https://github.com/iterative/datachain query.py
71
72
  datachain job run --priority 2 query.py
72
73
  ```
73
74
 
75
+ 8. Run a job in a specific cluster
76
+ ```bash
77
+ # Get the cluster ID using the following command
78
+ datachain job clusters
79
+ # Use the ID of an active cluster from above
80
+ datachain job run --cluster-id 1 query.py
81
+ ```
82
+
74
83
  ## Notes
75
84
 
76
85
  * Closing the logs command (e.g., with Ctrl+C) will only stop displaying the logs but will not cancel the job execution
77
86
  * To cancel a running job, use the `datachain job cancel` command
78
87
  * The job will continue running in Studio even after you stop viewing the logs
88
+ * You can get the list of compute clusters using the `datachain job clusters` command.
@@ -0,0 +1,18 @@
1
+ # Environment Variables
2
+
3
+ List of environment variables used to configure DataChain behavior.
4
+
5
+ ### Core Configuration
6
+
7
+ - `DATACHAIN_ROOT_DIR` – Specifies the root directory where DataChain will create the `.datachain` folder to store its internal data (default: the current working directory).
8
+ - `DATACHAIN_SYSTEM_CONFIG_DIR` – Overrides the system-wide configuration directory (default depends on the platform).
9
+ - `DATACHAIN_GLOBAL_CONFIG_DIR` – Overrides the user's global configuration directory (default depends on the platform).
10
+ - `DATACHAIN_NO_ANALYTICS` – Disables telemetry.
11
+
12
+ ### Studio Integration
13
+
14
+ - `DATACHAIN_STUDIO_URL` – Custom Studio URL.
15
+ - `DATACHAIN_STUDIO_TOKEN` – Authentication token for Studio.
16
+ - `DATACHAIN_STUDIO_TEAM` – Studio team name.
17
+
18
+ Note: Some environment variables are used internally and may not be documented here. For the most up-to-date list, refer to the source code.
@@ -10,3 +10,4 @@ Welcome to the DataChain User Guide! This section provides comprehensive documen
10
10
  - [Data Processing Overview](./processing.md) - Discover DataChain's specialized data processing features.
11
11
  - [Delta Processing](./delta.md) - Incremental data processing to efficiently handle large datasets that change over time.
12
12
  - [Error Handling and Retries](./retry.md) - Learn how to handle processing errors and selectively reprocess problematic records.
13
+ - [Environment Variables](./env.md) - Configure DataChain's behavior using environment variables.
@@ -97,6 +97,7 @@ nav:
97
97
  - logs: commands/job/logs.md
98
98
  - cancel: commands/job/cancel.md
99
99
  - ls: commands/job/ls.md
100
+ - clusters: commands/job/clusters.md
100
101
  - 📚 User Guide:
101
102
  - Overview: guide/index.md
102
103
  - 📡 Interacting with remote storage: guide/remotes.md
@@ -104,6 +105,7 @@ nav:
104
105
  - Overview: guide/processing.md
105
106
  - Delta Processing: guide/delta.md
106
107
  - Errors Handling and Retries: guide/retry.md
108
+ - Environment Variables: guide/env.md
107
109
  - 🤝 Contributing: contributing.md
108
110
 
109
111
  - DataChain Website ↗: https://datachain.ai" target="_blank"
@@ -108,7 +108,7 @@ tests = [
108
108
  ]
109
109
  dev = [
110
110
  "datachain[docs,tests]",
111
- "mypy==1.16.0",
111
+ "mypy==1.16.1",
112
112
  "types-python-dateutil",
113
113
  "types-pytz",
114
114
  "types-PyYAML",
@@ -1,3 +1,4 @@
1
+ from datachain.lib import namespaces, projects
1
2
  from datachain.lib.data_model import DataModel, DataType, is_chain_type
2
3
  from datachain.lib.dc import (
3
4
  C,
@@ -67,7 +68,9 @@ __all__ = [
67
68
  "is_chain_type",
68
69
  "listings",
69
70
  "metrics",
71
+ "namespaces",
70
72
  "param",
73
+ "projects",
71
74
  "read_csv",
72
75
  "read_database",
73
76
  "read_dataset",