datachain 0.16.1__tar.gz → 0.16.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of datachain might be problematic. Click here for more details.

Files changed (363) hide show
  1. {datachain-0.16.1 → datachain-0.16.2}/.pre-commit-config.yaml +1 -1
  2. {datachain-0.16.1/src/datachain.egg-info → datachain-0.16.2}/PKG-INFO +1 -1
  3. datachain-0.16.2/docs/commands/auth/login.md +51 -0
  4. datachain-0.16.2/docs/commands/auth/logout.md +37 -0
  5. datachain-0.16.2/docs/commands/auth/team.md +36 -0
  6. datachain-0.16.2/docs/commands/auth/token.md +26 -0
  7. datachain-0.16.2/docs/commands/index.md +33 -0
  8. datachain-0.16.2/docs/commands/job/cancel.md +43 -0
  9. datachain-0.16.2/docs/commands/job/logs.md +47 -0
  10. datachain-0.16.2/docs/commands/job/run.md +67 -0
  11. {datachain-0.16.1 → datachain-0.16.2}/mkdocs.yml +12 -0
  12. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/records.py +4 -2
  13. {datachain-0.16.1 → datachain-0.16.2/src/datachain.egg-info}/PKG-INFO +1 -1
  14. {datachain-0.16.1 → datachain-0.16.2}/src/datachain.egg-info/SOURCES.txt +8 -0
  15. {datachain-0.16.1 → datachain-0.16.2}/.cruft.json +0 -0
  16. {datachain-0.16.1 → datachain-0.16.2}/.gitattributes +0 -0
  17. {datachain-0.16.1 → datachain-0.16.2}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
  18. {datachain-0.16.1 → datachain-0.16.2}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
  19. {datachain-0.16.1 → datachain-0.16.2}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
  20. {datachain-0.16.1 → datachain-0.16.2}/.github/codecov.yaml +0 -0
  21. {datachain-0.16.1 → datachain-0.16.2}/.github/dependabot.yml +0 -0
  22. {datachain-0.16.1 → datachain-0.16.2}/.github/workflows/benchmarks.yml +0 -0
  23. {datachain-0.16.1 → datachain-0.16.2}/.github/workflows/release.yml +0 -0
  24. {datachain-0.16.1 → datachain-0.16.2}/.github/workflows/tests-studio.yml +0 -0
  25. {datachain-0.16.1 → datachain-0.16.2}/.github/workflows/tests.yml +0 -0
  26. {datachain-0.16.1 → datachain-0.16.2}/.github/workflows/update-template.yaml +0 -0
  27. {datachain-0.16.1 → datachain-0.16.2}/.gitignore +0 -0
  28. {datachain-0.16.1 → datachain-0.16.2}/CODE_OF_CONDUCT.rst +0 -0
  29. {datachain-0.16.1 → datachain-0.16.2}/LICENSE +0 -0
  30. {datachain-0.16.1 → datachain-0.16.2}/README.rst +0 -0
  31. {datachain-0.16.1 → datachain-0.16.2}/docs/assets/captioned_cartoons.png +0 -0
  32. {datachain-0.16.1 → datachain-0.16.2}/docs/assets/datachain-white.svg +0 -0
  33. {datachain-0.16.1 → datachain-0.16.2}/docs/assets/datachain.svg +0 -0
  34. {datachain-0.16.1 → datachain-0.16.2}/docs/contributing.md +0 -0
  35. {datachain-0.16.1 → datachain-0.16.2}/docs/css/github-permalink-style.css +0 -0
  36. {datachain-0.16.1 → datachain-0.16.2}/docs/examples.md +0 -0
  37. {datachain-0.16.1 → datachain-0.16.2}/docs/index.md +0 -0
  38. {datachain-0.16.1 → datachain-0.16.2}/docs/overrides/main.html +0 -0
  39. {datachain-0.16.1 → datachain-0.16.2}/docs/quick-start.md +0 -0
  40. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/arrowrow.md +0 -0
  41. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/bbox.md +0 -0
  42. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/file.md +0 -0
  43. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/imagefile.md +0 -0
  44. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/index.md +0 -0
  45. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/pose.md +0 -0
  46. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/segment.md +0 -0
  47. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/tarvfile.md +0 -0
  48. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/textfile.md +0 -0
  49. {datachain-0.16.1 → datachain-0.16.2}/docs/references/data-types/videofile.md +0 -0
  50. {datachain-0.16.1 → datachain-0.16.2}/docs/references/datachain.md +0 -0
  51. {datachain-0.16.1 → datachain-0.16.2}/docs/references/func.md +0 -0
  52. {datachain-0.16.1 → datachain-0.16.2}/docs/references/index.md +0 -0
  53. {datachain-0.16.1 → datachain-0.16.2}/docs/references/remotes.md +0 -0
  54. {datachain-0.16.1 → datachain-0.16.2}/docs/references/toolkit.md +0 -0
  55. {datachain-0.16.1 → datachain-0.16.2}/docs/references/torch.md +0 -0
  56. {datachain-0.16.1 → datachain-0.16.2}/docs/references/udf.md +0 -0
  57. {datachain-0.16.1 → datachain-0.16.2}/docs/tutorials.md +0 -0
  58. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
  59. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
  60. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/openimage-detect.py +0 -0
  61. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/ultralytics-bbox.py +0 -0
  62. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/ultralytics-pose.py +0 -0
  63. {datachain-0.16.1 → datachain-0.16.2}/examples/computer_vision/ultralytics-segment.py +0 -0
  64. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/common_sql_functions.py +0 -0
  65. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/json-csv-reader.py +0 -0
  66. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/torch-loader.py +0 -0
  67. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/udfs/parallel.py +0 -0
  68. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/udfs/simple.py +0 -0
  69. {datachain-0.16.1 → datachain-0.16.2}/examples/get_started/udfs/stateful.py +0 -0
  70. {datachain-0.16.1 → datachain-0.16.2}/examples/llm_and_nlp/claude-query.py +0 -0
  71. {datachain-0.16.1 → datachain-0.16.2}/examples/llm_and_nlp/hf-dataset-llm-eval.py +0 -0
  72. {datachain-0.16.1 → datachain-0.16.2}/examples/multimodal/clip_inference.py +0 -0
  73. {datachain-0.16.1 → datachain-0.16.2}/examples/multimodal/hf_pipeline.py +0 -0
  74. {datachain-0.16.1 → datachain-0.16.2}/examples/multimodal/openai_image_desc_lib.py +0 -0
  75. {datachain-0.16.1 → datachain-0.16.2}/examples/multimodal/wds.py +0 -0
  76. {datachain-0.16.1 → datachain-0.16.2}/examples/multimodal/wds_filtered.py +0 -0
  77. {datachain-0.16.1 → datachain-0.16.2}/noxfile.py +0 -0
  78. {datachain-0.16.1 → datachain-0.16.2}/pyproject.toml +0 -0
  79. {datachain-0.16.1 → datachain-0.16.2}/setup.cfg +0 -0
  80. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/__init__.py +0 -0
  81. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/__main__.py +0 -0
  82. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/asyn.py +0 -0
  83. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cache.py +0 -0
  84. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/catalog/__init__.py +0 -0
  85. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/catalog/catalog.py +0 -0
  86. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/catalog/datasource.py +0 -0
  87. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/catalog/loader.py +0 -0
  88. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/__init__.py +0 -0
  89. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/__init__.py +0 -0
  90. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/datasets.py +0 -0
  91. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/du.py +0 -0
  92. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/index.py +0 -0
  93. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/ls.py +0 -0
  94. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/misc.py +0 -0
  95. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/query.py +0 -0
  96. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/commands/show.py +0 -0
  97. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/parser/__init__.py +0 -0
  98. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/parser/job.py +0 -0
  99. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/parser/studio.py +0 -0
  100. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/parser/utils.py +0 -0
  101. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/cli/utils.py +0 -0
  102. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/__init__.py +0 -0
  103. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/azure.py +0 -0
  104. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/fileslice.py +0 -0
  105. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/fsspec.py +0 -0
  106. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/gcs.py +0 -0
  107. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/hf.py +0 -0
  108. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/local.py +0 -0
  109. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/client/s3.py +0 -0
  110. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/config.py +0 -0
  111. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/__init__.py +0 -0
  112. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/db_engine.py +0 -0
  113. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/job.py +0 -0
  114. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/metastore.py +0 -0
  115. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/schema.py +0 -0
  116. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/serializer.py +0 -0
  117. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/sqlite.py +0 -0
  118. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/data_storage/warehouse.py +0 -0
  119. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/dataset.py +0 -0
  120. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/diff/__init__.py +0 -0
  121. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/error.py +0 -0
  122. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/fs/__init__.py +0 -0
  123. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/fs/reference.py +0 -0
  124. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/fs/utils.py +0 -0
  125. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/__init__.py +0 -0
  126. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/aggregate.py +0 -0
  127. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/array.py +0 -0
  128. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/base.py +0 -0
  129. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/conditional.py +0 -0
  130. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/func.py +0 -0
  131. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/numeric.py +0 -0
  132. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/path.py +0 -0
  133. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/random.py +0 -0
  134. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/string.py +0 -0
  135. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/func/window.py +0 -0
  136. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/job.py +0 -0
  137. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/__init__.py +0 -0
  138. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/arrow.py +0 -0
  139. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/clip.py +0 -0
  140. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/__init__.py +0 -0
  141. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/flatten.py +0 -0
  142. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/python_to_sql.py +0 -0
  143. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/sql_to_python.py +0 -0
  144. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/unflatten.py +0 -0
  145. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/convert/values_to_tuples.py +0 -0
  146. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/data_model.py +0 -0
  147. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dataset_info.py +0 -0
  148. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/__init__.py +0 -0
  149. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/csv.py +0 -0
  150. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/database.py +0 -0
  151. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/datachain.py +0 -0
  152. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/datasets.py +0 -0
  153. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/hf.py +0 -0
  154. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/json.py +0 -0
  155. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/listings.py +0 -0
  156. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/pandas.py +0 -0
  157. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/parquet.py +0 -0
  158. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/storage.py +0 -0
  159. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/utils.py +0 -0
  160. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/dc/values.py +0 -0
  161. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/file.py +0 -0
  162. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/hf.py +0 -0
  163. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/image.py +0 -0
  164. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/listing.py +0 -0
  165. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/listing_info.py +0 -0
  166. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/meta_formats.py +0 -0
  167. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/model_store.py +0 -0
  168. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/pytorch.py +0 -0
  169. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/settings.py +0 -0
  170. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/signal_schema.py +0 -0
  171. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/tar.py +0 -0
  172. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/text.py +0 -0
  173. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/udf.py +0 -0
  174. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/udf_signature.py +0 -0
  175. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/utils.py +0 -0
  176. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/video.py +0 -0
  177. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/webdataset.py +0 -0
  178. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/lib/webdataset_laion.py +0 -0
  179. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/listing.py +0 -0
  180. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/__init__.py +0 -0
  181. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/bbox.py +0 -0
  182. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/pose.py +0 -0
  183. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/segment.py +0 -0
  184. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/ultralytics/__init__.py +0 -0
  185. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/ultralytics/bbox.py +0 -0
  186. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/ultralytics/pose.py +0 -0
  187. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/ultralytics/segment.py +0 -0
  188. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/model/utils.py +0 -0
  189. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/node.py +0 -0
  190. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/nodes_fetcher.py +0 -0
  191. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/nodes_thread_pool.py +0 -0
  192. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/progress.py +0 -0
  193. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/py.typed +0 -0
  194. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/__init__.py +0 -0
  195. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/batch.py +0 -0
  196. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/dataset.py +0 -0
  197. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/dispatch.py +0 -0
  198. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/metrics.py +0 -0
  199. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/params.py +0 -0
  200. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/queue.py +0 -0
  201. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/schema.py +0 -0
  202. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/session.py +0 -0
  203. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/udf.py +0 -0
  204. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/query/utils.py +0 -0
  205. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/remote/__init__.py +0 -0
  206. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/remote/studio.py +0 -0
  207. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/script_meta.py +0 -0
  208. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/__init__.py +0 -0
  209. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/default/__init__.py +0 -0
  210. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/default/base.py +0 -0
  211. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/__init__.py +0 -0
  212. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/aggregate.py +0 -0
  213. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/array.py +0 -0
  214. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/conditional.py +0 -0
  215. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/numeric.py +0 -0
  216. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/path.py +0 -0
  217. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/random.py +0 -0
  218. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/functions/string.py +0 -0
  219. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/selectable.py +0 -0
  220. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/sqlite/__init__.py +0 -0
  221. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/sqlite/base.py +0 -0
  222. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/sqlite/types.py +0 -0
  223. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/sqlite/vector.py +0 -0
  224. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/types.py +0 -0
  225. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/sql/utils.py +0 -0
  226. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/studio.py +0 -0
  227. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/telemetry.py +0 -0
  228. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/toolkit/__init__.py +0 -0
  229. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/toolkit/split.py +0 -0
  230. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/torch/__init__.py +0 -0
  231. {datachain-0.16.1 → datachain-0.16.2}/src/datachain/utils.py +0 -0
  232. {datachain-0.16.1 → datachain-0.16.2}/src/datachain.egg-info/dependency_links.txt +0 -0
  233. {datachain-0.16.1 → datachain-0.16.2}/src/datachain.egg-info/entry_points.txt +0 -0
  234. {datachain-0.16.1 → datachain-0.16.2}/src/datachain.egg-info/requires.txt +0 -0
  235. {datachain-0.16.1 → datachain-0.16.2}/src/datachain.egg-info/top_level.txt +0 -0
  236. {datachain-0.16.1 → datachain-0.16.2}/tests/__init__.py +0 -0
  237. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/__init__.py +0 -0
  238. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/conftest.py +0 -0
  239. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
  240. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/datasets/.dvc/config +0 -0
  241. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/datasets/.gitignore +0 -0
  242. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
  243. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/test_datachain.py +0 -0
  244. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/test_ls.py +0 -0
  245. {datachain-0.16.1 → datachain-0.16.2}/tests/benchmarks/test_version.py +0 -0
  246. {datachain-0.16.1 → datachain-0.16.2}/tests/conftest.py +0 -0
  247. {datachain-0.16.1 → datachain-0.16.2}/tests/data.py +0 -0
  248. {datachain-0.16.1 → datachain-0.16.2}/tests/examples/__init__.py +0 -0
  249. {datachain-0.16.1 → datachain-0.16.2}/tests/examples/test_examples.py +0 -0
  250. {datachain-0.16.1 → datachain-0.16.2}/tests/examples/test_wds_e2e.py +0 -0
  251. {datachain-0.16.1 → datachain-0.16.2}/tests/examples/wds_data.py +0 -0
  252. {datachain-0.16.1 → datachain-0.16.2}/tests/func/__init__.py +0 -0
  253. {datachain-0.16.1 → datachain-0.16.2}/tests/func/data/Big_Buck_Bunny_360_10s_1MB.mp4 +0 -0
  254. {datachain-0.16.1 → datachain-0.16.2}/tests/func/data/lena.jpg +0 -0
  255. {datachain-0.16.1 → datachain-0.16.2}/tests/func/fake-service-account-credentials.json +0 -0
  256. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/__init__.py +0 -0
  257. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/data/running-mask0.png +0 -0
  258. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/data/running-mask1.png +0 -0
  259. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/data/running.jpg +0 -0
  260. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/data/ships.jpg +0 -0
  261. {datachain-0.16.1 → datachain-0.16.2}/tests/func/model/test_yolo.py +0 -0
  262. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_catalog.py +0 -0
  263. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_client.py +0 -0
  264. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_cloud_transfer.py +0 -0
  265. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_data_storage.py +0 -0
  266. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_datachain.py +0 -0
  267. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_datachain_merge.py +0 -0
  268. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_dataset_query.py +0 -0
  269. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_datasets.py +0 -0
  270. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_feature_pickling.py +0 -0
  271. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_file.py +0 -0
  272. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_hf.py +0 -0
  273. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_hidden_field.py +0 -0
  274. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_image.py +0 -0
  275. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_listing.py +0 -0
  276. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_ls.py +0 -0
  277. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_meta_formats.py +0 -0
  278. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_metrics.py +0 -0
  279. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_pull.py +0 -0
  280. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_pytorch.py +0 -0
  281. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_query.py +0 -0
  282. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_read_database.py +0 -0
  283. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_session.py +0 -0
  284. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_toolkit.py +0 -0
  285. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_video.py +0 -0
  286. {datachain-0.16.1 → datachain-0.16.2}/tests/func/test_warehouse.py +0 -0
  287. {datachain-0.16.1 → datachain-0.16.2}/tests/scripts/feature_class.py +0 -0
  288. {datachain-0.16.1 → datachain-0.16.2}/tests/scripts/feature_class_exception.py +0 -0
  289. {datachain-0.16.1 → datachain-0.16.2}/tests/scripts/feature_class_parallel.py +0 -0
  290. {datachain-0.16.1 → datachain-0.16.2}/tests/scripts/feature_class_parallel_data_model.py +0 -0
  291. {datachain-0.16.1 → datachain-0.16.2}/tests/scripts/name_len_slow.py +0 -0
  292. {datachain-0.16.1 → datachain-0.16.2}/tests/test_atomicity.py +0 -0
  293. {datachain-0.16.1 → datachain-0.16.2}/tests/test_cli_e2e.py +0 -0
  294. {datachain-0.16.1 → datachain-0.16.2}/tests/test_cli_studio.py +0 -0
  295. {datachain-0.16.1 → datachain-0.16.2}/tests/test_import_time.py +0 -0
  296. {datachain-0.16.1 → datachain-0.16.2}/tests/test_query_e2e.py +0 -0
  297. {datachain-0.16.1 → datachain-0.16.2}/tests/test_telemetry.py +0 -0
  298. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/__init__.py +0 -0
  299. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/__init__.py +0 -0
  300. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/conftest.py +0 -0
  301. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_arrow.py +0 -0
  302. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_clip.py +0 -0
  303. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_datachain.py +0 -0
  304. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
  305. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_datachain_merge.py +0 -0
  306. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_diff.py +0 -0
  307. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_feature.py +0 -0
  308. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_feature_utils.py +0 -0
  309. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_file.py +0 -0
  310. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_hf.py +0 -0
  311. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_image.py +0 -0
  312. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_listing_info.py +0 -0
  313. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_python_to_sql.py +0 -0
  314. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_schema.py +0 -0
  315. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_signal_schema.py +0 -0
  316. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_sql_to_python.py +0 -0
  317. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_text.py +0 -0
  318. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_udf_signature.py +0 -0
  319. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_utils.py +0 -0
  320. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/lib/test_webdataset.py +0 -0
  321. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/model/__init__.py +0 -0
  322. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/model/test_bbox.py +0 -0
  323. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/model/test_pose.py +0 -0
  324. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/model/test_segment.py +0 -0
  325. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/model/test_utils.py +0 -0
  326. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/__init__.py +0 -0
  327. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/sqlite/__init__.py +0 -0
  328. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/sqlite/test_types.py +0 -0
  329. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/sqlite/test_utils.py +0 -0
  330. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_array.py +0 -0
  331. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_conditional.py +0 -0
  332. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_path.py +0 -0
  333. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_random.py +0 -0
  334. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_selectable.py +0 -0
  335. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/sql/test_string.py +0 -0
  336. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_asyn.py +0 -0
  337. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_cache.py +0 -0
  338. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_catalog.py +0 -0
  339. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_catalog_loader.py +0 -0
  340. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_cli_parsing.py +0 -0
  341. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_client.py +0 -0
  342. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_client_gcs.py +0 -0
  343. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_client_s3.py +0 -0
  344. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_config.py +0 -0
  345. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_data_storage.py +0 -0
  346. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_database_engine.py +0 -0
  347. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_dataset.py +0 -0
  348. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_dispatch.py +0 -0
  349. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_fileslice.py +0 -0
  350. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_func.py +0 -0
  351. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_listing.py +0 -0
  352. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_metastore.py +0 -0
  353. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_module_exports.py +0 -0
  354. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_pytorch.py +0 -0
  355. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_query.py +0 -0
  356. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_query_metrics.py +0 -0
  357. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_query_params.py +0 -0
  358. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_script_meta.py +0 -0
  359. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_serializer.py +0 -0
  360. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_session.py +0 -0
  361. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_utils.py +0 -0
  362. {datachain-0.16.1 → datachain-0.16.2}/tests/unit/test_warehouse.py +0 -0
  363. {datachain-0.16.1 → datachain-0.16.2}/tests/utils.py +0 -0
@@ -24,7 +24,7 @@ repos:
24
24
  - id: trailing-whitespace
25
25
  exclude: '^LICENSES/'
26
26
  - repo: https://github.com/astral-sh/ruff-pre-commit
27
- rev: 'v0.11.5'
27
+ rev: 'v0.11.6'
28
28
  hooks:
29
29
  - id: ruff
30
30
  args: [--fix, --exit-non-zero-on-fix]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: datachain
3
- Version: 0.16.1
3
+ Version: 0.16.2
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License-Expression: Apache-2.0
@@ -0,0 +1,51 @@
1
+ # auth login
2
+
3
+ Authenticate DataChain with Studio and save a client access token to the DataChain configuration.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain auth login [-h] [-v] [-q] [-H HOSTNAME] [-s SCOPES] [-n NAME] [--no-open] [--local]
9
+ ```
10
+
11
+ ## Description
12
+
13
+ By default, this command authenticates DataChain with Studio using default scopes and assigns a random name as the token name. The authentication token will be used for subsequent Studio operations.
14
+
15
+ ## Options
16
+
17
+ * `-H HOSTNAME`, `--hostname HOSTNAME` - The hostname of the Studio instance to authenticate with.
18
+ * `-s SCOPES`, `--scopes SCOPES` - Authentication token scopes. Allowed scopes: `EXPERIMENTS`, `DATASETS`, `MODELS`. Defaults to all available scopes.
19
+ * `-n NAME`, `--name NAME` - The name of the authentication token. It is used to identify the token in your Studio profile. Defaults to a random name.
20
+ * `--no-open` - Use code-based authentication without a browser. You will be presented with a user code to enter in the browser. DataChain will also use this if it cannot launch the browser on your behalf.
21
+ * `--local` - Save the token in the local project config instead of the global configuration.
22
+ * `-h`, `--help` - Show the help message and exit.
23
+ * `-v`, `--verbose` - Be verbose.
24
+ * `-q`, `--quiet` - Be quiet.
25
+
26
+ ## Examples
27
+
28
+ 1. Basic authentication with default settings:
29
+ ```bash
30
+ datachain auth login
31
+ ```
32
+
33
+ 2. Authenticate with specific scopes:
34
+ ```bash
35
+ datachain auth login --scopes EXPERIMENTS,DATASETS
36
+ ```
37
+
38
+ 3. Authenticate with a custom token name:
39
+ ```bash
40
+ datachain auth login --name my-token
41
+ ```
42
+
43
+ 4. Authenticate using code-based flow:
44
+ ```bash
45
+ datachain auth login --no-open
46
+ ```
47
+
48
+ 5. Save token locally for the project:
49
+ ```bash
50
+ datachain auth login --local
51
+ ```
@@ -0,0 +1,37 @@
1
+ # auth logout
2
+
3
+ Remove the Studio authentication token from DataChain configuration.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain auth logout [-h] [-v] [-q] [--local]
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command removes the Studio authentication token from the DataChain configuration. By default, the token is removed from the global configuration; use the `--local` option to remove it from the local project configuration instead.
14
+
15
+ ## Options
16
+
17
+ * `--local` - Remove the token from the local project config instead of the global configuration.
18
+ * `-h`, `--help` - Show the help message and exit.
19
+ * `-v`, `--verbose` - Be verbose.
20
+ * `-q`, `--quiet` - Be quiet.
21
+
22
+ ## Examples
23
+
24
+ 1. Remove token from global configuration:
25
+ ```bash
26
+ datachain auth logout
27
+ ```
28
+
29
+ 2. Remove token from local project configuration:
30
+ ```bash
31
+ datachain auth logout --local
32
+ ```
33
+
34
+ 3. Remove token with verbose output:
35
+ ```bash
36
+ datachain auth logout -v
37
+ ```
@@ -0,0 +1,36 @@
1
+ # auth team
2
+
3
+ Set the default team for Studio operations.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain auth team [-h] [-v] [-q] [--global] team_name
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command sets the default team for Studio operations. By default, the team setting is project-specific, but you can use the `--global` option to set it for all projects.
14
+
15
+ ## Arguments
16
+
17
+ * `team_name` - Name of the team to set as default
18
+
19
+ ## Options
20
+
21
+ * `--global` - Set team globally for all projects
22
+ * `-h`, `--help` - Show the help message and exit.
23
+ * `-v`, `--verbose` - Be verbose.
24
+ * `-q`, `--quiet` - Be quiet.
25
+
26
+ ## Examples
27
+
28
+ 1. Set default team for current project:
29
+ ```bash
30
+ datachain auth team my-team
31
+ ```
32
+
33
+ 2. Set default team globally for all projects:
34
+ ```bash
35
+ datachain auth team --global my-team
36
+ ```
@@ -0,0 +1,26 @@
1
+ # auth token
2
+
3
+ Display the current authentication token for Studio.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain auth token [-h] [-v] [-q]
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command displays the current authentication token that DataChain is using for Studio operations. The token is used for authenticating with Studio and accessing its features.
14
+
15
+ ## Options
16
+
17
+ * `-h`, `--help` - Show the help message and exit.
18
+ * `-v`, `--verbose` - Be verbose.
19
+ * `-q`, `--quiet` - Be quiet.
20
+
21
+ ## Examples
22
+
23
+ 1. Display the current token:
24
+ ```bash
25
+ datachain auth token
26
+ ```
@@ -0,0 +1,33 @@
1
+
2
+ # Using DataChain Commands
3
+
4
+
5
+
6
+ DataChain is a command-line tool for wrangling unstructured AI data at scale. Use `datachain -h` to list all available commands.
7
+
8
+
9
+
10
+ ## Typical DataChain Workflow
11
+
12
+
13
+
14
+ 1. **Authentication with Studio**
15
+
16
+
17
+ - Use [`datachain auth login`](auth/login.md) to authenticate with Studio
18
+
19
+ - Set your default team with [`datachain auth team`](auth/team.md)
20
+
21
+ - View your token with [`datachain auth token`](auth/token.md)
22
+
23
+ - Log out from Studio with [`datachain auth logout`](auth/logout.md)
24
+
25
+
26
+
27
+ 2. **Job Management**
28
+
29
+ - Run jobs in Studio with [`datachain job run`](job/run.md)
30
+
31
+ - Monitor job logs with [`datachain job logs`](job/logs.md)
32
+
33
+ - Cancel running jobs with [`datachain job cancel`](job/cancel.md)
@@ -0,0 +1,43 @@
1
+ # job cancel
2
+
3
+ Cancel a running job in Studio.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain job cancel [-h] [-v] [-q] [--team TEAM] id
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command cancels a running job in Studio. The job ID can be obtained from the Studio UI or from the output when the job was created. This is the recommended way to stop a running job, as simply closing the logs view (e.g., with Ctrl+C) will not cancel the job execution.
14
+
15
+ ## Arguments
16
+
17
+ * `id` - Job ID to cancel. This ID is displayed when the job is created and can also be found in the Studio UI.
18
+
19
+ ## Options
20
+
21
+ * `--team TEAM` - Team to cancel job for (default: from config)
22
+ * `-h`, `--help` - Show the help message and exit.
23
+ * `-v`, `--verbose` - Be verbose.
24
+ * `-q`, `--quiet` - Be quiet.
25
+
26
+ ## Examples
27
+
28
+ 1. Cancel a specific job:
29
+ ```bash
30
+ datachain job cancel job-123
31
+ ```
32
+
33
+ 2. Cancel a job in a specific team:
34
+ ```bash
35
+ datachain job cancel --team my-team job-123
36
+ ```
37
+
38
+
39
+ ## Notes
40
+
41
+ * The job ID is displayed when the job is created using `datachain job run`
42
+ * You can also find the job ID in the Studio UI
43
+ * This is the proper way to stop a running job, as simply closing the logs view will not cancel the job execution
@@ -0,0 +1,47 @@
1
+ # job logs
2
+
3
+ Display logs and current status of jobs in Studio.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain job logs [-h] [-v] [-q] [--team TEAM] id
9
+ ```
10
+
11
+ ## Description
12
+
13
+ This command displays the logs and current status of a running job in Studio. The command will show real-time logs from the job execution. Note that closing this command (e.g., with Ctrl+C) will only stop displaying the logs but will not cancel the job execution. To cancel a job, use the `job cancel` command.
14
+
15
+ ## Arguments
16
+
17
+ * `id` - Job ID to show logs for
18
+
19
+ ## Options
20
+
21
+ * `--team TEAM` - Team to check logs for (default: from config)
22
+ * `-h`, `--help` - Show the help message and exit.
23
+ * `-v`, `--verbose` - Be verbose.
24
+ * `-q`, `--quiet` - Be quiet.
25
+
26
+ ## Examples
27
+
28
+ 1. Display logs for a specific job:
29
+ ```bash
30
+ datachain job logs job-123
31
+ ```
32
+
33
+ 2. Display logs for a job in a specific team:
34
+ ```bash
35
+ datachain job logs --team my-team job-123
36
+ ```
37
+
38
+ 3. Display logs with verbose output:
39
+ ```bash
40
+ datachain job logs -v job-123
41
+ ```
42
+
43
+ ## Notes
44
+
45
+ * Closing the logs command (e.g., with Ctrl+C) will only stop displaying the logs but will not cancel the job execution
46
+ * To cancel a running job, use the `datachain job cancel` command
47
+ * The job will continue running in Studio even after you stop viewing the logs
@@ -0,0 +1,67 @@
1
+ # job run
2
+
3
+ Run a job in Studio.
4
+
5
+ ## Synopsis
6
+
7
+ ```usage
8
+ usage: datachain job run [-h] [-v] [-q] [--team TEAM] [--env-file ENV_FILE] [--env ENV [ENV ...]]
9
+ [--workers WORKERS] [--files FILES [FILES ...]] [--python-version PYTHON_VERSION]
10
+ [--req-file REQ_FILE] [--req REQ [REQ ...]]
11
+ file
12
+ ```
13
+
14
+ ## Description
15
+
16
+ This command runs a job in Studio using the specified query file. You can configure various aspects of the job including environment variables, Python version, dependencies, and more.
17
+
18
+ ## Arguments
19
+
20
+ * `file` - Query file to run
21
+
22
+ ## Options
23
+
24
+ * `--team TEAM` - Team to run job for (default: from config)
25
+ * `--env-file ENV_FILE` - File with environment variables for the job
26
+ * `--env ENV` - Environment variables in KEY=VALUE format
27
+ * `--workers WORKERS` - Number of workers for the job
28
+ * `--files FILES` - Additional files to include in the job
29
+ * `--python-version PYTHON_VERSION` - Python version for the job (e.g., 3.9, 3.10, 3.11)
30
+ * `--req-file REQ_FILE` - Python requirements file
31
+ * `--req REQ` - Python package requirements
32
+ * `-h`, `--help` - Show the help message and exit.
33
+ * `-v`, `--verbose` - Be verbose.
34
+ * `-q`, `--quiet` - Be quiet.
35
+
36
+ ## Examples
37
+
38
+ 1. Run a basic job:
39
+ ```bash
40
+ datachain job run query.py
41
+ ```
42
+
43
+ 2. Run a job with specific team and Python version:
44
+ ```bash
45
+ datachain job run --team my-team --python-version 3.11 query.py
46
+ ```
47
+
48
+ 3. Run a job with environment variables and requirements:
49
+ ```bash
50
+ datachain job run --env-file .env --req-file requirements.txt query.py
51
+ ```
52
+
53
+ 4. Run a job with multiple workers and additional files:
54
+ ```bash
55
+ datachain job run --workers 4 --files utils.py config.json query.py
56
+ ```
57
+
58
+ 5. Run a job with inline environment variables and package requirements:
59
+ ```bash
60
+ datachain job run --env API_KEY=123 --req pandas numpy query.py
61
+ ```
62
+
63
+ ## Notes
64
+
65
+ * Interrupting this command while it is displaying job logs (e.g., with Ctrl+C) will only stop displaying the logs but will not cancel the job execution
66
+ * To cancel a running job, use the `datachain job cancel` command
67
+ * The job will continue running in Studio even after you stop viewing the logs
@@ -84,6 +84,18 @@ nav:
84
84
  - Torch: references/torch.md
85
85
  - Functions: references/func.md
86
86
  - Toolkit: references/toolkit.md
87
+ - 📖 CLI Reference:
88
+ - Overview: commands/index.md
89
+ - Commands:
90
+ - auth:
91
+ - login: commands/auth/login.md
92
+ - logout: commands/auth/logout.md
93
+ - token: commands/auth/token.md
94
+ - team: commands/auth/team.md
95
+ - job:
96
+ - run: commands/job/run.md
97
+ - logs: commands/job/logs.md
98
+ - cancel: commands/job/cancel.md
87
99
  - 📡 Interacting with remote storage: references/remotes.md
88
100
  - 🤝 Contributing: contributing.md
89
101
 
@@ -38,8 +38,9 @@ def read_records(
38
38
  single_record = dc.read_records(dc.DEFAULT_FILE_RECORD)
39
39
  ```
40
40
  """
41
- from datachain.query.dataset import adjust_outputs, get_col_types
41
+ from datachain.query.dataset import INSERT_BATCH_SIZE, adjust_outputs, get_col_types
42
42
  from datachain.sql.types import SQLType
43
+ from datachain.utils import batched
43
44
 
44
45
  from .datasets import read_dataset
45
46
 
@@ -89,6 +90,7 @@ def read_records(
89
90
  {c.name: c.type for c in columns if isinstance(c.type, SQLType)},
90
91
  )
91
92
  records = (adjust_outputs(warehouse, record, col_types) for record in to_insert)
92
- warehouse.insert_rows(table, records)
93
+ for chunk in batched(records, INSERT_BATCH_SIZE):
94
+ warehouse.insert_rows(table, chunk)
93
95
  warehouse.insert_rows_done(table)
94
96
  return read_dataset(name=dsr.name, session=session, settings=settings)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: datachain
3
- Version: 0.16.1
3
+ Version: 0.16.2
4
4
  Summary: Wrangle unstructured AI data at scale
5
5
  Author-email: Dmitry Petrov <support@dvc.org>
6
6
  License-Expression: Apache-2.0
@@ -26,6 +26,14 @@ docs/tutorials.md
26
26
  docs/assets/captioned_cartoons.png
27
27
  docs/assets/datachain-white.svg
28
28
  docs/assets/datachain.svg
29
+ docs/commands/index.md
30
+ docs/commands/auth/login.md
31
+ docs/commands/auth/logout.md
32
+ docs/commands/auth/team.md
33
+ docs/commands/auth/token.md
34
+ docs/commands/job/cancel.md
35
+ docs/commands/job/logs.md
36
+ docs/commands/job/run.md
29
37
  docs/css/github-permalink-style.css
30
38
  docs/overrides/main.html
31
39
  docs/references/datachain.md
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes