datachain 0.19.1__tar.gz → 0.20.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of datachain might be problematic. Click here for more details.
- {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/tests-studio.yml +1 -0
- {datachain-0.19.1 → datachain-0.20.0}/PKG-INFO +2 -2
- datachain-0.20.0/docs/commands/auth/team.md +42 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/index.md +2 -0
- datachain-0.20.0/docs/commands/job/clusters.md +39 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/run.md +10 -0
- datachain-0.20.0/docs/guide/env.md +18 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/guide/index.md +1 -0
- {datachain-0.19.1 → datachain-0.20.0}/mkdocs.yml +2 -0
- {datachain-0.19.1 → datachain-0.20.0}/pyproject.toml +1 -1
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/__init__.py +3 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/catalog.py +180 -65
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/__init__.py +0 -7
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/datasets.py +43 -28
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/__init__.py +1 -35
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/job.py +25 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/studio.py +11 -4
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/metastore.py +390 -37
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/schema.py +23 -1
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/sqlite.py +139 -7
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/warehouse.py +26 -7
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/dataset.py +125 -12
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/delta.py +9 -5
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/error.py +36 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dataset_info.py +4 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/datachain.py +86 -7
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/datasets.py +62 -12
- datachain-0.20.0/src/datachain/lib/dc/listings.py +154 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/records.py +1 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/storage.py +14 -2
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/listing.py +3 -1
- datachain-0.20.0/src/datachain/lib/namespaces.py +73 -0
- datachain-0.20.0/src/datachain/lib/projects.py +86 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/settings.py +10 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/listing.py +3 -1
- datachain-0.20.0/src/datachain/namespace.py +65 -0
- datachain-0.20.0/src/datachain/project.py +78 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/dataset.py +71 -46
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/session.py +1 -1
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/remote/studio.py +67 -26
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/studio.py +68 -8
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/PKG-INFO +2 -2
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/SOURCES.txt +8 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/requires.txt +1 -1
- {datachain-0.19.1 → datachain-0.20.0}/tests/conftest.py +81 -4
- {datachain-0.19.1 → datachain-0.20.0}/tests/examples/test_examples.py +2 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_batching.py +5 -5
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_dataset_query.py +20 -2
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datasets.py +113 -81
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_metastore.py +30 -10
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_pull.py +69 -18
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_atomicity.py +4 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_cli_e2e.py +43 -10
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_cli_studio.py +46 -32
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain.py +107 -4
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_listing_info.py +9 -2
- datachain-0.20.0/tests/unit/lib/test_namespace.py +87 -0
- datachain-0.20.0/tests/unit/lib/test_project.py +184 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_dataset.py +25 -1
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_listing.py +20 -4
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_metastore.py +35 -3
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_session.py +32 -9
- {datachain-0.19.1 → datachain-0.20.0}/tests/utils.py +1 -1
- datachain-0.19.1/docs/commands/auth/team.md +0 -36
- datachain-0.19.1/src/datachain/lib/dc/listings.py +0 -43
- {datachain-0.19.1 → datachain-0.20.0}/.cruft.json +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.gitattributes +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/codecov.yaml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/dependabot.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/benchmarks.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/release.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/tests.yml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.github/workflows/update-template.yaml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.gitignore +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/.pre-commit-config.yaml +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/CODE_OF_CONDUCT.rst +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/LICENSE +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/README.rst +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/assets/captioned_cartoons.png +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/assets/datachain-white.svg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/assets/datachain.svg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/login.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/logout.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/auth/token.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/cancel.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/logs.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/commands/job/ls.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/contributing.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/css/github-permalink-style.css +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/examples.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/guide/delta.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/guide/processing.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/guide/remotes.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/guide/retry.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/index.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/overrides/main.html +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/quick-start.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/arrowrow.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/bbox.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/file.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/imagefile.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/index.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/pose.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/segment.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/tarvfile.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/textfile.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/data-types/videofile.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/datachain.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/func.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/index.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/toolkit.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/torch.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/references/udf.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/docs/tutorials.md +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/openimage-detect.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-bbox.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-pose.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/computer_vision/ultralytics-segment.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/common_sql_functions.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/json-csv-reader.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/torch-loader.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/parallel.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/simple.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/get_started/udfs/stateful.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/delta.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/retry.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/incremental_processing/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/llm_and_nlp/claude-query.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/llm_and_nlp/hf-dataset-llm-eval.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/clip_inference.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/hf_pipeline.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/openai_image_desc_lib.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/wds.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/examples/multimodal/wds_filtered.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/noxfile.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/setup.cfg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/__main__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/asyn.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cache.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/datasource.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/catalog/loader.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/du.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/index.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/ls.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/misc.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/query.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/commands/show.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/parser/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/cli/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/azure.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/fileslice.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/fsspec.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/gcs.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/hf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/local.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/client/s3.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/config.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/db_engine.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/job.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/data_storage/serializer.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/diff/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/reference.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/fs/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/aggregate.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/array.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/base.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/conditional.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/func.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/numeric.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/path.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/random.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/string.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/func/window.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/job.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/arrow.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/clip.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/flatten.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/python_to_sql.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/sql_to_python.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/unflatten.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/convert/values_to_tuples.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/data_model.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/csv.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/database.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/hf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/json.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/pandas.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/parquet.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/dc/values.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/file.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/hf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/image.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/listing_info.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/meta_formats.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/model_store.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/pytorch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/signal_schema.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/tar.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/text.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/udf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/udf_signature.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/video.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/webdataset.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/lib/webdataset_laion.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/bbox.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/pose.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/segment.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/bbox.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/pose.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/ultralytics/segment.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/model/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/node.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/nodes_fetcher.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/nodes_thread_pool.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/progress.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/py.typed +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/batch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/dispatch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/metrics.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/params.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/queue.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/schema.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/udf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/query/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/remote/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/script_meta.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/semver.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/default/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/default/base.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/aggregate.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/array.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/conditional.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/numeric.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/path.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/random.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/functions/string.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/selectable.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/base.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/types.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/sqlite/vector.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/types.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/sql/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/telemetry.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/toolkit/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/toolkit/split.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/torch/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain/utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/dependency_links.txt +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/entry_points.txt +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/src/datachain.egg-info/top_level.txt +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/conftest.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.dvc/config +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/.gitignore +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_datachain.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_ls.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/benchmarks/test_version.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/data.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/examples/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/examples/test_wds_e2e.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/examples/wds_data.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/data/Big_Buck_Bunny_360_10s_1MB.mp4 +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/data/lena.jpg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/fake-service-account-credentials.json +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_aggregate.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_array.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_conditional.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_numeric.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_path.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_random.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/functions/test_string.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running-mask0.png +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running-mask1.png +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/running.jpg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/data/ships.jpg +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/model/test_yolo.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_catalog.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_client.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_cloud_transfer.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_data_storage.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datachain.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_datachain_merge.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_delta.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_feature_pickling.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_file.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_hf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_hidden_field.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_image.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_listing.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_ls.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_meta_formats.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_metrics.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_pytorch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_query.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_read_database.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_retry.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_session.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_toolkit.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_video.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/func/test_warehouse.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_exception.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_parallel.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/feature_class_parallel_data_model.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/scripts/name_len_slow.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_import_time.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_query_e2e.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/test_telemetry.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/conftest.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_arrow.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_clip.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_datachain_merge.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_diff.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_feature.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_feature_utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_file.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_hf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_image.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_python_to_sql.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_schema.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_signal_schema.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_sql_to_python.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_text.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_udf.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_udf_signature.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/lib/test_webdataset.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_bbox.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_pose.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_segment.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/model/test_utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/__init__.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/test_types.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/sqlite/test_utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_array.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_conditional.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_path.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_random.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_selectable.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/sql/test_string.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_asyn.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_cache.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_catalog.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_catalog_loader.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_cli_parsing.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client_gcs.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_client_s3.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_config.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_data_storage.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_database_engine.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_dispatch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_fileslice.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_func.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_module_exports.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_pytorch.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query_metrics.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_query_params.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_script_meta.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_semver.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_serializer.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_utils.py +0 -0
- {datachain-0.19.1 → datachain-0.20.0}/tests/unit/test_warehouse.py +0 -0
|
@@ -98,6 +98,7 @@ jobs:
|
|
|
98
98
|
- name: Run tests
|
|
99
99
|
# Generate `.test_durations` file with `pytest --store-durations --durations-path ../.github/.test_durations ...`
|
|
100
100
|
run: >
|
|
101
|
+
DATACHAIN_METASTORE_ARG_PROJECT=john
|
|
101
102
|
PYTHONPATH="$(pwd)/..:${PYTHONPATH}"
|
|
102
103
|
pytest
|
|
103
104
|
--config-file=pyproject.toml -rs
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: datachain
|
|
3
|
-
Version: 0.19.1
|
|
3
|
+
Version: 0.20.0
|
|
4
4
|
Summary: Wrangle unstructured AI data at scale
|
|
5
5
|
Author-email: Dmitry Petrov <support@dvc.org>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -94,7 +94,7 @@ Requires-Dist: scipy; extra == "tests"
|
|
|
94
94
|
Requires-Dist: ultralytics; extra == "tests"
|
|
95
95
|
Provides-Extra: dev
|
|
96
96
|
Requires-Dist: datachain[docs,tests]; extra == "dev"
|
|
97
|
-
Requires-Dist: mypy==1.16.
|
|
97
|
+
Requires-Dist: mypy==1.16.1; extra == "dev"
|
|
98
98
|
Requires-Dist: types-python-dateutil; extra == "dev"
|
|
99
99
|
Requires-Dist: types-pytz; extra == "dev"
|
|
100
100
|
Requires-Dist: types-PyYAML; extra == "dev"
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
# auth team
|
|
2
|
+
|
|
3
|
+
Set the default team for Studio operations.
|
|
4
|
+
|
|
5
|
+
## Synopsis
|
|
6
|
+
|
|
7
|
+
```usage
|
|
8
|
+
usage: datachain auth team [-h] [-v] [-q] [--local] [team_name]
|
|
9
|
+
```
|
|
10
|
+
|
|
11
|
+
## Description
|
|
12
|
+
|
|
13
|
+
This command sets or shows the default team for Studio operations. By default, the team setting is saved globally; use the `--local` option to save it for the current project only.
|
|
14
|
+
If `team_name` is not passed, the team currently in use is shown.
|
|
15
|
+
|
|
16
|
+
## Arguments
|
|
17
|
+
|
|
18
|
+
* `team_name` - Optional. Name of the team to set as default.
|
|
19
|
+
|
|
20
|
+
## Options
|
|
21
|
+
|
|
22
|
+
* `--local` - Set team locally for the current project
|
|
23
|
+
* `-h`, `--help` - Show the help message and exit.
|
|
24
|
+
* `-v`, `--verbose` - Be verbose.
|
|
25
|
+
* `-q`, `--quiet` - Be quiet.
|
|
26
|
+
|
|
27
|
+
## Examples
|
|
28
|
+
|
|
29
|
+
1. Set default team for all projects:
|
|
30
|
+
```bash
|
|
31
|
+
datachain auth team my-team
|
|
32
|
+
```
|
|
33
|
+
|
|
34
|
+
2. Set default team locally for the current project:
|
|
35
|
+
```bash
|
|
36
|
+
datachain auth team --local my-team
|
|
37
|
+
```
|
|
38
|
+
|
|
39
|
+
3. Print the default team currently in use:
|
|
40
|
+
```bash
|
|
41
|
+
datachain auth team
|
|
42
|
+
```
|
|
@@ -31,3 +31,5 @@ DataChain is a command-line tool for wrangling unstructured AI data at scale. Us
|
|
|
31
31
|
- Monitor job logs with [`datachain job logs`](job/logs.md)
|
|
32
32
|
|
|
33
33
|
- Cancel running jobs with [`datachain job cancel`](job/cancel.md)
|
|
34
|
+
|
|
35
|
+
- Check the clusters available for jobs with [`datachain job clusters`](job/clusters.md)
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
# job clusters
|
|
2
|
+
|
|
3
|
+
List compute clusters in Studio.
|
|
4
|
+
|
|
5
|
+
## Synopsis
|
|
6
|
+
|
|
7
|
+
```usage
|
|
8
|
+
usage: datachain job clusters [-h] [-v] [-q] [--team TEAM]
|
|
9
|
+
```
|
|
10
|
+
|
|
11
|
+
## Description
|
|
12
|
+
|
|
13
|
+
This command lists compute clusters available in Studio. You can specify a team to list clusters for. The command provides information about the compute resources available for running jobs.
|
|
14
|
+
|
|
15
|
+
## Options
|
|
16
|
+
|
|
17
|
+
* `--team TEAM` - Team to list clusters for (default: from config)
|
|
18
|
+
* `-h`, `--help` - Show the help message and exit
|
|
19
|
+
* `-v`, `--verbose` - Be verbose
|
|
20
|
+
* `-q`, `--quiet` - Be quiet
|
|
21
|
+
|
|
22
|
+
## Examples
|
|
23
|
+
|
|
24
|
+
1. List all clusters for the default team:
|
|
25
|
+
```bash
|
|
26
|
+
datachain job clusters
|
|
27
|
+
```
|
|
28
|
+
|
|
29
|
+
2. List clusters for a specific team:
|
|
30
|
+
```bash
|
|
31
|
+
datachain job clusters --team my-team
|
|
32
|
+
```
|
|
33
|
+
|
|
34
|
+
|
|
35
|
+
## Notes
|
|
36
|
+
|
|
37
|
+
* The command shows all compute clusters available to your team
|
|
38
|
+
* Clusters represent the compute resources where your jobs can run
|
|
39
|
+
* Use the `--team` option to view clusters for a different team
|
|
@@ -24,6 +24,7 @@ This command runs a job in Studio using the specified query file. You can config
|
|
|
24
24
|
* `--team TEAM` - Team to run job for (default: from config)
|
|
25
25
|
* `--env-file ENV_FILE` - File with environment variables for the job
|
|
26
26
|
* `--env ENV` - Environment variables in KEY=VALUE format
|
|
27
|
+
* `--cluster-id CLUSTER_ID` - Compute cluster ID to run the job on
|
|
27
28
|
* `--workers WORKERS` - Number of workers for the job
|
|
28
29
|
* `--files FILES` - Additional files to include in the job
|
|
29
30
|
* `--python-version PYTHON_VERSION` - Python version for the job (e.g., 3.9, 3.10, 3.11)
|
|
@@ -71,8 +72,17 @@ datachain job run --repository https://github.com/iterative/datachain query.py
|
|
|
71
72
|
datachain job run --priority 2 query.py
|
|
72
73
|
```
|
|
73
74
|
|
|
75
|
+
8. Run a job on a specific cluster:
|
|
76
|
+
```bash
|
|
77
|
+
# Get the cluster ID using the following command
|
|
78
|
+
datachain job clusters
|
|
79
|
+
# Use the ID of an active cluster from the output above
|
|
80
|
+
datachain job run --cluster-id 1 query.py
|
|
81
|
+
```
|
|
82
|
+
|
|
74
83
|
## Notes
|
|
75
84
|
|
|
76
85
|
* Closing the logs command (e.g., with Ctrl+C) will only stop displaying the logs but will not cancel the job execution
|
|
77
86
|
* To cancel a running job, use the `datachain job cancel` command
|
|
78
87
|
* The job will continue running in Studio even after you stop viewing the logs
|
|
88
|
+
* You can get the list of compute clusters using the `datachain job clusters` command.
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Environment Variables
|
|
2
|
+
|
|
3
|
+
List of environment variables used to configure DataChain behavior.
|
|
4
|
+
|
|
5
|
+
### Core Configuration
|
|
6
|
+
|
|
7
|
+
- `DATACHAIN_ROOT_DIR` – Specifies the root directory where DataChain will create the `.datachain` folder to store its internal data (default: the current working directory).
|
|
8
|
+
- `DATACHAIN_SYSTEM_CONFIG_DIR` – Overrides the system-wide configuration directory (default depends on the platform).
|
|
9
|
+
- `DATACHAIN_GLOBAL_CONFIG_DIR` – Overrides the user's global configuration directory (default depends on the platform).
|
|
10
|
+
- `DATACHAIN_NO_ANALYTICS` – Disables telemetry.
|
|
11
|
+
|
|
12
|
+
### Studio Integration
|
|
13
|
+
|
|
14
|
+
- `DATACHAIN_STUDIO_URL` – Custom Studio URL.
|
|
15
|
+
- `DATACHAIN_STUDIO_TOKEN` – Authentication token for Studio.
|
|
16
|
+
- `DATACHAIN_STUDIO_TEAM` – Studio team name.
|
|
17
|
+
|
|
18
|
+
Note: Some environment variables are used internally and may not be documented here. For the most up-to-date list, refer to the source code.
|
|
@@ -10,3 +10,4 @@ Welcome to the DataChain User Guide! This section provides comprehensive documen
|
|
|
10
10
|
- [Data Processing Overview](./processing.md) - Discover DataChain's specialized data processing features.
|
|
11
11
|
- [Delta Processing](./delta.md) - Incremental data processing to efficiently handle large datasets that change over time.
|
|
12
12
|
- [Error Handling and Retries](./retry.md) - Learn how to handle processing errors and selectively reprocess problematic records.
|
|
13
|
+
- [Environment Variables](./env.md) - Configure DataChain's behavior using environment variables.
|
|
@@ -97,6 +97,7 @@ nav:
|
|
|
97
97
|
- logs: commands/job/logs.md
|
|
98
98
|
- cancel: commands/job/cancel.md
|
|
99
99
|
- ls: commands/job/ls.md
|
|
100
|
+
- clusters: commands/job/clusters.md
|
|
100
101
|
- 📚 User Guide:
|
|
101
102
|
- Overview: guide/index.md
|
|
102
103
|
- 📡 Interacting with remote storage: guide/remotes.md
|
|
@@ -104,6 +105,7 @@ nav:
|
|
|
104
105
|
- Overview: guide/processing.md
|
|
105
106
|
- Delta Processing: guide/delta.md
|
|
106
107
|
- Errors Handling and Retries: guide/retry.md
|
|
108
|
+
- Environment Variables: guide/env.md
|
|
107
109
|
- 🤝 Contributing: contributing.md
|
|
108
110
|
|
|
109
111
|
- DataChain Website ↗: https://datachain.ai" target="_blank"
|
|
@@ -1,3 +1,4 @@
|
|
|
1
|
+
from datachain.lib import namespaces, projects
|
|
1
2
|
from datachain.lib.data_model import DataModel, DataType, is_chain_type
|
|
2
3
|
from datachain.lib.dc import (
|
|
3
4
|
C,
|
|
@@ -67,7 +68,9 @@ __all__ = [
|
|
|
67
68
|
"is_chain_type",
|
|
68
69
|
"listings",
|
|
69
70
|
"metrics",
|
|
71
|
+
"namespaces",
|
|
70
72
|
"param",
|
|
73
|
+
"projects",
|
|
71
74
|
"read_csv",
|
|
72
75
|
"read_database",
|
|
73
76
|
"read_dataset",
|