datachain 0.19.2__tar.gz → 0.20.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of datachain might be problematic. Click here for more details.
- {datachain-0.19.2 → datachain-0.20.1}/.github/workflows/tests-studio.yml +1 -0
- {datachain-0.19.2 → datachain-0.20.1}/PKG-INFO +2 -2
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/job/run.md +1 -1
- datachain-0.20.1/docs/guide/env.md +18 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/guide/index.md +1 -0
- {datachain-0.19.2 → datachain-0.20.1}/mkdocs.yml +1 -0
- {datachain-0.19.2 → datachain-0.20.1}/pyproject.toml +1 -1
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/__init__.py +3 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/catalog/catalog.py +180 -65
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/__init__.py +0 -7
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/datasets.py +43 -28
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/parser/__init__.py +1 -35
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/parser/job.py +3 -3
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/metastore.py +390 -37
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/sqlite.py +139 -7
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/warehouse.py +26 -7
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/dataset.py +125 -12
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/delta.py +9 -5
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/error.py +36 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dataset_info.py +4 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/datachain.py +86 -7
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/datasets.py +62 -12
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/listings.py +3 -3
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/records.py +1 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/storage.py +14 -2
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/listing.py +3 -1
- datachain-0.20.1/src/datachain/lib/namespaces.py +73 -0
- datachain-0.20.1/src/datachain/lib/projects.py +86 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/settings.py +10 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/listing.py +3 -1
- datachain-0.20.1/src/datachain/namespace.py +65 -0
- datachain-0.20.1/src/datachain/project.py +78 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/dataset.py +71 -46
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/session.py +1 -1
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/remote/studio.py +63 -28
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/studio.py +26 -9
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/PKG-INFO +2 -2
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/SOURCES.txt +7 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/requires.txt +1 -1
- {datachain-0.19.2 → datachain-0.20.1}/tests/conftest.py +81 -4
- {datachain-0.19.2 → datachain-0.20.1}/tests/examples/test_examples.py +2 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_batching.py +5 -5
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_dataset_query.py +20 -2
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_datasets.py +113 -81
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_metastore.py +30 -10
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_pull.py +69 -18
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_atomicity.py +4 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_cli_e2e.py +43 -10
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_cli_studio.py +43 -32
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_datachain.py +55 -3
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_listing_info.py +9 -2
- datachain-0.20.1/tests/unit/lib/test_namespace.py +87 -0
- datachain-0.20.1/tests/unit/lib/test_project.py +184 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_dataset.py +25 -1
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_listing.py +20 -4
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_metastore.py +35 -3
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_session.py +32 -9
- {datachain-0.19.2 → datachain-0.20.1}/tests/utils.py +1 -1
- {datachain-0.19.2 → datachain-0.20.1}/.cruft.json +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.gitattributes +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/codecov.yaml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/dependabot.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/workflows/benchmarks.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/workflows/release.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/workflows/tests.yml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.github/workflows/update-template.yaml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.gitignore +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/.pre-commit-config.yaml +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/CODE_OF_CONDUCT.rst +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/LICENSE +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/README.rst +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/assets/captioned_cartoons.png +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/assets/datachain-white.svg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/assets/datachain.svg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/auth/login.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/auth/logout.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/auth/team.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/auth/token.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/index.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/job/cancel.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/job/clusters.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/job/logs.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/commands/job/ls.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/contributing.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/css/github-permalink-style.css +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/examples.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/guide/delta.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/guide/processing.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/guide/remotes.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/guide/retry.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/index.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/overrides/main.html +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/quick-start.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/arrowrow.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/bbox.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/file.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/imagefile.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/index.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/pose.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/segment.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/tarvfile.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/textfile.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/data-types/videofile.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/datachain.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/func.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/index.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/toolkit.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/torch.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/references/udf.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/docs/tutorials.md +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/openimage-detect.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/ultralytics-bbox.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/ultralytics-pose.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/computer_vision/ultralytics-segment.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/common_sql_functions.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/json-csv-reader.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/torch-loader.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/udfs/parallel.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/udfs/simple.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/get_started/udfs/stateful.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/incremental_processing/delta.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/incremental_processing/retry.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/incremental_processing/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/llm_and_nlp/claude-query.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/llm_and_nlp/hf-dataset-llm-eval.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/multimodal/clip_inference.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/multimodal/hf_pipeline.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/multimodal/openai_image_desc_lib.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/multimodal/wds.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/examples/multimodal/wds_filtered.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/noxfile.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/setup.cfg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/__main__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/asyn.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cache.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/catalog/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/catalog/datasource.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/catalog/loader.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/du.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/index.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/ls.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/misc.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/query.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/commands/show.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/parser/studio.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/parser/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/cli/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/azure.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/fileslice.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/fsspec.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/gcs.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/hf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/local.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/client/s3.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/config.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/db_engine.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/job.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/schema.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/data_storage/serializer.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/diff/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/fs/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/fs/reference.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/fs/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/aggregate.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/array.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/base.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/conditional.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/func.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/numeric.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/path.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/random.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/string.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/func/window.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/job.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/arrow.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/clip.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/flatten.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/python_to_sql.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/sql_to_python.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/unflatten.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/convert/values_to_tuples.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/data_model.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/csv.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/database.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/hf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/json.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/pandas.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/parquet.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/dc/values.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/file.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/hf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/image.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/listing_info.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/meta_formats.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/model_store.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/pytorch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/signal_schema.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/tar.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/text.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/udf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/udf_signature.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/video.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/webdataset.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/lib/webdataset_laion.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/bbox.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/pose.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/segment.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/ultralytics/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/ultralytics/bbox.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/ultralytics/pose.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/ultralytics/segment.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/model/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/node.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/nodes_fetcher.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/nodes_thread_pool.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/progress.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/py.typed +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/batch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/dispatch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/metrics.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/params.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/queue.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/schema.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/udf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/query/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/remote/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/script_meta.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/semver.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/default/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/default/base.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/aggregate.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/array.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/conditional.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/numeric.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/path.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/random.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/functions/string.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/selectable.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/sqlite/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/sqlite/base.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/sqlite/types.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/sqlite/vector.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/types.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/sql/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/telemetry.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/toolkit/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/toolkit/split.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/torch/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain/utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/dependency_links.txt +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/entry_points.txt +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/src/datachain.egg-info/top_level.txt +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/conftest.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/datasets/.dvc/config +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/datasets/.gitignore +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/test_datachain.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/test_ls.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/benchmarks/test_version.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/data.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/examples/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/examples/test_wds_e2e.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/examples/wds_data.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/data/Big_Buck_Bunny_360_10s_1MB.mp4 +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/data/lena.jpg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/fake-service-account-credentials.json +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_aggregate.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_array.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_conditional.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_numeric.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_path.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_random.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/functions/test_string.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/data/running-mask0.png +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/data/running-mask1.png +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/data/running.jpg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/data/ships.jpg +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/model/test_yolo.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_catalog.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_client.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_cloud_transfer.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_data_storage.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_datachain.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_datachain_merge.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_delta.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_feature_pickling.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_file.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_hf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_hidden_field.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_image.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_listing.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_ls.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_meta_formats.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_metrics.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_pytorch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_query.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_read_database.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_retry.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_session.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_toolkit.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_video.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/func/test_warehouse.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/scripts/feature_class.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/scripts/feature_class_exception.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/scripts/feature_class_parallel.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/scripts/feature_class_parallel_data_model.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/scripts/name_len_slow.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_import_time.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_query_e2e.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/test_telemetry.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/conftest.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_arrow.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_clip.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_datachain_bootstrap.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_datachain_merge.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_diff.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_feature.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_feature_utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_file.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_hf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_image.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_python_to_sql.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_schema.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_signal_schema.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_sql_to_python.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_text.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_udf.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_udf_signature.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/lib/test_webdataset.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/model/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/model/test_bbox.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/model/test_pose.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/model/test_segment.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/model/test_utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/sqlite/__init__.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/sqlite/test_types.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/sqlite/test_utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_array.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_conditional.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_path.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_random.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_selectable.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/sql/test_string.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_asyn.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_cache.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_catalog.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_catalog_loader.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_cli_parsing.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_client.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_client_gcs.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_client_s3.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_config.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_data_storage.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_database_engine.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_dispatch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_fileslice.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_func.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_module_exports.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_pytorch.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_query.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_query_metrics.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_query_params.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_script_meta.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_semver.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_serializer.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_utils.py +0 -0
- {datachain-0.19.2 → datachain-0.20.1}/tests/unit/test_warehouse.py +0 -0
|
@@ -98,6 +98,7 @@ jobs:
|
|
|
98
98
|
- name: Run tests
|
|
99
99
|
# Generate `.test_durations` file with `pytest --store-durations --durations-path ../.github/.test_durations ...`
|
|
100
100
|
run: >
|
|
101
|
+
DATACHAIN_METASTORE_ARG_PROJECT=john
|
|
101
102
|
PYTHONPATH="$(pwd)/..:${PYTHONPATH}"
|
|
102
103
|
pytest
|
|
103
104
|
--config-file=pyproject.toml -rs
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: datachain
|
|
3
|
-
Version: 0.19.2
|
|
3
|
+
Version: 0.20.1
|
|
4
4
|
Summary: Wrangle unstructured AI data at scale
|
|
5
5
|
Author-email: Dmitry Petrov <support@dvc.org>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -94,7 +94,7 @@ Requires-Dist: scipy; extra == "tests"
|
|
|
94
94
|
Requires-Dist: ultralytics; extra == "tests"
|
|
95
95
|
Provides-Extra: dev
|
|
96
96
|
Requires-Dist: datachain[docs,tests]; extra == "dev"
|
|
97
|
-
Requires-Dist: mypy==1.16.0; extra == "dev"
|
|
97
|
+
Requires-Dist: mypy==1.16.1; extra == "dev"
|
|
98
98
|
Requires-Dist: types-python-dateutil; extra == "dev"
|
|
99
99
|
Requires-Dist: types-pytz; extra == "dev"
|
|
100
100
|
Requires-Dist: types-PyYAML; extra == "dev"
|
|
@@ -24,7 +24,7 @@ This command runs a job in Studio using the specified query file. You can config
|
|
|
24
24
|
* `--team TEAM` - Team to run job for (default: from config)
|
|
25
25
|
* `--env-file ENV_FILE` - File with environment variables for the job
|
|
26
26
|
* `--env ENV` - Environment variables in KEY=VALUE format
|
|
27
|
-
* `--cluster
|
|
27
|
+
* `--cluster CLUSTER` - Compute cluster to run the job on
|
|
28
28
|
* `--workers WORKERS` - Number of workers for the job
|
|
29
29
|
* `--files FILES` - Additional files to include in the job
|
|
30
30
|
* `--python-version PYTHON_VERSION` - Python version for the job (e.g., 3.9, 3.10, 3.11)
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Environment Variables
|
|
2
|
+
|
|
3
|
+
List of environment variables used to configure DataChain behavior.
|
|
4
|
+
|
|
5
|
+
### Core Configuration
|
|
6
|
+
|
|
7
|
+
- `DATACHAIN_ROOT_DIR` – Specifies the root directory where DataChain will create the `.datachain` folder to store its internal data. (default: the current working directory).
|
|
8
|
+
- `DATACHAIN_SYSTEM_CONFIG_DIR` – Overrides the system-wide configuration directory (default depends on the platform).
|
|
9
|
+
- `DATACHAIN_GLOBAL_CONFIG_DIR` – Overrides the user's global configuration directory (default depends on the platform).
|
|
10
|
+
- `DATACHAIN_NO_ANALYTICS` – Disables telemetry.
|
|
11
|
+
|
|
12
|
+
### Studio Integration
|
|
13
|
+
|
|
14
|
+
- `DATACHAIN_STUDIO_URL` – Custom Studio URL.
|
|
15
|
+
- `DATACHAIN_STUDIO_TOKEN` – Authentication token for Studio.
|
|
16
|
+
- `DATACHAIN_STUDIO_TEAM` – Studio team name.
|
|
17
|
+
|
|
18
|
+
Note: Some environment variables are used internally and may not be documented here. For the most up-to-date list, refer to the source code.
|
|
@@ -10,3 +10,4 @@ Welcome to the DataChain User Guide! This section provides comprehensive documen
|
|
|
10
10
|
- [Data Processing Overview](./processing.md) - Discover DataChain's specialized data processing features.
|
|
11
11
|
- [Delta Processing](./delta.md) - Incremental data processing to efficiently handle large datasets that change over time.
|
|
12
12
|
- [Error Handling and Retries](./retry.md) - Learn how to handle processing errors and selectively reprocess problematic records.
|
|
13
|
+
- [Environment Variables](./env.md) - Configure DataChain's behavior using environment variables.
|
|
@@ -105,6 +105,7 @@ nav:
|
|
|
105
105
|
- Overview: guide/processing.md
|
|
106
106
|
- Delta Processing: guide/delta.md
|
|
107
107
|
- Errors Handling and Retries: guide/retry.md
|
|
108
|
+
- Environment Variables: guide/env.md
|
|
108
109
|
- 🤝 Contributing: contributing.md
|
|
109
110
|
|
|
110
111
|
- DataChain Website ↗: https://datachain.ai" target="_blank"
|
|
@@ -1,3 +1,4 @@
|
|
|
1
|
+
from datachain.lib import namespaces, projects
|
|
1
2
|
from datachain.lib.data_model import DataModel, DataType, is_chain_type
|
|
2
3
|
from datachain.lib.dc import (
|
|
3
4
|
C,
|
|
@@ -67,7 +68,9 @@ __all__ = [
|
|
|
67
68
|
"is_chain_type",
|
|
68
69
|
"listings",
|
|
69
70
|
"metrics",
|
|
71
|
+
"namespaces",
|
|
70
72
|
"param",
|
|
73
|
+
"projects",
|
|
71
74
|
"read_csv",
|
|
72
75
|
"read_database",
|
|
73
76
|
"read_dataset",
|