datachain 0.20.4__tar.gz → 0.21.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of datachain might be problematic. Click here for more details.
- {datachain-0.20.4 → datachain-0.21.1}/.github/workflows/tests-studio.yml +0 -1
- {datachain-0.20.4 → datachain-0.21.1}/.pre-commit-config.yaml +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/PKG-INFO +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/docs/guide/index.md +0 -1
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/json-csv-reader.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/examples/incremental_processing/delta.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/examples/llm_and_nlp/hf-dataset-llm-eval.py +5 -15
- {datachain-0.20.4 → datachain-0.21.1}/mkdocs.yml +0 -1
- {datachain-0.20.4 → datachain-0.21.1}/pyproject.toml +2 -3
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/__init__.py +0 -2
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cache.py +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/catalog/catalog.py +65 -180
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/__init__.py +11 -2
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/datasets.py +28 -43
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/ls.py +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/parser/__init__.py +35 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/fsspec.py +3 -5
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/hf.py +0 -10
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/local.py +4 -4
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/metastore.py +37 -405
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/sqlite.py +7 -136
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/warehouse.py +7 -26
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/dataset.py +12 -126
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/delta.py +7 -11
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/error.py +0 -36
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/func.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/arrow.py +3 -3
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dataset_info.py +0 -4
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/datachain.py +92 -260
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/datasets.py +50 -104
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/listings.py +3 -3
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/records.py +0 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/storage.py +40 -38
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/file.py +23 -77
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/listing.py +1 -3
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/meta_formats.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/pytorch.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/settings.py +0 -10
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/tar.py +2 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/udf_signature.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/webdataset.py +20 -30
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/listing.py +1 -3
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/dataset.py +46 -71
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/session.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/remote/studio.py +26 -61
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/studio.py +20 -27
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/PKG-INFO +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/SOURCES.txt +0 -7
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/requires.txt +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/tests/conftest.py +4 -76
- {datachain-0.20.4 → datachain-0.21.1}/tests/examples/test_examples.py +0 -2
- {datachain-0.20.4 → datachain-0.21.1}/tests/examples/test_wds_e2e.py +5 -5
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_aggregate.py +9 -7
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_array.py +21 -20
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_conditional.py +7 -6
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_numeric.py +5 -4
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_path.py +8 -6
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_random.py +6 -3
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/test_string.py +7 -6
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_batching.py +5 -5
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_datachain.py +36 -31
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_dataset_query.py +2 -20
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_datasets.py +81 -113
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_delta.py +29 -15
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_file.py +7 -33
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_listing.py +1 -1
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_metastore.py +10 -30
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_pull.py +18 -68
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_retry.py +8 -6
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_toolkit.py +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_atomicity.py +0 -3
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_cli_e2e.py +10 -43
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_cli_studio.py +92 -40
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_import_time.py +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_datachain.py +110 -213
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_datachain_bootstrap.py +3 -3
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_datachain_merge.py +11 -11
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_diff.py +45 -43
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_feature_utils.py +2 -2
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_file.py +8 -50
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_listing_info.py +2 -7
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_schema.py +4 -1
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_dataset.py +1 -43
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_func.py +125 -149
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_listing.py +4 -20
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_metastore.py +3 -35
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_session.py +9 -31
- {datachain-0.20.4 → datachain-0.21.1}/tests/utils.py +2 -2
- datachain-0.20.4/docs/guide/env.md +0 -18
- datachain-0.20.4/src/datachain/lib/namespaces.py +0 -71
- datachain-0.20.4/src/datachain/lib/projects.py +0 -86
- datachain-0.20.4/src/datachain/namespace.py +0 -65
- datachain-0.20.4/src/datachain/project.py +0 -78
- datachain-0.20.4/tests/unit/lib/test_namespace.py +0 -79
- datachain-0.20.4/tests/unit/lib/test_project.py +0 -157
- {datachain-0.20.4 → datachain-0.21.1}/.cruft.json +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.gitattributes +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/ISSUE_TEMPLATE/bug_report.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/ISSUE_TEMPLATE/empty_issue.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/ISSUE_TEMPLATE/feature_request.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/codecov.yaml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/dependabot.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/workflows/benchmarks.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/workflows/release.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/workflows/tests.yml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.github/workflows/update-template.yaml +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/.gitignore +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/CODE_OF_CONDUCT.rst +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/LICENSE +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/README.rst +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/assets/captioned_cartoons.png +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/assets/datachain-white.svg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/assets/datachain.svg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/auth/login.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/auth/logout.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/auth/team.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/auth/token.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/index.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/job/cancel.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/job/clusters.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/job/logs.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/job/ls.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/commands/job/run.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/contributing.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/css/github-permalink-style.css +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/examples.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/guide/delta.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/guide/processing.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/guide/remotes.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/guide/retry.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/index.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/overrides/main.html +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/quick-start.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/arrowrow.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/bbox.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/file.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/imagefile.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/index.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/pose.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/segment.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/tarvfile.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/textfile.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/data-types/videofile.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/datachain.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/func.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/index.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/toolkit.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/torch.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/references/udf.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/docs/tutorials.md +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/iptc_exif_xmp_lib.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/llava2_image_desc_lib.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/openimage-detect.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/ultralytics-bbox.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/ultralytics-pose.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/computer_vision/ultralytics-segment.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/common_sql_functions.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/torch-loader.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/udfs/parallel.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/udfs/simple.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/get_started/udfs/stateful.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/incremental_processing/retry.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/incremental_processing/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/llm_and_nlp/claude-query.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/multimodal/clip_inference.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/multimodal/hf_pipeline.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/multimodal/openai_image_desc_lib.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/multimodal/wds.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/examples/multimodal/wds_filtered.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/noxfile.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/setup.cfg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/__main__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/asyn.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/catalog/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/catalog/datasource.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/catalog/loader.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/du.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/index.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/misc.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/query.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/commands/show.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/parser/job.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/parser/studio.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/parser/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/cli/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/azure.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/fileslice.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/gcs.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/client/s3.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/config.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/db_engine.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/job.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/schema.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/data_storage/serializer.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/diff/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/fs/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/fs/reference.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/fs/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/aggregate.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/array.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/base.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/conditional.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/numeric.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/path.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/random.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/string.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/func/window.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/job.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/clip.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/flatten.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/python_to_sql.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/sql_to_python.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/unflatten.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/convert/values_to_tuples.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/data_model.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/csv.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/database.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/hf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/json.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/pandas.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/parquet.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/dc/values.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/hf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/image.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/listing_info.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/model_store.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/signal_schema.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/text.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/udf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/video.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/lib/webdataset_laion.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/bbox.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/pose.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/segment.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/ultralytics/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/ultralytics/bbox.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/ultralytics/pose.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/ultralytics/segment.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/model/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/node.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/nodes_fetcher.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/nodes_thread_pool.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/progress.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/py.typed +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/batch.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/dispatch.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/metrics.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/params.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/queue.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/schema.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/udf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/query/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/remote/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/script_meta.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/semver.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/default/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/default/base.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/aggregate.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/array.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/conditional.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/numeric.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/path.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/random.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/functions/string.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/selectable.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/sqlite/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/sqlite/base.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/sqlite/types.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/sqlite/vector.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/types.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/sql/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/telemetry.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/toolkit/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/toolkit/split.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/torch/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain/utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/dependency_links.txt +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/entry_points.txt +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/src/datachain.egg-info/top_level.txt +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/conftest.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/datasets/.dvc/.gitignore +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/datasets/.dvc/config +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/datasets/.gitignore +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/datasets/laion-tiny.npz.dvc +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/test_datachain.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/test_ls.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/benchmarks/test_version.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/data.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/examples/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/examples/wds_data.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/data/Big_Buck_Bunny_360_10s_1MB.mp4 +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/data/lena.jpg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/fake-service-account-credentials.json +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/functions/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/data/running-mask0.png +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/data/running-mask1.png +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/data/running.jpg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/data/ships.jpg +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/model/test_yolo.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_catalog.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_client.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_cloud_transfer.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_data_storage.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_datachain_merge.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_feature_pickling.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_hf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_hidden_field.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_image.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_ls.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_meta_formats.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_metrics.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_pytorch.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_query.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_read_database.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_session.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_video.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/func/test_warehouse.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/scripts/feature_class.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/scripts/feature_class_exception.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/scripts/feature_class_parallel.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/scripts/feature_class_parallel_data_model.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/scripts/name_len_slow.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_query_e2e.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/test_telemetry.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/conftest.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_arrow.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_clip.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_feature.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_hf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_image.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_python_to_sql.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_signal_schema.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_sql_to_python.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_text.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_udf.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_udf_signature.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/lib/test_webdataset.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/model/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/model/test_bbox.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/model/test_pose.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/model/test_segment.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/model/test_utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/sqlite/__init__.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/sqlite/test_types.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/sqlite/test_utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_array.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_conditional.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_path.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_random.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_selectable.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/sql/test_string.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_asyn.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_cache.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_catalog.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_catalog_loader.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_cli_parsing.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_client.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_client_gcs.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_client_s3.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_config.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_data_storage.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_database_engine.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_dispatch.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_fileslice.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_module_exports.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_pytorch.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_query.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_query_metrics.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_query_params.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_script_meta.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_semver.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_serializer.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_utils.py +0 -0
- {datachain-0.20.4 → datachain-0.21.1}/tests/unit/test_warehouse.py +0 -0
|
@@ -98,7 +98,6 @@ jobs:
|
|
|
98
98
|
- name: Run tests
|
|
99
99
|
# Generate `.test_durations` file with `pytest --store-durations --durations-path ../.github/.test_durations ...`
|
|
100
100
|
run: >
|
|
101
|
-
DATACHAIN_METASTORE_ARG_PROJECT=john
|
|
102
101
|
PYTHONPATH="$(pwd)/..:${PYTHONPATH}"
|
|
103
102
|
pytest
|
|
104
103
|
--config-file=pyproject.toml -rs
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: datachain
|
|
3
|
-
Version: 0.20.4
|
|
3
|
+
Version: 0.21.1
|
|
4
4
|
Summary: Wrangle unstructured AI data at scale
|
|
5
5
|
Author-email: Dmitry Petrov <support@dvc.org>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -94,7 +94,7 @@ Requires-Dist: scipy; extra == "tests"
|
|
|
94
94
|
Requires-Dist: ultralytics; extra == "tests"
|
|
95
95
|
Provides-Extra: dev
|
|
96
96
|
Requires-Dist: datachain[docs,tests]; extra == "dev"
|
|
97
|
-
Requires-Dist: mypy==1.16.
|
|
97
|
+
Requires-Dist: mypy==1.16.0; extra == "dev"
|
|
98
98
|
Requires-Dist: types-python-dateutil; extra == "dev"
|
|
99
99
|
Requires-Dist: types-pytz; extra == "dev"
|
|
100
100
|
Requires-Dist: types-PyYAML; extra == "dev"
|
|
@@ -10,4 +10,3 @@ Welcome to the DataChain User Guide! This section provides comprehensive documen
|
|
|
10
10
|
- [Data Processing Overview](./processing.md) - Discover DataChain's specialized data processing features.
|
|
11
11
|
- [Delta Processing](./delta.md) - Incremental data processing to efficiently handle large datasets that change over time.
|
|
12
12
|
- [Error Handling and Retries](./retry.md) - Learn how to handle processing errors and selectively reprocess problematic records.
|
|
13
|
-
- [Environment Variables](./env.md) - Configure DataChain's behavior using environment variables.
|
|
@@ -48,7 +48,7 @@ def main():
|
|
|
48
48
|
|
|
49
49
|
# Print JSON schema in Pydantic format from main COCO annotation
|
|
50
50
|
chain = dc.read_storage(uri, anon="True").filter(dc.C("file.path").glob("*.json"))
|
|
51
|
-
file = chain.limit(1).
|
|
51
|
+
file = next(chain.limit(1).collect("file"))
|
|
52
52
|
print(gen_datamodel_code(file, jmespath="@", model_name="Coco"))
|
|
53
53
|
|
|
54
54
|
# Static JSON schema test parsing 3/7 objects
|
|
@@ -47,7 +47,7 @@ def process_files_with_delta():
|
|
|
47
47
|
print("\nDataset versions:")
|
|
48
48
|
test_dataset = dc.datasets().filter(C("name") == "test_files")
|
|
49
49
|
|
|
50
|
-
for version in test_dataset.
|
|
50
|
+
for version in test_dataset.collect("version"):
|
|
51
51
|
print(f"- Version: {version}")
|
|
52
52
|
|
|
53
53
|
# Show the last 3 records to demonstrate the incremental processing
|
|
@@ -1,5 +1,3 @@
|
|
|
1
|
-
import os
|
|
2
|
-
|
|
3
1
|
from huggingface_hub import InferenceClient
|
|
4
2
|
from requests import HTTPError
|
|
5
3
|
|
|
@@ -25,7 +23,6 @@ def eval_dialog(
|
|
|
25
23
|
) -> DialogEval:
|
|
26
24
|
try:
|
|
27
25
|
completion = client.chat_completion(
|
|
28
|
-
model="meta-llama/Llama-3.3-70B-Instruct",
|
|
29
26
|
messages=[
|
|
30
27
|
{
|
|
31
28
|
"role": "user",
|
|
@@ -34,10 +31,9 @@ def eval_dialog(
|
|
|
34
31
|
],
|
|
35
32
|
response_format={"type": "json", "value": DialogEval.model_json_schema()},
|
|
36
33
|
)
|
|
37
|
-
except HTTPError as e:
|
|
34
|
+
except HTTPError:
|
|
38
35
|
return DialogEval(
|
|
39
|
-
result="Error",
|
|
40
|
-
reason=f"Error while interacting with the Hugging Face API. {e}",
|
|
36
|
+
result="Error", reason="Error while interacting with the Hugging Face API."
|
|
41
37
|
)
|
|
42
38
|
|
|
43
39
|
message = completion.choices[0].message
|
|
@@ -52,15 +48,9 @@ def eval_dialog(
|
|
|
52
48
|
# Save to HF as Parquet. Dataset can be previewed here:
|
|
53
49
|
# https://huggingface.co/datasets/dvcorg/test-datachain-llm-eval/viewer
|
|
54
50
|
(
|
|
55
|
-
dc.read_csv(
|
|
56
|
-
|
|
57
|
-
)
|
|
58
|
-
.settings(parallel=True)
|
|
59
|
-
.setup(
|
|
60
|
-
client=lambda: InferenceClient(
|
|
61
|
-
provider="hf-inference", api_key=os.environ["HF_TOKEN"]
|
|
62
|
-
)
|
|
63
|
-
)
|
|
51
|
+
dc.read_csv("hf://datasets/infinite-dataset-hub/MobilePlanAssistant/data.csv")
|
|
52
|
+
.settings(parallel=10)
|
|
53
|
+
.setup(client=lambda: InferenceClient("meta-llama/Llama-3.1-70B-Instruct"))
|
|
64
54
|
.map(response=eval_dialog)
|
|
65
55
|
.to_parquet("hf://datasets/dvcorg/test-datachain-llm-eval/data.parquet")
|
|
66
56
|
)
|
|
@@ -105,7 +105,6 @@ nav:
|
|
|
105
105
|
- Overview: guide/processing.md
|
|
106
106
|
- Delta Processing: guide/delta.md
|
|
107
107
|
- Errors Handling and Retries: guide/retry.md
|
|
108
|
-
- Environment Variables: guide/env.md
|
|
109
108
|
- 🤝 Contributing: contributing.md
|
|
110
109
|
|
|
111
110
|
- DataChain Website ↗: https://datachain.ai" target="_blank"
|
|
@@ -108,7 +108,7 @@ tests = [
|
|
|
108
108
|
]
|
|
109
109
|
dev = [
|
|
110
110
|
"datachain[docs,tests]",
|
|
111
|
-
"mypy==1.16.
|
|
111
|
+
"mypy==1.16.0",
|
|
112
112
|
"types-python-dateutil",
|
|
113
113
|
"types-pytz",
|
|
114
114
|
"types-PyYAML",
|
|
@@ -221,8 +221,7 @@ ignore = [
|
|
|
221
221
|
"PERF203", # perflint - try-except-in-loop, irrelevant for Python>=3.11
|
|
222
222
|
"PERF401",
|
|
223
223
|
"D100", # undocumented-public-module
|
|
224
|
-
"D205"
|
|
225
|
-
"PLC0415" # import-outside-top-level
|
|
224
|
+
"D205" # one-blank-line-after-class
|
|
226
225
|
]
|
|
227
226
|
select = [
|
|
228
227
|
"B", # flake8-bugbear
|
|
@@ -32,7 +32,6 @@ from datachain.lib.file import (
|
|
|
32
32
|
VideoFrame,
|
|
33
33
|
)
|
|
34
34
|
from datachain.lib.model_store import ModelStore
|
|
35
|
-
from datachain.lib.projects import create as create_project
|
|
36
35
|
from datachain.lib.udf import Aggregator, Generator, Mapper
|
|
37
36
|
from datachain.lib.utils import AbstractUDF, DataChainError
|
|
38
37
|
from datachain.query import metrics, param
|
|
@@ -63,7 +62,6 @@ __all__ = [
|
|
|
63
62
|
"VideoFile",
|
|
64
63
|
"VideoFragment",
|
|
65
64
|
"VideoFrame",
|
|
66
|
-
"create_project",
|
|
67
65
|
"datasets",
|
|
68
66
|
"delete_dataset",
|
|
69
67
|
"is_chain_type",
|
|
@@ -39,7 +39,7 @@ def temporary_cache(
|
|
|
39
39
|
cache.destroy()
|
|
40
40
|
|
|
41
41
|
|
|
42
|
-
class Cache: # noqa: PLW1641
|
|
42
|
+
class Cache:
|
|
43
43
|
def __init__(self, cache_dir: str, tmp_dir: str):
|
|
44
44
|
self.odb = LocalHashFileDB(
|
|
45
45
|
LocalFileSystem(),
|
|
@@ -76,9 +76,9 @@ class Cache: # noqa: PLW1641
|
|
|
76
76
|
async def download(
|
|
77
77
|
self, file: "File", client: "Client", callback: Optional[Callback] = None
|
|
78
78
|
) -> None:
|
|
79
|
+
from_path = f"{file.source}/{file.path}"
|
|
79
80
|
from dvc_objects.fs.utils import tmp_fname
|
|
80
81
|
|
|
81
|
-
from_path = file.get_uri()
|
|
82
82
|
odb_fs = self.odb.fs
|
|
83
83
|
tmp_info = odb_fs.join(self.odb.tmp_dir, tmp_fname()) # type: ignore[arg-type]
|
|
84
84
|
size = file.size
|