deriva-ml 1.9.0__tar.gz → 1.9.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {deriva_ml-1.9.0/src/deriva_ml.egg-info → deriva_ml-1.9.1}/PKG-INFO +11 -2
- deriva_ml-1.9.1/README.md +11 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/release.sh +2 -1
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/database_model.py +2 -3
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/dataset.py +4 -6
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/deriva_ml_base.py +2 -2
- {deriva_ml-1.9.0 → deriva_ml-1.9.1/src/deriva_ml.egg-info}/PKG-INFO +11 -2
- deriva_ml-1.9.0/README.md +0 -2
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/.github/workflows/publish-docs.yml +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/.gitignore +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/LICENSE +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/.DS_Store +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/Notebooks/DerivaML Create Notes.ipynb +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/Notebooks/DerivaML Dataset.ipynb +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/Notebooks/DerivaML Execution.ipynb +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/Notebooks/DerivaML Features.ipynb +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/Notebooks/DerivaML Vocabulary.ipynb +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/ERD.png +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/Launcher.png +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/copy_minid.png +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/deriva-logo.png +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/deriva-ml.pdf +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/assets/sharing-at-home.pdf +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/dataset.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/dataset_aux_classes.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/dataset_bag.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/deriva_ml_base.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/deriva_model.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/execution.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/execution_configuration.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/feature.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/code-docs/upload.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/deriva_ml_structure.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/index.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/release-notes.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/user-guide/datasets.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/user-guide/execution-configuration.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/user-guide/identifiers.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/user-guide/install.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/docs/user-guide/ml_workflow_instruction.md +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/mkdocs.yml +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/pyproject.toml +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/setup.cfg +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/__init__.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/dataset_aux_classes.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/dataset_bag.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/demo_catalog.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/deriva_definitions.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/deriva_model.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/execution.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/execution_configuration.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/execution_environment.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/feature.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/history.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/schema_setup/__init__.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/schema_setup/annotations.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/schema_setup/create_schema.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/schema_setup/policy.json +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/schema_setup/table_comments_utils.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/test_functions.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml/upload.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml.egg-info/SOURCES.txt +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml.egg-info/dependency_links.txt +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml.egg-info/entry_points.txt +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml.egg-info/requires.txt +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/src/deriva_ml.egg-info/top_level.txt +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/__init__.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/derivaml_test.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/runner.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_basic_tables.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_dataset.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_download.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_execution.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_features.py +0 -0
- {deriva_ml-1.9.0 → deriva_ml-1.9.1}/tests/test_upload.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: deriva-ml
|
|
3
|
-
Version: 1.9.0
|
|
3
|
+
Version: 1.9.1
|
|
4
4
|
Summary: Utilities to simplify use of Deriva and Pandas to create reproducible ML pipelines
|
|
5
5
|
Author-email: ISRD <isrd-dev@isi.edu>
|
|
6
6
|
Requires-Python: >=3.10
|
|
@@ -16,5 +16,14 @@ Requires-Dist: setuptools-scm<=6.0
|
|
|
16
16
|
Requires-Dist: nbstripout
|
|
17
17
|
Dynamic: license-file
|
|
18
18
|
|
|
19
|
-
|
|
19
|
+
# DerivaML
|
|
20
|
+
Deriva-ML is a python library to simplify the process of creating and executing reproducible machine learning workflows
|
|
20
21
|
using a deriva catalog.
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
## Installing the GitHub CLI
|
|
25
|
+
|
|
26
|
+
The script release.sh will create a new release tag in GitHub. This script requires the
|
|
27
|
+
GitHub CLI to be installed.
|
|
28
|
+
|
|
29
|
+
See [https://cli.github.com](https://cli.github.com) for instructions on how to install and configure the CLI.
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
# DerivaML
|
|
2
|
+
Deriva-ML is a python library to simplify the process of creating and executing reproducible machine learning workflows
|
|
3
|
+
using a deriva catalog.
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
## Installing the GitHub CLI
|
|
7
|
+
|
|
8
|
+
The script release.sh will create a new release tag in GitHub. This script requires the
|
|
9
|
+
GitHub CLI to be installed.
|
|
10
|
+
|
|
11
|
+
See [https://cli.github.com](https://cli.github.com) for instructions on how to install and configure the CLI.
|
|
@@ -9,6 +9,7 @@ fi
|
|
|
9
9
|
|
|
10
10
|
# Default version bump is patch unless specified (patch, minor, or major)
|
|
11
11
|
VERSION_TYPE=${1:-patch}
|
|
12
|
+
|
|
12
13
|
echo "Bumping version: $VERSION_TYPE"
|
|
13
14
|
|
|
14
15
|
# Bump the version using bump-my-version.
|
|
@@ -32,6 +33,6 @@ python -m build
|
|
|
32
33
|
NEW_TAG=$(git describe --tags --abbrev=0)
|
|
33
34
|
echo "New version tag: $NEW_TAG"
|
|
34
35
|
|
|
35
|
-
twine upload
|
|
36
|
+
twine upload dist/*${NEW_TAG/v/}
|
|
36
37
|
|
|
37
38
|
echo "Release process complete!"
|
|
@@ -84,7 +84,7 @@ class DatabaseModel(DerivaModel, metaclass=DatabaseModelMeta):
|
|
|
84
84
|
except KeyError:
|
|
85
85
|
raise DerivaMLException(f"Dataset {dataset_rid} not found")
|
|
86
86
|
|
|
87
|
-
def __init__(self, minid: DatasetMinid, bag_path: Path):
|
|
87
|
+
def __init__(self, minid: DatasetMinid, bag_path: Path, dbase_path: Path):
|
|
88
88
|
"""Create a new DatabaseModel.
|
|
89
89
|
|
|
90
90
|
Args:
|
|
@@ -95,8 +95,7 @@ class DatabaseModel(DerivaModel, metaclass=DatabaseModelMeta):
|
|
|
95
95
|
self.bag_path = bag_path
|
|
96
96
|
self.minid = minid
|
|
97
97
|
self.dataset_rid = minid.dataset_rid
|
|
98
|
-
|
|
99
|
-
self.dbase_file = dir_path / f"{minid.version_rid}.db"
|
|
98
|
+
self.dbase_file = dbase_path / f"{minid.version_rid}.db"
|
|
100
99
|
self.dbase = sqlite3.connect(self.dbase_file)
|
|
101
100
|
|
|
102
101
|
super().__init__(
|
|
@@ -67,11 +67,12 @@ class Dataset:
|
|
|
67
67
|
|
|
68
68
|
_Logger = logging.getLogger("deriva_ml")
|
|
69
69
|
|
|
70
|
-
def __init__(self, model: DerivaModel, cache_dir: Path):
|
|
70
|
+
def __init__(self, model: DerivaModel, cache_dir: Path, working_dir: Path):
|
|
71
71
|
self._model = model
|
|
72
72
|
self._ml_schema = ML_SCHEMA
|
|
73
73
|
self.dataset_table = self._model.schemas[self._ml_schema].tables["Dataset"]
|
|
74
74
|
self._cache_dir = cache_dir
|
|
75
|
+
self._working_dir = working_dir
|
|
75
76
|
self._logger = logging.getLogger("deriva_ml")
|
|
76
77
|
|
|
77
78
|
def _is_dataset_rid(self, dataset_rid: RID, deleted: bool = False) -> bool:
|
|
@@ -783,7 +784,6 @@ class Dataset:
|
|
|
783
784
|
snapshot: Optional[Dataset] = None,
|
|
784
785
|
dataset_nesting_depth: Optional[int] = None,
|
|
785
786
|
) -> set[tuple[Table, ...]]:
|
|
786
|
-
|
|
787
787
|
snapshot_catalog = snapshot if snapshot else self
|
|
788
788
|
|
|
789
789
|
dataset_table = snapshot_catalog._model.schemas[self._ml_schema].tables[
|
|
@@ -831,9 +831,7 @@ class Dataset:
|
|
|
831
831
|
nested_paths = set()
|
|
832
832
|
if dataset_rid:
|
|
833
833
|
for c in snapshot_catalog.list_dataset_children(dataset_rid=dataset_rid):
|
|
834
|
-
nested_paths |= self._collect_paths(
|
|
835
|
-
c, snapshot=snapshot_catalog
|
|
836
|
-
)
|
|
834
|
+
nested_paths |= self._collect_paths(c, snapshot=snapshot_catalog)
|
|
837
835
|
else:
|
|
838
836
|
# Initialize nesting depth if not already provided.
|
|
839
837
|
dataset_nesting_depth = (
|
|
@@ -979,7 +977,7 @@ class Dataset:
|
|
|
979
977
|
if dataset.materialize
|
|
980
978
|
else self._download_dataset_minid(minid)
|
|
981
979
|
)
|
|
982
|
-
return DatabaseModel(minid, bag_path).get_dataset()
|
|
980
|
+
return DatabaseModel(minid, bag_path, self._working_dir).get_dataset()
|
|
983
981
|
|
|
984
982
|
def _version_snapshot(self, dataset: DatasetSpec) -> str:
|
|
985
983
|
"""Return a catalog with snapshot for the specified dataset version"""
|
|
@@ -163,7 +163,7 @@ class DerivaML(Dataset):
|
|
|
163
163
|
self.cache_dir.mkdir(parents=True, exist_ok=True)
|
|
164
164
|
|
|
165
165
|
# Initialize dataset class.
|
|
166
|
-
super().__init__(self.model, self.cache_dir)
|
|
166
|
+
super().__init__(self.model, self.cache_dir, self.working_dir)
|
|
167
167
|
self._logger = logging.getLogger("deriva_ml")
|
|
168
168
|
self._logger.setLevel(logging_level)
|
|
169
169
|
|
|
@@ -257,7 +257,7 @@ class DerivaML(Dataset):
|
|
|
257
257
|
def _get_notebook_path(self) -> Path | None:
|
|
258
258
|
"""Return the absolute path of the current notebook."""
|
|
259
259
|
|
|
260
|
-
server, session =
|
|
260
|
+
server, session = DerivaML._get_notebook_session()
|
|
261
261
|
if server and session:
|
|
262
262
|
self._check_nbstrip_status()
|
|
263
263
|
relative_path = session["notebook"]["path"]
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: deriva-ml
|
|
3
|
-
Version: 1.9.0
|
|
3
|
+
Version: 1.9.1
|
|
4
4
|
Summary: Utilities to simplify use of Deriva and Pandas to create reproducible ML pipelines
|
|
5
5
|
Author-email: ISRD <isrd-dev@isi.edu>
|
|
6
6
|
Requires-Python: >=3.10
|
|
@@ -16,5 +16,14 @@ Requires-Dist: setuptools-scm<=6.0
|
|
|
16
16
|
Requires-Dist: nbstripout
|
|
17
17
|
Dynamic: license-file
|
|
18
18
|
|
|
19
|
-
|
|
19
|
+
# DerivaML
|
|
20
|
+
Deriva-ML is a python library to simplify the process of creating and executing reproducible machine learning workflows
|
|
20
21
|
using a deriva catalog.
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
## Installing the GitHub CLI
|
|
25
|
+
|
|
26
|
+
The script release.sh will create a new release tag in GitHub. This script requires the
|
|
27
|
+
GitHub CLI to be installed.
|
|
28
|
+
|
|
29
|
+
See [https://cli.github.com](https://cli.github.com) for instructions on how to install and configure the CLI.
|
deriva_ml-1.9.0/README.md
DELETED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|