jupyter-analysis-tools 1.5.1__py3-none-any.whl → 1.6.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,7 +1,7 @@
1
1
  # -*- coding: utf-8 -*-
2
2
  # __init__.py
3
3
 
4
- __version__ = "1.5.1"
4
+ __version__ = "1.6.1"
5
5
 
6
6
  from .binning import reBin
7
7
  from .git import checkRepo, isNBstripoutActivated, isNBstripoutInstalled, isRepo
@@ -0,0 +1,170 @@
1
+ # -*- coding: utf-8 -*-
2
+ # datastore.py
3
+
4
+ import filecmp
5
+ import getpass
6
+ import tempfile
7
+ import warnings
8
+ from pathlib import Path
9
+
10
+ from pybis import Openbis
11
+
12
+
13
+ class DataStore:
14
+ url = None
15
+ _availObj = None
16
+ _userspace = None
17
+
18
+ def __init__(self, url, username=None):
19
+ self.url = url
20
+ self.username = username
21
+ if self.username is None:
22
+ self.username = getpass.getuser()
23
+ print(f"Working as user '{self.username}'.")
24
+ # to generate PAT you need to login normally
25
+ self.ds = Openbis(url=self.url, verify_certificates=True)
26
+ # arg. *save_token* saves the openBIS token to ~/.pybis permanently
27
+ self.ds.login(
28
+ self.username,
29
+ getpass.getpass(prompt=f"Password for {self.username}: "),
30
+ save_token=False,
31
+ )
32
+ # create the PAT with the given name, don't store it
33
+ self.ds.get_or_create_personal_access_token("test-session")
34
+
35
+ @property
36
+ def userspace(self):
37
+ uspace = self._userspace
38
+ if uspace is None:
39
+ allspaces = self.ds.get_spaces()
40
+ uspace = allspaces.df[
41
+ allspaces.df.code.str.endswith(self.username.upper())
42
+ ].code.values[0]
43
+ self._userspace = uspace
44
+ return uspace
45
+
46
+ @userspace.setter
47
+ def userspace(self, name):
48
+ name = name.upper()
49
+ if name in self.ds.get_spaces().df.code.values:
50
+ self._userspace = name
51
+
52
+ @staticmethod
53
+ def identifier(objects, code):
54
+ return objects[objects.code == code].identifier.tolist()[0]
55
+
56
+ def createProject(self, projectName, space, spacePrefix=None):
57
+ """Finds the requested project in the DataStore.
58
+ Matching project names can be limited to a given *spacePrefix*.
59
+ If the project is not found, a new project with the given code in the given space
60
+ is created."""
61
+ # get available projects, accessible by the current user
62
+ projectsAvail = self.ds.get_projects()
63
+ if spacePrefix:
64
+ projectsAvail = [prj for prj in projectsAvail if f"/{spacePrefix}_" in prj.identifier]
65
+ projects = [prj for prj in projectsAvail if prj.code == projectName]
66
+ assert len(projects) <= 1, f"Multiple projects found for '{projectName}'"
67
+ dsProject = None
68
+ if len(projects): # get the existing object
69
+ dsProject = projects[0]
70
+ else: # create it, if not found
71
+ print(f"Creating project '{projectName}'")
72
+ dsProject = self.ds.new_project(code=projectName, space=space)
73
+ dsProject.save()
74
+ assert dsProject
75
+ return dsProject
76
+
77
+ def createCollection(self, collName, projectObj, defaultObjType=None):
78
+ collections = self.ds.get_collections(project=projectObj)
79
+ dsColl = [coll for coll in collections if coll.code == collName.upper()]
80
+ if len(dsColl):
81
+ dsColl = dsColl[0]
82
+ else: # create it, if not found
83
+ print(f"Creating collection '{collName}'")
84
+ dsColl = self.ds.new_collection(
85
+ code=collName, type="COLLECTION", project=projectObj, props={"$name": collName}
86
+ )
87
+ dsColl.save()
88
+ assert dsColl
89
+ # update properties (name, default view and object type) if not set)
90
+ props = dsColl.props.all() # props as dict
91
+ propKey = "$name"
92
+ if propKey in props and props[propKey] is None:
93
+ props[propKey] = collName
94
+ propKey = "$default_collection_view"
95
+ if propKey in props.keys() and props[propKey] is None:
96
+ propVal = [
97
+ item
98
+ for item in self.ds.get_vocabulary(propKey + "s").get_terms().df.code
99
+ if "list" in item.lower()
100
+ ]
101
+ assert len(propVal)
102
+ props[propKey] = propVal[0]
103
+ if defaultObjType:
104
+ propKey = "$default_object_type"
105
+ if propKey in props.keys() and props[propKey] is None:
106
+ props[propKey] = defaultObjType
107
+ # print(f"Setting '{collName}' properties:\n {props}")
108
+ dsColl.set_props(props)
109
+ dsColl.save()
110
+ return dsColl
111
+
112
+ def createObject(
113
+ self,
114
+ projectName: str,
115
+ collectionName: str = None,
116
+ space: str = None,
117
+ spacePrefix: str = None,
118
+ objType: str = None,
119
+ props: dict = None,
120
+ ):
121
+ dsProject = self.createProject(projectName, space, spacePrefix=spacePrefix)
122
+ dsColl = None
123
+ if collectionName is None: # collectionName is required
124
+ return None
125
+ dsColl = self.createCollection(collectionName, dsProject, defaultObjType=objType)
126
+ obj = self.ds.get_objects(type=objType, where={"$name": props["$name"]}).objects
127
+ if len(obj):
128
+ obj = obj[0]
129
+ prefix = objType
130
+ msg = "'{}' exists already in {}! Updating ...".format(
131
+ obj.props["$name"], obj.project.identifier
132
+ )
133
+ warnings.warn_explicit(msg, UserWarning, prefix, 0)
134
+ else: # does not exist yet
135
+ objName = f" '{props['$name']}'" if len(props.get("$name", "")) else ""
136
+ print(f"Creating new {objType}{objName} in {dsColl.identifier}")
137
+ obj = self.ds.new_object(type=objType, props=props, collection=dsColl)
138
+ obj.set_props(props)
139
+ return obj
140
+
141
+ def findObjects(self, *args, **kwargs):
142
+ return self.ds.get_objects(**kwargs)
143
+
144
+ def uploadDataset(self, obj, datasetType, fpaths=[]):
145
+ def _checkFile(localPath, remoteFiles):
146
+ remoteFile = [f for f in remoteFiles if f.name == localPath.name]
147
+ if not len(remoteFile): # file exists in the dataset as well
148
+ return False
149
+ return filecmp.cmp(localPath, remoteFile[0], shallow=False)
150
+
151
+ if not len(fpaths):
152
+ return # nothing to do
153
+ for dataset in obj.get_datasets(type=datasetType):
154
+ with tempfile.TemporaryDirectory() as tempdir:
155
+ dataset.download(destination=tempdir)
156
+ dsFiles = [f for f in Path(tempdir).rglob("*") if f.is_file()]
157
+ if len(fpaths) == len(dsFiles):
158
+ if all([_checkFile(fpath, dsFiles) for fpath in fpaths]):
159
+ print(
160
+ f"All local files of {datasetType} match files in dataset, "
161
+ "not updating."
162
+ )
163
+ continue # skip deletion below
164
+ print(f"Dataset {datasetType} needs update, deleting existing dataset:")
165
+ dataset.delete("Needs update")
166
+ if not len(obj.get_datasets(type=datasetType)): # didn't exist yet or all deleted
167
+ dataset = self.ds.new_dataset(
168
+ type=datasetType, collection=obj.collection, object=obj, files=fpaths
169
+ )
170
+ dataset.save()
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: jupyter-analysis-tools
3
- Version: 1.5.1
3
+ Version: 1.6.1
4
4
  Summary: Yet another Python library with helpers and utilities for data analysis and processing.
5
5
  Author-email: Ingo Breßler <ingo.bressler@bam.de>, "Brian R. Pauw" <brian.pauw@bam.de>
6
6
  License-Expression: MIT
@@ -35,10 +35,10 @@ Requires-Dist: matplotlib
35
35
  Requires-Dist: ipywidgets
36
36
  Dynamic: license-file
37
37
 
38
- # Jupyter Analysis Tools (v1.5.1)
38
+ # Jupyter Analysis Tools (v1.6.1)
39
39
 
40
40
  [![PyPI Package latest release](https://img.shields.io/pypi/v/jupyter-analysis-tools.svg)](https://pypi.org/project/jupyter-analysis-tools)
41
- [![Commits since latest release](https://img.shields.io/github/commits-since/BAMresearch/jupyter-analysis-tools/v1.5.1.svg)](https://github.com/BAMresearch/jupyter-analysis-tools/compare/v1.5.1...main)
41
+ [![Commits since latest release](https://img.shields.io/github/commits-since/BAMresearch/jupyter-analysis-tools/v1.6.1.svg)](https://github.com/BAMresearch/jupyter-analysis-tools/compare/v1.6.1...main)
42
42
  [![License](https://img.shields.io/pypi/l/jupyter-analysis-tools.svg)](https://en.wikipedia.org/wiki/MIT_license)
43
43
  [![Supported versions](https://img.shields.io/pypi/pyversions/jupyter-analysis-tools.svg)](https://pypi.org/project/jupyter-analysis-tools)
44
44
  [![PyPI Wheel](https://img.shields.io/pypi/wheel/jupyter-analysis-tools.svg)](https://pypi.org/project/jupyter-analysis-tools#files)
@@ -97,6 +97,28 @@ are installed:
97
97
 
98
98
  # CHANGELOG
99
99
 
100
+ ## v1.6.1 (2025-09-19)
101
+
102
+ ### Bug fixes
103
+
104
+ * **DataStore**: regression of handling of existing objects ([`28bd44c`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/28bd44cf019aea0203ad252fd434860f45a1e54a))
105
+
106
+ * **DataStore**: proper forwarding of spacePrefix for filtering relevant spaces ([`c4117f3`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/c4117f3b04b9f6237f6d8471bef2d76c379e6f11))
107
+
108
+ * **DataStore**: use the URL provided by constructor ([`fcc46fb`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/fcc46fb941006b489054dc492f433e62d77cb605))
109
+
110
+ ## v1.6.0 (2025-09-19)
111
+
112
+ ### Bug fixes
113
+
114
+ * **DataStore**: f-string syntax ([`9166382`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/916638264be58e75fdfba15d9c6a6584ace92199))
115
+
116
+ * **Tests**: pybis module required for collecting in new datastore module ([`ea6a21d`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/ea6a21df3656dcc5f926aa7ff67a7136806ded3b))
117
+
118
+ ### Features
119
+
120
+ * **DataStore**: new module for managing objects in OpenBIS ([`cdf0a27`](https://github.com/BAMresearch/jupyter-analysis-tools/commit/cdf0a27c0ae1412acd5329532ec8ec1fa7e6be94))
121
+
100
122
  ## v1.5.1 (2025-08-04)
101
123
 
102
124
  ### Bug fixes
@@ -1,7 +1,8 @@
1
- jupyter_analysis_tools/__init__.py,sha256=wJgXbkvBGUcYsY4GmME-p9uQjFMk9TvzAfbOjOl_1zc,398
1
+ jupyter_analysis_tools/__init__.py,sha256=A7AiYc6fGhMxcTkYmkh7R7xKIa3N_CWhHrkssN-4HEY,398
2
2
  jupyter_analysis_tools/analysis.py,sha256=AiAvUO648f0PYXqLfal1kDH926neasE5c1RYFu9wtYg,1768
3
3
  jupyter_analysis_tools/binning.py,sha256=d6eXRC3IOnnJIF25OfEASyWedT71EX2nF7jAgGJ9suQ,14536
4
4
  jupyter_analysis_tools/datalocations.py,sha256=BakfiZOMcBwp-_DAn7l57lGWZmZGNnk0j73V75nLBUA,4322
5
+ jupyter_analysis_tools/datastore.py,sha256=JZqEr-taNmNLbkDOoaRVP5m-D9t4h1nUTcpkil-7H64,6903
5
6
  jupyter_analysis_tools/distrib.py,sha256=uyh2jXDdXR6dfd36CAoE5_psoFF0bfA6l1wletPD7Xo,16515
6
7
  jupyter_analysis_tools/git.py,sha256=mqSk5nnAFrmk1_2KFuKVrDWOkRbGbAQOq2N1DfxhNpg,2216
7
8
  jupyter_analysis_tools/plotting.py,sha256=X5Orrwiof-9MuYMKDJEXIlIt0K6bQT6ktFFjXKIVApI,1962
@@ -10,10 +11,10 @@ jupyter_analysis_tools/ssfz2json.py,sha256=aEJo8No_PZ021RJGqDz9g2uZVh9y2G-wNvUB7
10
11
  jupyter_analysis_tools/ssfz_compare.py,sha256=__6qXALyX5pdUBYSEjzNoVHa470QX8Cg_LASpahtAGI,1557
11
12
  jupyter_analysis_tools/utils.py,sha256=c8q2-0v7wEjJ_3w5YTZdjFSf-RP1gPUpMJpv5KUyilU,8800
12
13
  jupyter_analysis_tools/widgets.py,sha256=rA8qPvY9nS1OtykZwXtCTG29K-N_MYFVb5Aj8yK40_s,2996
13
- jupyter_analysis_tools-1.5.1.dist-info/licenses/AUTHORS.rst,sha256=-twUESsY0XqFQ0MIC0ylKhglNwL8lyHmGXriM3RF-2s,93
14
- jupyter_analysis_tools-1.5.1.dist-info/licenses/LICENSE,sha256=jRVl3hmCq0Qv1wifm-EelEKhFWecdoWdhcxSte4a1_c,1125
15
- jupyter_analysis_tools-1.5.1.dist-info/METADATA,sha256=hagcHmj9cDY740-W1ENigKPUMzIHNIX-CZzr2kCjh2Y,45652
16
- jupyter_analysis_tools-1.5.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
17
- jupyter_analysis_tools-1.5.1.dist-info/entry_points.txt,sha256=-LU146dufa_JTwarciGzC6bjsl8pqY_8Z49ODYQ4lPY,124
18
- jupyter_analysis_tools-1.5.1.dist-info/top_level.txt,sha256=ei_0x-BF85FLoJ_h67ySwDFowtqus_gI4_0GR466PEU,23
19
- jupyter_analysis_tools-1.5.1.dist-info/RECORD,,
14
+ jupyter_analysis_tools-1.6.1.dist-info/licenses/AUTHORS.rst,sha256=-twUESsY0XqFQ0MIC0ylKhglNwL8lyHmGXriM3RF-2s,93
15
+ jupyter_analysis_tools-1.6.1.dist-info/licenses/LICENSE,sha256=jRVl3hmCq0Qv1wifm-EelEKhFWecdoWdhcxSte4a1_c,1125
16
+ jupyter_analysis_tools-1.6.1.dist-info/METADATA,sha256=wRW9Y1cn-hXYw8PhmvszNUpwZ2H-tt8oYB52q34WJH4,46812
17
+ jupyter_analysis_tools-1.6.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
18
+ jupyter_analysis_tools-1.6.1.dist-info/entry_points.txt,sha256=-LU146dufa_JTwarciGzC6bjsl8pqY_8Z49ODYQ4lPY,124
19
+ jupyter_analysis_tools-1.6.1.dist-info/top_level.txt,sha256=ei_0x-BF85FLoJ_h67ySwDFowtqus_gI4_0GR466PEU,23
20
+ jupyter_analysis_tools-1.6.1.dist-info/RECORD,,