metadata-crawler 2510.0.0__py3-none-any.whl → 2510.0.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of metadata-crawler might be problematic. Click here for more details.
- metadata_crawler/_version.py +1 -1
- metadata_crawler/api/config.py +10 -3
- {metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/METADATA +1 -1
- {metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/RECORD +7 -7
- {metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/WHEEL +0 -0
- {metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/entry_points.txt +0 -0
- {metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/licenses/LICENSE +0 -0
metadata_crawler/_version.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "2510.0.0"
|
|
1
|
+
__version__ = "2510.0.2"
|
metadata_crawler/api/config.py
CHANGED
|
@@ -264,8 +264,15 @@ class PathSpecs(BaseModel):
|
|
|
264
264
|
self, data: Dict[str, Any], rel_path: Path
|
|
265
265
|
) -> None:
|
|
266
266
|
dir_parts = rel_path.parent.parts
|
|
267
|
+
|
|
267
268
|
if self.dir_parts and len(dir_parts) == len(self.dir_parts):
|
|
268
|
-
|
|
269
|
+
data.update(
|
|
270
|
+
{
|
|
271
|
+
k: v
|
|
272
|
+
for (k, v) in zip(self.dir_parts, dir_parts)
|
|
273
|
+
if k not in data
|
|
274
|
+
}
|
|
275
|
+
)
|
|
269
276
|
elif self.dir_parts:
|
|
270
277
|
raise MetadataCrawlerException(
|
|
271
278
|
(
|
|
@@ -273,7 +280,6 @@ class PathSpecs(BaseModel):
|
|
|
273
280
|
f"- needs: {len(self.dir_parts)} has: {len(dir_parts)}"
|
|
274
281
|
)
|
|
275
282
|
) from None
|
|
276
|
-
data.update({k: v for (k, v) in _parts.items() if k not in data})
|
|
277
283
|
|
|
278
284
|
def _get_metadata_from_filename(
|
|
279
285
|
self, data: Dict[str, Any], rel_path: Path
|
|
@@ -281,6 +287,7 @@ class PathSpecs(BaseModel):
|
|
|
281
287
|
if self.file_parts is None:
|
|
282
288
|
return
|
|
283
289
|
file_parts = rel_path.name.split(self.file_sep)
|
|
290
|
+
_parts: Dict[str, str] = {}
|
|
284
291
|
if len(file_parts) == len(self.file_parts):
|
|
285
292
|
_parts = dict(zip(self.file_parts, file_parts))
|
|
286
293
|
elif (
|
|
@@ -413,7 +420,7 @@ class DataSpecs(BaseModel):
|
|
|
413
420
|
class Datasets(BaseModel):
|
|
414
421
|
"""Definition of datasets that should be crawled."""
|
|
415
422
|
|
|
416
|
-
__pydantic_extra__: Dict[str,
|
|
423
|
+
__pydantic_extra__: Dict[str, Any] = Field(init=False)
|
|
417
424
|
model_config = ConfigDict(extra="allow")
|
|
418
425
|
root_path: str | Path
|
|
419
426
|
drs_format: str = "freva"
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
metadata_crawler/__init__.py,sha256=dT4ZOngmtO-7fiWqdo80JmeRacG09fy1T8C0bZpFR6Q,7167
|
|
2
2
|
metadata_crawler/__main__.py,sha256=4m56VOh7bb5xmZqb09fFbquke8g6KZfMbb3CUdBA60M,163
|
|
3
|
-
metadata_crawler/_version.py,sha256=
|
|
3
|
+
metadata_crawler/_version.py,sha256=cCJnX2HNJPOzLxMTBvT8O-8ZwJBo4VIGD003JPBKf2U,25
|
|
4
4
|
metadata_crawler/cli.py,sha256=qi77QXtuwO1N3MvLbacdaOZwzpT22FJMpnnp1k6yj-Y,17347
|
|
5
5
|
metadata_crawler/data_collector.py,sha256=7N0zQcxjsqITUVr0JnkFu_beMzrTW-paaw69ESC9rkQ,9063
|
|
6
6
|
metadata_crawler/logger.py,sha256=wNImwUVw0ycvIYrxzthWAgOCujJZhVDCSiCH5KKX5EA,4743
|
|
@@ -9,7 +9,7 @@ metadata_crawler/run.py,sha256=_6mx29Co1HwfPNFWtzTR65CNlopqubj-McmavRM7i80,12869
|
|
|
9
9
|
metadata_crawler/utils.py,sha256=Nm1DkyBD8PyBOP-EUf-Vqs-mLQUPu-6gWPgvNkGDmq8,14124
|
|
10
10
|
metadata_crawler/api/__init__.py,sha256=UUF0_FKgfqgcXYmknxB0Wt1jaLNaf-w_q0tWVJhgV0M,28
|
|
11
11
|
metadata_crawler/api/cli.py,sha256=pgj3iB_Irt74VbG3ZKStLRHKYY_I4bZpbOW1famKDnQ,1498
|
|
12
|
-
metadata_crawler/api/config.py,sha256=
|
|
12
|
+
metadata_crawler/api/config.py,sha256=BCVRqkdQJoNlfZ2--y2xDSeOLsARsB-YZLAvHJrRmvk,28921
|
|
13
13
|
metadata_crawler/api/drs_config.toml,sha256=c3Gc8MGH22xlDOLH_y2TXiiEydmhjzvish-fQi5aGRA,10622
|
|
14
14
|
metadata_crawler/api/index.py,sha256=0yqtXYOyWJJKKkCkIJbUUVG1w2Wt_icYJjXJPZZjSvU,4715
|
|
15
15
|
metadata_crawler/api/metadata_stores.py,sha256=UekPl16KlaF7xiD4X7KVo3EMWz9KE-MT7gKxvgZyvXU,24016
|
|
@@ -27,8 +27,8 @@ metadata_crawler/backends/swift.py,sha256=az3ctF_npadjzAybX65CQbDLGoxRnk0ZR7vByo
|
|
|
27
27
|
metadata_crawler/ingester/__init__.py,sha256=Y-c9VkQWMHDLb9WagwITCaEODlYa4p8xW-BkzzSRZXw,55
|
|
28
28
|
metadata_crawler/ingester/mongo.py,sha256=Ntt3zKVtAX6wDB5aQYCoYrkVWrnvJU2oJJyfYGW30lU,6546
|
|
29
29
|
metadata_crawler/ingester/solr.py,sha256=kpUAnI5iSsvNGagM_gqbTJZr8HNpYSFZFvNOcbHXB9o,9528
|
|
30
|
-
metadata_crawler-2510.0.0.dist-info/entry_points.txt,sha256=4LzS7pbqwUPTD6C-iW42vuhXdtsOJmKXqFZpdpaKwF8,428
|
|
31
|
-
metadata_crawler-2510.0.0.dist-info/licenses/LICENSE,sha256=GAUualebvSlegSVqb86FUqHrHM8WyM145__Nm2r_dfA,1496
|
|
32
|
-
metadata_crawler-2510.0.0.dist-info/WHEEL,sha256=G2gURzTEtmeR8nrdXUJfNiB3VYVxigPQ-bEQujpNiNs,82
|
|
33
|
-
metadata_crawler-2510.0.
|
|
34
|
-
metadata_crawler-2510.0.0.dist-info/RECORD,,
|
|
30
|
+
metadata_crawler-2510.0.2.dist-info/entry_points.txt,sha256=4LzS7pbqwUPTD6C-iW42vuhXdtsOJmKXqFZpdpaKwF8,428
|
|
31
|
+
metadata_crawler-2510.0.2.dist-info/licenses/LICENSE,sha256=GAUualebvSlegSVqb86FUqHrHM8WyM145__Nm2r_dfA,1496
|
|
32
|
+
metadata_crawler-2510.0.2.dist-info/WHEEL,sha256=G2gURzTEtmeR8nrdXUJfNiB3VYVxigPQ-bEQujpNiNs,82
|
|
33
|
+
metadata_crawler-2510.0.2.dist-info/METADATA,sha256=oCLBZE2ujhvQjDHNW2Eb1UP5UL6iXvA4edVo0NoodlE,13006
|
|
34
|
+
metadata_crawler-2510.0.2.dist-info/RECORD,,
|
|
File without changes
|
{metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{metadata_crawler-2510.0.0.dist-info → metadata_crawler-2510.0.2.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|