OneStop4All-Indexer 2.8.0.dev20__tar.gz → 2.8.0rc2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2/OneStop4All_Indexer.egg-info}/PKG-INFO +1 -1
- {onestop4all_indexer-2.8.0.dev20/OneStop4All_Indexer.egg-info → onestop4all_indexer-2.8.0rc2}/PKG-INFO +1 -1
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataservice.py +5 -1
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_organization.py +9 -1
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/setup.py +1 -1
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/cli.py +4 -7
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/LICENSE +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/SOURCES.txt +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/dependency_links.txt +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/entry_points.txt +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/requires.txt +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/top_level.txt +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/__init__.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_base.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_n4eorganization.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_person.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_resource_links.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_theme.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/__init__.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_article.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_base.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataset.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_document.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_learningresource.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_metadatastandards.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_repository.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_service.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_software.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/pyproject.toml +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/setup.cfg +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/__init__.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/configs.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/harvest.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/solr.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/sparql.py +0 -0
- {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/util.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: OneStop4All-Indexer
|
|
3
|
-
Version: 2.8.0.dev20
|
|
3
|
+
Version: 2.8.0rc2
|
|
4
4
|
Summary: Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index
|
|
5
5
|
Author: Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer
|
|
6
6
|
Author-email: m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: OneStop4All-Indexer
|
|
3
|
-
Version: 2.8.0.dev20
|
|
3
|
+
Version: 2.8.0rc2
|
|
4
4
|
Summary: Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index
|
|
5
5
|
Author: Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer
|
|
6
6
|
Author-email: m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataservice.py
RENAMED
|
@@ -511,7 +511,11 @@ class DataService_HarvesterBatched(DataService_Harvester):
|
|
|
511
511
|
hits = sparql.execute_query(self.sparql_endpoint, query)
|
|
512
512
|
return hits
|
|
513
513
|
|
|
514
|
-
def harvest(self, records, batch_size=10):
|
|
514
|
+
def harvest(self, records=None, batch_size=10):
|
|
515
|
+
|
|
516
|
+
if records is None:
|
|
517
|
+
records = self.get_all_ids()
|
|
518
|
+
|
|
515
519
|
services = {}
|
|
516
520
|
# dsh_batched.parse_response(triples, services)
|
|
517
521
|
while True:
|
|
@@ -173,7 +173,6 @@ class Organization_Harvester(Harvester):
|
|
|
173
173
|
"http://www.w3.org/2004/02/skos/core#altLabel": "altLabel",
|
|
174
174
|
"http://www.w3.org/1999/02/22-rdf-syntax-ns#type": "type",
|
|
175
175
|
"http://nfdi4earth.de/ontology/sourceSystemURL": "sourceSystemURL",
|
|
176
|
-
"http://nfdi4earth.de/ontology/hasSignedCommitment": "hasSignedCommitment",
|
|
177
176
|
"http://nfdi4earth.de/ontology/sourceSystemID": "sourceSystem" + self.flatten_separator + "id"
|
|
178
177
|
}
|
|
179
178
|
|
|
@@ -250,6 +249,15 @@ class Organization_Harvester(Harvester):
|
|
|
250
249
|
dict=organizations[subject],
|
|
251
250
|
attribute=attribute,
|
|
252
251
|
value=object)
|
|
252
|
+
|
|
253
|
+
elif (predicate == "http://nfdi4earth.de/ontology/hasSignedCommitment"
|
|
254
|
+
and not self.does_object_exist(object, "hasSignedCommitment", organizations[subject])
|
|
255
|
+
and int(object[0])):
|
|
256
|
+
self.addValue(
|
|
257
|
+
dict=organizations[subject],
|
|
258
|
+
attribute="hasSignedCommitment",
|
|
259
|
+
value=object)
|
|
260
|
+
|
|
253
261
|
elif (
|
|
254
262
|
predicate == "http://www.w3.org/ns/org#subOrganizationOf"
|
|
255
263
|
and (subject, object) not in issuborganization
|
|
@@ -2,7 +2,7 @@ from setuptools import find_packages, setup
|
|
|
2
2
|
|
|
3
3
|
setup(
|
|
4
4
|
name="OneStop4All-Indexer",
|
|
5
|
-
version="2.8.0.dev20",
|
|
5
|
+
version="2.8.0.rc2",
|
|
6
6
|
description="Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index",
|
|
7
7
|
author="Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer",
|
|
8
8
|
author_email="m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de",
|
|
@@ -2,8 +2,11 @@ import logging
|
|
|
2
2
|
|
|
3
3
|
import click
|
|
4
4
|
|
|
5
|
+
from data_repositories import RepositoryPerson, RepositoryTheme
|
|
6
|
+
from harvesters.harvester_dataservice import DataService_HarvesterBatched
|
|
5
7
|
from utils import cli_startup, config, run as run_harvesting, Solr
|
|
6
8
|
|
|
9
|
+
|
|
7
10
|
log = logging.getLogger(__name__)
|
|
8
11
|
|
|
9
12
|
|
|
@@ -129,12 +132,6 @@ def dataservices(**options):
|
|
|
129
132
|
|
|
130
133
|
@debug.command()
|
|
131
134
|
def dataservices_batched():
|
|
132
|
-
from utils import config
|
|
133
|
-
from harvesters.harvester_dataservice import DataService_HarvesterBatched
|
|
134
|
-
from data_repositories import RepositoryPerson, RepositoryTheme
|
|
135
|
-
|
|
136
|
-
print("und los")
|
|
137
|
-
print(config)
|
|
138
135
|
persons_repo = RepositoryPerson()
|
|
139
136
|
themes_repo = RepositoryTheme()
|
|
140
137
|
dsh_batched = DataService_HarvesterBatched(
|
|
@@ -148,7 +145,7 @@ def dataservices_batched():
|
|
|
148
145
|
# print(f"Batch {i//batch_size}: IDs {i} to {i+batch_size}")
|
|
149
146
|
ids_batched = ids[i : i + batch_size]
|
|
150
147
|
print(f"Batch {i//batch_size}: IDs {ids_batched}")
|
|
151
|
-
triples = dsh_batched.
|
|
148
|
+
triples = dsh_batched.harvest(ids_batched)
|
|
152
149
|
print(f"Batch {i//batch_size}: Triples {len(triples)}")
|
|
153
150
|
|
|
154
151
|
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_article.py
RENAMED
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_base.py
RENAMED
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataset.py
RENAMED
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_document.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_repository.py
RENAMED
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_service.py
RENAMED
|
File without changes
|
{onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_software.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|