OneStop4All-Indexer 2.8.0.dev20__tar.gz → 2.8.0rc2__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (36)
  1. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2/OneStop4All_Indexer.egg-info}/PKG-INFO +1 -1
  2. {onestop4all_indexer-2.8.0.dev20/OneStop4All_Indexer.egg-info → onestop4all_indexer-2.8.0rc2}/PKG-INFO +1 -1
  3. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataservice.py +5 -1
  4. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_organization.py +9 -1
  5. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/setup.py +1 -1
  6. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/cli.py +4 -7
  7. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/LICENSE +0 -0
  8. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/SOURCES.txt +0 -0
  9. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/dependency_links.txt +0 -0
  10. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/entry_points.txt +0 -0
  11. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/requires.txt +0 -0
  12. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/OneStop4All_Indexer.egg-info/top_level.txt +0 -0
  13. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/__init__.py +0 -0
  14. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_base.py +0 -0
  15. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_n4eorganization.py +0 -0
  16. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_person.py +0 -0
  17. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_resource_links.py +0 -0
  18. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/data_repositories/repository_theme.py +0 -0
  19. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/__init__.py +0 -0
  20. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_article.py +0 -0
  21. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_base.py +0 -0
  22. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_dataset.py +0 -0
  23. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_document.py +0 -0
  24. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_learningresource.py +0 -0
  25. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_metadatastandards.py +0 -0
  26. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_repository.py +0 -0
  27. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_service.py +0 -0
  28. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/harvesters/harvester_software.py +0 -0
  29. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/pyproject.toml +0 -0
  30. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/setup.cfg +0 -0
  31. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/__init__.py +0 -0
  32. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/configs.py +0 -0
  33. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/harvest.py +0 -0
  34. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/solr.py +0 -0
  35. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/sparql.py +0 -0
  36. {onestop4all_indexer-2.8.0.dev20 → onestop4all_indexer-2.8.0rc2}/utils/util.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: OneStop4All-Indexer
3
- Version: 2.8.0.dev20
3
+ Version: 2.8.0rc2
4
4
  Summary: Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index
5
5
  Author: Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer
6
6
  Author-email: m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: OneStop4All-Indexer
3
- Version: 2.8.0.dev20
3
+ Version: 2.8.0rc2
4
4
  Summary: Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index
5
5
  Author: Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer
6
6
  Author-email: m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de
@@ -511,7 +511,11 @@ class DataService_HarvesterBatched(DataService_Harvester):
511
511
  hits = sparql.execute_query(self.sparql_endpoint, query)
512
512
  return hits
513
513
 
514
- def harvest(self, records, batch_size=10):
514
+ def harvest(self, records=None, batch_size=10):
515
+
516
+ if records is None:
517
+ records = self.get_all_ids()
518
+
515
519
  services = {}
516
520
  # dsh_batched.parse_response(triples, services)
517
521
  while True:
@@ -173,7 +173,6 @@ class Organization_Harvester(Harvester):
173
173
  "http://www.w3.org/2004/02/skos/core#altLabel": "altLabel",
174
174
  "http://www.w3.org/1999/02/22-rdf-syntax-ns#type": "type",
175
175
  "http://nfdi4earth.de/ontology/sourceSystemURL": "sourceSystemURL",
176
- "http://nfdi4earth.de/ontology/hasSignedCommitment": "hasSignedCommitment",
177
176
  "http://nfdi4earth.de/ontology/sourceSystemID": "sourceSystem" + self.flatten_separator + "id"
178
177
  }
179
178
 
@@ -250,6 +249,15 @@ class Organization_Harvester(Harvester):
250
249
  dict=organizations[subject],
251
250
  attribute=attribute,
252
251
  value=object)
252
+
253
+ elif (predicate == "http://nfdi4earth.de/ontology/hasSignedCommitment"
254
+ and not self.does_object_exist(object, "hasSignedCommitment", organizations[subject])
255
+ and int(object[0])):
256
+ self.addValue(
257
+ dict=organizations[subject],
258
+ attribute="hasSignedCommitment",
259
+ value=object)
260
+
253
261
  elif (
254
262
  predicate == "http://www.w3.org/ns/org#subOrganizationOf"
255
263
  and (subject, object) not in issuborganization
@@ -2,7 +2,7 @@ from setuptools import find_packages, setup
2
2
 
3
3
  setup(
4
4
  name="OneStop4All-Indexer",
5
- version="2.8.0.dev20",
5
+ version="2.8.0.rc2",
6
6
  description="Library to harvest data from NFDI4Earth-KnowledgeHub to OneStop4All-Index",
7
7
  author="Markus Konkol, Arne Vogt, Tom Niers, Ralf Klammer",
8
8
  author_email="m.konkol@52north.org, a.vogt@52north.org, tom.niers@tu-dresden.de, ralf.klammer@tu-dresden.de",
@@ -2,8 +2,11 @@ import logging
2
2
 
3
3
  import click
4
4
 
5
+ from data_repositories import RepositoryPerson, RepositoryTheme
6
+ from harvesters.harvester_dataservice import DataService_HarvesterBatched
5
7
  from utils import cli_startup, config, run as run_harvesting, Solr
6
8
 
9
+
7
10
  log = logging.getLogger(__name__)
8
11
 
9
12
 
@@ -129,12 +132,6 @@ def dataservices(**options):
129
132
 
130
133
  @debug.command()
131
134
  def dataservices_batched():
132
- from utils import config
133
- from harvesters.harvester_dataservice import DataService_HarvesterBatched
134
- from data_repositories import RepositoryPerson, RepositoryTheme
135
-
136
- print("und los")
137
- print(config)
138
135
  persons_repo = RepositoryPerson()
139
136
  themes_repo = RepositoryTheme()
140
137
  dsh_batched = DataService_HarvesterBatched(
@@ -148,7 +145,7 @@ def dataservices_batched():
148
145
  # print(f"Batch {i//batch_size}: IDs {i} to {i+batch_size}")
149
146
  ids_batched = ids[i : i + batch_size]
150
147
  print(f"Batch {i//batch_size}: IDs {ids_batched}")
151
- triples = dsh_batched.get_triples_for_subjects(ids_batched)
148
+ triples = dsh_batched.harvest(ids_batched)
152
149
  print(f"Batch {i//batch_size}: Triples {len(triples)}")
153
150
 
154
151