PyPI - commonmeta-py - Versions diffs - 0.126__py3-none-any.whl → 0.127__py3-none-any.whl - Mend

commonmeta-py 0.126__py3-none-any.whl → 0.127__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

commonmeta/__init__.py CHANGED Viewed

@@ -10,7 +10,7 @@ commonmeta-py is a Python library to convert scholarly metadata
 """
 __title__ = "commonmeta-py"
-__version__ = "0.126"
+__version__ = "0.127"
 __author__ = "Martin Fenner"
 __license__ = "MIT"
@@ -96,6 +96,7 @@ from .utils import (
     normalize_url,
     pages_as_string,
     replace_curie,
+    string_to_slug,
     to_csl,
     validate_orcid,
     validate_ror,

commonmeta/utils.py CHANGED Viewed

@@ -128,6 +128,57 @@ FOS_MAPPINGS = {
     "Other humanities": "http://www.oecd.org/science/inno/38235147.pdf?6.5",
 }
+FOS_TO_STRING_MAPPINGS = {
+    "Natural sciences": "naturalSciences",
+    "Mathematics": "mathematics",
+    "Computer and information sciences": "computerAndInformationSciences",
+    "Physical sciences": "physicalSciences",
+    "Chemical sciences": "chemicalSciences",
+    "Earth and related environmental sciences": "earthAndRelatedEnvironmentalSciences",
+    "Biological sciences": "biologicalSciences",
+    "Other natural sciences": "otherNaturalSciences",
+    "Engineering and technology": "engineeringAndTechnology",
+    "Civil engineering": "civilEngineering",
+    "Electrical engineering, electronic engineering, information engineering": "electricalEngineering",
+    "Mechanical engineering": "mechanicalEngineering",
+    "Chemical engineering": "chemicalEngineering",
+    "Materials engineering": "materialsEngineering",
+    "Medical engineering": "medicalEngineering",
+    "Environmental engineering": "environmentalEngineering",
+    "Environmental biotechnology": "environmentalBiotechnology",
+    "Industrial biotechnology": "industrialBiotechnology",
+    "Nano technology": "nanoTechnology",
+    "Other engineering and technologies": "otherEngineeringAndTechnologies",
+    "Medical and health sciences": "medicalAndHealthSciences",
+    "Basic medicine": "basicMedicine",
+    "Clinical medicine": "clinicalMedicine",
+    "Health sciences": "healthSciences",
+    "Health biotechnology": "healthBiotechnology",
+    "Other medical sciences": "otherMedicalSciences",
+    "Agricultural sciences": "agriculturalSciences",
+    "Agriculture, forestry, and fisheries": "agricultureForestryAndFisheries",
+    "Animal and dairy science": "animalAndDairyScience",
+    "Veterinary science": "veterinaryScience",
+    "Agricultural biotechnology": "agriculturalBiotechnology",
+    "Other agricultural sciences": "otherAgriculturalSciences",
+    "Social science": "socialScience",
+    "Psychology": "psychology",
+    "Economics and business": "economicsAndBusiness",
+    "Educational sciences": "educationalSciences",
+    "Sociology": "sociology",
+    "Law": "law",
+    "Political science": "politicalScience",
+    "Social and economic geography": "socialAndEconomicGeography",
+    "Media and communications": "mediaAndCommunications",
+    "Other social sciences": "otherSocialSciences",
+    "Humanities": "humanities",
+    "History and archaeology": "historyAndArchaeology",
+    "Languages and literature": "languagesAndLiterature",
+    "Philosophy, ethics and religion": "philosophyEthicsAndReligion",
+    "Arts (arts, history of arts, performing arts, music)": "artsArtsHistoryOfArtsPerformingArtsMusic",
+    "Other humanities": "otherHumanities",
+}
 def normalize_id(pid: Optional[str], **kwargs) -> Optional[str]:
     """Check for valid DOI or HTTP(S) URL"""
@@ -1274,6 +1325,26 @@ def subjects_as_string(subjects):
     return ", ".join(keywords)
+def string_to_slug(text):
+    """makes a string lowercase and removes non-alphanumeric characters"""
+    # Remove FOS (Fields of Science) prefix
+    text = text.removeprefix("FOS: ")
+    # Lookup FOS name
+    slug = FOS_TO_STRING_MAPPINGS.get(text, None)
+    if slug is not None:
+        return slug.lower()
+    # Replace spaces with hyphens
+    slug = re.sub(r"\s+", "-", text.lower())
+    # Remove special characters
+    slug = re.sub(r"[^a-z0-9-]", "", slug)
+    # Remove multiple consecutive hyphens
+    slug = re.sub(r"-+", "-", slug)
+    # Remove leading and trailing hyphens
+    slug = slug.strip("-")
+    return slug
 # def reverse():
 #       return { 'citation': wrap(related_identifiers).select do |ri|
 #                         ri['relationType'] == 'IsReferencedBy'

commonmeta/writers/inveniordm_writer.py CHANGED Viewed

@@ -1,13 +1,13 @@
 """InvenioRDM writer for commonmeta-py"""
 import logging
-import re
 from time import time
 from typing import Dict, Optional
 import orjson as json
 import pydash as py_
 import requests
+from urllib3._collections import HTTPHeaderDict
 from ..base_utils import compact, parse_attributes, presence, wrap
 from ..constants import (
@@ -18,13 +18,14 @@ from ..constants import (
     Commonmeta,
 )
 from ..date_utils import get_iso8601_date
-from ..doi_utils import doi_as_url, doi_from_url, normalize_doi
+from ..doi_utils import doi_from_url, normalize_doi
 from ..utils import (
     FOS_MAPPINGS,
     get_language,
     id_from_url,
     normalize_url,
     pages_as_string,
+    string_to_slug,
     validate_orcid,
     validate_ror,
 )
@@ -399,28 +400,17 @@ def push_inveniordm(metadata: Commonmeta, host: str, token: str, **kwargs) -> Di
             "doi": doi,
         }
-        # extract optional information needed but not upserted to the InvenioRDM API:
-        # rid is the InvenioRDM record id,
-        # uuid is the Rogue Scholar uuid,
-        # community_id is the id of the primary community of the record
+        # extract optional information needed
+        # uuid is the Rogue Scholar uuid
+        # community_id is the id of the primary community of the record,
+        # in the case of Rogue Scholar the blog community
         if hasattr(metadata, "identifiers") and metadata.identifiers:
-            rid_index = None
-            uuid_index = None
             for i, identifier in enumerate(metadata.identifiers):
-                if identifier.get("identifierType") == "RID" and identifier.get(
-                    "identifier"
-                ):
-                    record["id"] = identifier.get("identifier")
-                    rid_index = i
-                elif identifier.get("identifierType") == "UUID" and identifier.get(
+                if identifier.get("identifierType") == "UUID" and identifier.get(
                     "identifier"
                 ):
                     record["uuid"] = identifier.get("identifier")
-                    uuid_index = i
-            if rid_index is not None:
-                metadata.identifiers.pop(rid_index)
-            if uuid_index is not None:
-                metadata.identifiers.pop(uuid_index)
         if hasattr(metadata, "relations") and metadata.relations:
             community_index = None
@@ -434,6 +424,7 @@ def push_inveniordm(metadata: Commonmeta, host: str, token: str, **kwargs) -> Di
                         record["community"] = slug
                         record["community_id"] = community_id
                         community_index = i
+                        break
             if community_index is not None:
                 metadata.relations.pop(community_index)
@@ -496,8 +487,14 @@ def add_record_to_communities(
 ) -> dict:
     """Add record to one or more InvenioRDM communities"""
+    communities = get_record_communities(record, host, token)
+    community_ids = [c.get("id") for c in communities] if communities else []
     # Add record to primary community if primary community is specified
-    if record.get("community_id", None) is not None:
+    if (
+        record.get("community_id", None) is not None
+        and record.get("community_id") not in community_ids
+    ):
         record = add_record_to_community(record, host, token, record["community_id"])
     # Add record to subject area community if subject area community is specified
@@ -509,9 +506,8 @@ def add_record_to_communities(
             slug = string_to_slug(subject_name)
             if slug in COMMUNITY_TRANSLATIONS:
                 slug = COMMUNITY_TRANSLATIONS[slug]
             community_id = search_by_slug(slug, "topic", host, token)
-            if community_id:
+            if community_id and community_id not in community_ids:
                 record = add_record_to_community(record, host, token, community_id)
     # Add record to communities defined as IsPartOf relation in InvenioRDM RelatedIdentifiers
@@ -522,7 +518,7 @@ def add_record_to_communities(
             ).startswith(f"https://{host}/api/communities/"):
                 slug = identifier.get("identifier").split("/")[5]
                 community_id = search_by_slug(slug, "topic", host, token)
-                if community_id:
+                if community_id and community_id not in community_ids:
                     record = add_record_to_community(record, host, token, community_id)
     return record
@@ -664,8 +660,6 @@ def publish_draft_record(record, host, token):
             record["status"] = "error_publish_draft_record"
             return record
         data = response.json()
-        record["uuid"] = py_.get(data, "metadata.identifiers.0.identifier")
-        record["doi"] = (doi_as_url(py_.get(data, "pids.doi.identifier")),)
         record["created"] = data.get("created", None)
         record["updated"] = data.get("updated", None)
         record["status"] = "published"
@@ -676,17 +670,39 @@ def publish_draft_record(record, host, token):
         return record
+def get_record_communities(record, host, token):
+    """Get record communities by id"""
+    headers = {
+        "Authorization": f"Bearer {token}",
+        "Content-Type": "application/json",
+    }
+    try:
+        response = requests.get(
+            f"https://{host}/api/records/{record['id']}/communities",
+            headers=headers,
+        )
+        response.raise_for_status()
+        data = response.json()
+        if py_.get(data, "hits.total", 0) > 0:
+            return py_.get(data, "hits.hits")
+        return None
+    except requests.exceptions.RequestException as e:
+        logger.error(f"Error getting communities: {str(e)}", exc_info=True)
+        return None
 def add_record_to_community(record, host, token, community_id):
-    """Add a record to a community in InvenioRDM"""
+    """Add a record to a community"""
     headers = {
         "Authorization": f"Bearer {token}",
         "Content-Type": "application/json",
     }
+    json = {"communities": [{"id": community_id}]}
     try:
         response = requests.post(
             f"https://{host}/api/records/{record['id']}/communities",
             headers=headers,
-            json={"id": community_id},
+            json=json,
         )
         response.raise_for_status()
         return record
@@ -750,7 +766,11 @@ def search_by_slug(slug: str, type_value: str, host: str, token: str) -> Optiona
         "Authorization": f"Bearer {token}",
         "Content-Type": "application/json",
     }
-    params = {"q": f"slug:{slug} AND type:{type_value}", "size": 1}
+    params = HTTPHeaderDict()
+    params.add("q", f"slug:{slug}")
+    params.add("type", type_value)
+    params.add("type", "subject")
+    params.add("size", 1)
     try:
         response = requests.get(
             f"https://{host}/api/communities", headers=headers, params=params
@@ -765,18 +785,5 @@ def search_by_slug(slug: str, type_value: str, host: str, token: str) -> Optiona
         return None
-def string_to_slug(text):
-    """makes a string lowercase and removes non-alphanumeric characters"""
-    # Replace spaces with hyphens
-    slug = re.sub(r"\s+", "-", text.lower())
-    # Remove special characters
-    slug = re.sub(r"[^a-z0-9-]", "", slug)
-    # Remove multiple consecutive hyphens
-    slug = re.sub(r"-+", "-", slug)
-    # Remove leading and trailing hyphens
-    slug = slug.strip("-")
-    return slug
 class InvenioRDMError(Exception):
     """Custom exception for InvenioRDM API errors"""

{commonmeta_py-0.126.dist-info → commonmeta_py-0.127.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: commonmeta-py
-Version: 0.126
+Version: 0.127
 Summary: Library for conversions to/from the Commonmeta scholarly metadata format
 Project-URL: Homepage, https://python.commonmeta.org
 Project-URL: Repository, https://github.com/front-matter/commonmeta-py

{commonmeta_py-0.126.dist-info → commonmeta_py-0.127.dist-info}/RECORD RENAMED Viewed

@@ -1,4 +1,4 @@
-commonmeta/__init__.py,sha256=imnf6kwadjjF_Pq3XiozlWDZ5DKHoIOuIcrwypD4zxs,2098
+commonmeta/__init__.py,sha256=42EVUELvqJzvTf3X-JSjCvuqNyS1chKRYTzVrwp8ZY0,2118
 commonmeta/api_utils.py,sha256=P8LMHHYiF4OTi97_5k4KstcBreooMkOAKZ4ebxsAv4o,2691
 commonmeta/author_utils.py,sha256=3lYW5s1rOUWNTKs1FP6XLfEUY3yCLOe_3L_VdJTDMp0,8585
 commonmeta/base_utils.py,sha256=-MGy9q2uTiJEkPWQUYOJMdq-3tRpNnvBwlLjvllQ5g8,11164
@@ -10,7 +10,7 @@ commonmeta/file_utils.py,sha256=eFYDWyR8Gr722nvFmp542hCm-TGmO_q4ciZ85IPHpjA,2893
 commonmeta/metadata.py,sha256=90aTe47d071wHxwcNsOqU5lSVPKP8wAPnPHhddj3Fuo,18443
 commonmeta/schema_utils.py,sha256=zn3gqAHciUOQmrw9okR68weFs-yqPPyORFt-Zl1D3Lw,1924
 commonmeta/translators.py,sha256=CBMK4jrXRmGZiAhCh6wsJjhbDJWbcsda8UvXFXxccAw,1363
-commonmeta/utils.py,sha256=pJnh3EzOU1E2nutnAZsopY_NsUX6zYmxoj5bIYqqWvE,50574
+commonmeta/utils.py,sha256=HzgVlcRqtDXMwlbTXL0AKL3jHB6E9kEAljS5nXKdOm0,53852
 commonmeta/readers/__init__.py,sha256=vOf7UsOKNoh_ZCuyexxhAmPMt8wjB-pF_CfpWRaN8pk,45
 commonmeta/readers/bibtex_reader.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 commonmeta/readers/cff_reader.py,sha256=HMFK6QIg_XIlhmYIWL4EfIyuidYl5L_0TAwyG78XPlU,6244
@@ -80,11 +80,11 @@ commonmeta/writers/commonmeta_writer.py,sha256=QpfyhG__7o_XpsOTCPWxGymO7YKwZi2LQ
 commonmeta/writers/crossref_xml_writer.py,sha256=rcPOfrGxU4mX7_fFywYWDW2FFUoKW9wD-JzW8nX1ipI,33915
 commonmeta/writers/csl_writer.py,sha256=4gDYs1EzK4_L2UIRTfs25wgHmYRwdRP2zmfxF9387oU,2779
 commonmeta/writers/datacite_writer.py,sha256=bcinpwhq7XnVthKHH8-sdXA34dSlvFH4ImYH768iaQU,6428
-commonmeta/writers/inveniordm_writer.py,sha256=MeMFImmjhmtCyNPq3Txd6COIvayE3PImmxm0_nDfDmQ,26796
+commonmeta/writers/inveniordm_writer.py,sha256=w4DTPjWk1YBtva9RWAq9DnDzmhpa0ejws2h2h-Pfz7A,26854
 commonmeta/writers/ris_writer.py,sha256=3SdyEvMRaPRP1SV1MB-MXBlunE7x6og7RF1zuWtetPc,2094
 commonmeta/writers/schema_org_writer.py,sha256=s18_x0ReXwAGBoEAwp2q-HCgFQ-h5qRg6JyAlqCoSFE,5871
-commonmeta_py-0.126.dist-info/METADATA,sha256=w6m0e9-YGX-8r8u0AHoI5h71SaLIdwGmtrJTY4df4r0,7656
-commonmeta_py-0.126.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-commonmeta_py-0.126.dist-info/entry_points.txt,sha256=U4w4BoRuS3rN5t5Y-uYSyOeU5Lh_VRVMS9OIDzIgw4w,50
-commonmeta_py-0.126.dist-info/licenses/LICENSE,sha256=wsIvxF9Q9GC9vA_s79zTWP3BkXJdfUNRmALlU8GbW1s,1074
-commonmeta_py-0.126.dist-info/RECORD,,
+commonmeta_py-0.127.dist-info/METADATA,sha256=JHsi5YfGnb7zlq9vkkG_rh0PqIRbfKnLC7bM5QF8v1I,7656
+commonmeta_py-0.127.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+commonmeta_py-0.127.dist-info/entry_points.txt,sha256=U4w4BoRuS3rN5t5Y-uYSyOeU5Lh_VRVMS9OIDzIgw4w,50
+commonmeta_py-0.127.dist-info/licenses/LICENSE,sha256=wsIvxF9Q9GC9vA_s79zTWP3BkXJdfUNRmALlU8GbW1s,1074
+commonmeta_py-0.127.dist-info/RECORD,,

{commonmeta_py-0.126.dist-info → commonmeta_py-0.127.dist-info}/WHEEL RENAMED Viewed

File without changes

{commonmeta_py-0.126.dist-info → commonmeta_py-0.127.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{commonmeta_py-0.126.dist-info → commonmeta_py-0.127.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

commonmeta-py 0.126__py3-none-any.whl → 0.127__py3-none-any.whl

commonmeta-py 0.126__py3-none-any.whl → 0.127__py3-none-any.whl