RubyGems - briard - Versions diffs - 2.4.1 → 2.6.0 - Mend

briard 2.4.1 → 2.6.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (81)

checksums.yaml +4 -4
data/.github/workflows/codeql-analysis.yml +72 -0
data/.github/workflows/rubocop.yml +50 -0
data/.rubocop.yml +144 -620
data/.rubocop_todo.yml +76 -0
data/CHANGELOG.md +22 -0
data/Gemfile +2 -0
data/Gemfile.lock +43 -6
data/Rakefile +1 -1
data/{bolognese.gemspec → briard.gemspec} +46 -38
data/lib/briard/array.rb +2 -2
data/lib/briard/author_utils.rb +79 -71
data/lib/briard/cli.rb +12 -13
data/lib/briard/crossref_utils.rb +73 -61
data/lib/briard/datacite_utils.rb +132 -106
data/lib/briard/doi_utils.rb +10 -10
data/lib/briard/metadata.rb +96 -106
data/lib/briard/metadata_utils.rb +87 -78
data/lib/briard/readers/bibtex_reader.rb +65 -65
data/lib/briard/readers/cff_reader.rb +88 -70
data/lib/briard/readers/citeproc_reader.rb +90 -84
data/lib/briard/readers/codemeta_reader.rb +68 -50
data/lib/briard/readers/crosscite_reader.rb +2 -2
data/lib/briard/readers/crossref_reader.rb +249 -210
data/lib/briard/readers/datacite_json_reader.rb +3 -3
data/lib/briard/readers/datacite_reader.rb +225 -189
data/lib/briard/readers/npm_reader.rb +49 -42
data/lib/briard/readers/ris_reader.rb +82 -80
data/lib/briard/readers/schema_org_reader.rb +182 -159
data/lib/briard/string.rb +1 -1
data/lib/briard/utils.rb +4 -4
data/lib/briard/version.rb +3 -1
data/lib/briard/whitelist_scrubber.rb +11 -4
data/lib/briard/writers/bibtex_writer.rb +14 -8
data/lib/briard/writers/cff_writer.rb +33 -26
data/lib/briard/writers/codemeta_writer.rb +19 -15
data/lib/briard/writers/csv_writer.rb +6 -4
data/lib/briard/writers/datacite_json_writer.rb +8 -2
data/lib/briard/writers/jats_writer.rb +33 -28
data/lib/briard/writers/rdf_xml_writer.rb +1 -1
data/lib/briard/writers/ris_writer.rb +30 -18
data/lib/briard/writers/turtle_writer.rb +1 -1
data/lib/briard.rb +6 -6
data/rubocop.sarif +0 -0
data/spec/array_spec.rb +5 -5
data/spec/author_utils_spec.rb +151 -132
data/spec/datacite_utils_spec.rb +135 -83
data/spec/doi_utils_spec.rb +168 -164
data/spec/find_from_format_spec.rb +69 -69
data/spec/fixtures/vcr_cassettes/Briard_Metadata/sanitize/onlies_keep_specific_tags.yml +65 -0
data/spec/fixtures/vcr_cassettes/Briard_Metadata/sanitize/removes_a_tags.yml +65 -0
data/spec/metadata_spec.rb +91 -90
data/spec/readers/bibtex_reader_spec.rb +43 -38
data/spec/readers/cff_reader_spec.rb +165 -153
data/spec/readers/citeproc_reader_spec.rb +45 -40
data/spec/readers/codemeta_reader_spec.rb +128 -115
data/spec/readers/crosscite_reader_spec.rb +34 -24
data/spec/readers/crossref_reader_spec.rb +1098 -939
data/spec/readers/datacite_json_reader_spec.rb +53 -40
data/spec/readers/datacite_reader_spec.rb +1541 -1337
data/spec/readers/npm_reader_spec.rb +48 -43
data/spec/readers/ris_reader_spec.rb +53 -47
data/spec/readers/schema_org_reader_spec.rb +329 -267
data/spec/spec_helper.rb +6 -5
data/spec/utils_spec.rb +371 -347
data/spec/writers/bibtex_writer_spec.rb +143 -143
data/spec/writers/cff_writer_spec.rb +96 -90
data/spec/writers/citation_writer_spec.rb +34 -33
data/spec/writers/citeproc_writer_spec.rb +226 -224
data/spec/writers/codemeta_writer_spec.rb +18 -16
data/spec/writers/crosscite_writer_spec.rb +91 -73
data/spec/writers/crossref_writer_spec.rb +99 -91
data/spec/writers/csv_writer_spec.rb +70 -70
data/spec/writers/datacite_json_writer_spec.rb +78 -68
data/spec/writers/datacite_writer_spec.rb +417 -322
data/spec/writers/jats_writer_spec.rb +177 -161
data/spec/writers/rdf_xml_writer_spec.rb +68 -63
data/spec/writers/ris_writer_spec.rb +162 -162
data/spec/writers/turtle_writer_spec.rb +47 -47
metadata +250 -160
data/.github/workflows/release.yml +0 -47

data/lib/briard/readers/npm_reader.rb CHANGED Viewed

@@ -3,39 +3,41 @@
 module Briard
   module Readers
     module NpmReader
-      def get_npm(id: nil, **options)
-        return { "string" => nil, "state" => "not_found" } unless id.present?
+      def get_npm(id: nil, **_options)
+        return { 'string' => nil, 'state' => 'not_found' } unless id.present?
         id = normalize_id(id)
-        response = Maremma.get(id, accept: "json", raw: true)
-        string = response.body.fetch("data", nil)
+        response = Maremma.get(id, accept: 'json', raw: true)
+        string = response.body.fetch('data', nil)
-        { "string" => string }
+        { 'string' => string }
       end
       def read_npm(string: nil, **options)
         if string.present?
           errors = jsonlint(string)
-          return { "errors" => errors } if errors.present?
+          return { 'errors' => errors } if errors.present?
         end
-        read_options = ActiveSupport::HashWithIndifferentAccess.new(options.except(:doi, :id, :url, :sandbox, :validate, :ra))
+        read_options = ActiveSupport::HashWithIndifferentAccess.new(options.except(:doi, :id, :url,
+                                                                                   :sandbox, :validate, :ra))
         meta = string.present? ? Maremma.from_json(string) : {}
         types = {
-          "resourceTypeGeneral" => "Software",
-          "reourceType" => "NPM Package",
-          "schemaOrg" => "SoftwareSourceCode",
-          "citeproc" => "article",
-          "bibtex" => "misc",
-          "ris" => "GEN"
+          'resourceTypeGeneral' => 'Software',
+          'reourceType' => 'NPM Package',
+          'schemaOrg' => 'SoftwareSourceCode',
+          'citeproc' => 'article',
+          'bibtex' => 'misc',
+          'ris' => 'GEN'
         }.compact
-        creators = if meta.fetch("author", nil).present?
-          get_authors(Array.wrap(meta.fetch("author", nil)))
-        else
-          [{ "nameType" => "Organizational", "name" => ":(unav)" }]
-        end
+        creators = if meta.fetch('author', nil).present?
+                     get_authors(Array.wrap(meta.fetch('author', nil)))
+                   else
+                     [{ 'nameType' => 'Organizational', 'name' => ':(unav)' }]
+                   end
         # contributors = get_authors(from_citeproc(Array.wrap(meta.fetch("editor", nil))))
         # dates = if date = get_date_from_date_parts(meta.fetch("issued", nil))
         #           if Date.edtf(date).present?
@@ -44,8 +46,8 @@ module Briard
         #           end
         #         end
         # publication_year = get_date_from_date_parts(meta.fetch("issued", nil)).to_s[0..3]
-        rights_list = if meta.fetch("license", nil)
-                        [{ "rights" => meta.fetch("license") }.compact]
+        rights_list = if meta.fetch('license', nil)
+                        [{ 'rights' => meta.fetch('license') }.compact]
                       end
         # related_identifiers = if meta.fetch("container-title", nil).present? && meta.fetch("ISSN", nil).present?
         #                         [{ "type" => "Periodical",
@@ -83,31 +85,36 @@ module Briard
         # id = Array.wrap(identifiers).first.to_h.fetch("identifier", nil)
         # doi = Array.wrap(identifiers).find { |r| r["identifierType"] == "DOI" }.to_h.fetch("identifier", nil)
         # state = id.present? || read_options.present? ? "findable" : "not_found"
-        subjects = Array.wrap(meta.fetch("keywords", nil)).map do |s|
-          { "subject" => s }
+        subjects = Array.wrap(meta.fetch('keywords', nil)).map do |s|
+          { 'subject' => s }
         end
-        {
-          #"id" => id,
-          #"identifiers" => identifiers,
-          "types" => types,
-          #"doi" => doi_from_url(doi),
-          #"url" => normalize_id(meta.fetch("URL", nil)),
-          "titles" => [{ "title" => meta.fetch("name", nil) }],
-          "creators" => creators,
-          #"contributors" => contributors,
-          #"container" => container,
-          #"publisher" => meta.fetch("publisher", nil),
-          #"related_identifiers" => related_identifiers,
-          #"dates" => dates,
-          #"publication_year" => publication_year,
-          "descriptions" => meta.fetch("description", nil).present? ? [{ "description" => sanitize(meta.fetch("description")), "descriptionType" => "Abstract" }] : [],
-          "rights_list" => rights_list,
-          "version_info" => meta.fetch("version", nil),
-          "subjects" => subjects
-          #"state" => state
+        {
+          # "id" => id,
+          # "identifiers" => identifiers,
+          'types' => types,
+          # "doi" => doi_from_url(doi),
+          # "url" => normalize_id(meta.fetch("URL", nil)),
+          'titles' => [{ 'title' => meta.fetch('name', nil) }],
+          'creators' => creators,
+          # "contributors" => contributors,
+          # "container" => container,
+          # "publisher" => meta.fetch("publisher", nil),
+          # "related_identifiers" => related_identifiers,
+          # "dates" => dates,
+          # "publication_year" => publication_year,
+          'descriptions' => if meta.fetch('description', nil).present?
+                              [{ 'description' => sanitize(meta.fetch('description')),
+                                 'descriptionType' => 'Abstract' }]
+                            else
+                              []
+                            end,
+          'rights_list' => rights_list,
+          'version_info' => meta.fetch('version', nil),
+          'subjects' => subjects
+          # "state" => state
         }.merge(read_options)
       end
     end

data/lib/briard/readers/ris_reader.rb CHANGED Viewed

@@ -4,110 +4,112 @@ module Briard
   module Readers
     module RisReader
       RIS_TO_SO_TRANSLATIONS = {
-        "BLOG" => "BlogPosting",
-        "GEN" => "CreativeWork",
-        "CTLG" => "DataCatalog",
-        "DATA" => "Dataset",
-        "FIGURE" => "ImageObject",
-        "THES" => "Thesis",
-        "MPCT" => "Movie",
-        "JOUR" => "ScholarlyArticle",
-        "COMP" => "SoftwareSourceCode",
-        "VIDEO" => "VideoObject",
-        "ELEC" => "WebPage"
-      }
+        'BLOG' => 'BlogPosting',
+        'GEN' => 'CreativeWork',
+        'CTLG' => 'DataCatalog',
+        'DATA' => 'Dataset',
+        'FIGURE' => 'ImageObject',
+        'THES' => 'Thesis',
+        'MPCT' => 'Movie',
+        'JOUR' => 'ScholarlyArticle',
+        'COMP' => 'SoftwareSourceCode',
+        'VIDEO' => 'VideoObject',
+        'ELEC' => 'WebPage'
+      }.freeze
-      RIS_TO_CP_TRANSLATIONS = {
-        "JOUR" => "article-journal"
-      }
+      RIS_TO_CP_TRANSLATIONS = { 'JOUR' => 'article-journal' }.freeze
       RIS_TO_BIB_TRANSLATIONS = {
-        "JOUR" => "article",
-        "BOOK" => "book",
-        "CHAP" => "inbook",
-        "CPAPER" => "inproceedings",
-        "GEN" => "misc",
-        "THES" => "phdthesis",
-        "CONF" => "proceedings",
-        "RPRT" => "techreport",
-        "UNPD" => "unpublished"
-      }
+        'JOUR' => 'article',
+        'BOOK' => 'book',
+        'CHAP' => 'inbook',
+        'CPAPER' => 'inproceedings',
+        'GEN' => 'misc',
+        'THES' => 'phdthesis',
+        'CONF' => 'proceedings',
+        'RPRT' => 'techreport',
+        'UNPD' => 'unpublished'
+      }.freeze
       def read_ris(string: nil, **options)
-        read_options = ActiveSupport::HashWithIndifferentAccess.new(options.except(:doi, :id, :url, :sandbox, :validate, :ra))
+        read_options = ActiveSupport::HashWithIndifferentAccess.new(options.except(:doi, :id, :url,
+                                                                                   :sandbox, :validate, :ra))
         meta = ris_meta(string: string)
-        ris_type = meta.fetch("TY", nil) || "GEN"
-        schema_org = RIS_TO_SO_TRANSLATIONS[ris_type] || "CreativeWork"
+        ris_type = meta.fetch('TY', nil) || 'GEN'
+        schema_org = RIS_TO_SO_TRANSLATIONS[ris_type] || 'CreativeWork'
         types = {
-          "resourceTypeGeneral" => Metadata::RIS_TO_DC_TRANSLATIONS[ris_type],
-          "schemaOrg" => schema_org,
-          "citeproc" => RIS_TO_CP_TRANSLATIONS[schema_org] || "misc",
-          "ris" => ris_type
+          'resourceTypeGeneral' => Metadata::RIS_TO_DC_TRANSLATIONS[ris_type],
+          'schemaOrg' => schema_org,
+          'citeproc' => RIS_TO_CP_TRANSLATIONS[schema_org] || 'misc',
+          'ris' => ris_type
         }.compact
-        id = normalize_doi(options[:doi] || meta.fetch("DO", nil))
+        id = normalize_doi(options[:doi] || meta.fetch('DO', nil))
-        author = Array.wrap(meta.fetch("AU", nil)).map { |a| { "creatorName" => a } }
-        date_parts = meta.fetch("PY", nil).to_s.split("/")
-        created_date_parts = meta.fetch("Y1", nil).to_s.split("/")
+        author = Array.wrap(meta.fetch('AU', nil)).map { |a| { 'creatorName' => a } }
+        date_parts = meta.fetch('PY', nil).to_s.split('/')
+        created_date_parts = meta.fetch('Y1', nil).to_s.split('/')
         dates = []
-        dates << { "date" => get_date_from_parts(*date_parts), "dateType" => "Issued" } if meta.fetch("PY", nil).present?
-        dates << { "date" => get_date_from_parts(*created_date_parts), "dateType" => "Created" } if meta.fetch("Y1", nil).present?
-        publication_year = get_date_from_parts(*date_parts).to_s[0..3]
-        related_identifiers = if meta.fetch("T2", nil).present? && meta.fetch("SN", nil).present?
-          [{ "type" => "Periodical",
-             "id" => meta.fetch("SN", nil),
-             "relatedIdentifierType" => "ISSN",
-             "relationType" => "IsPartOf",
-             "title" => meta.fetch("T2", nil), }.compact]
-        else
-          []
+        if meta.fetch('PY', nil).present?
+          dates << { 'date' => get_date_from_parts(*date_parts), 'dateType' => 'Issued' }
         end
-        container = if meta.fetch("T2", nil).present?
-          { "type" => "Journal",
-            "title" => meta.fetch("T2", nil),
-            "identifier" => meta.fetch("SN", nil),
-            "volume" => meta.fetch("VL", nil),
-            "issue" => meta.fetch("IS", nil),
-            "firstPage" => meta.fetch("SP", nil),
-            "lastPage" => meta.fetch("EP", nil) }.compact
-        else
-          nil
+        if meta.fetch('Y1', nil).present?
+          dates << { 'date' => get_date_from_parts(*created_date_parts), 'dateType' => 'Created' }
         end
-        state = meta.fetch("DO", nil).present? || read_options.present? ? "findable" : "not_found"
-        subjects = Array.wrap(meta.fetch("KW", nil)).reduce([]) do |sum, subject|
+        publication_year = get_date_from_parts(*date_parts).to_s[0..3]
+        related_identifiers = if meta.fetch('T2', nil).present? && meta.fetch('SN', nil).present?
+                                [{ 'type' => 'Periodical',
+                                   'id' => meta.fetch('SN', nil),
+                                   'relatedIdentifierType' => 'ISSN',
+                                   'relationType' => 'IsPartOf',
+                                   'title' => meta.fetch('T2', nil) }.compact]
+                              else
+                                []
+                              end
+        container = if meta.fetch('T2', nil).present?
+                      { 'type' => 'Journal',
+                        'title' => meta.fetch('T2', nil),
+                        'identifier' => meta.fetch('SN', nil),
+                        'volume' => meta.fetch('VL', nil),
+                        'issue' => meta.fetch('IS', nil),
+                        'firstPage' => meta.fetch('SP', nil),
+                        'lastPage' => meta.fetch('EP', nil) }.compact
+                    end
+        state = meta.fetch('DO', nil).present? || read_options.present? ? 'findable' : 'not_found'
+        subjects = Array.wrap(meta.fetch('KW', nil)).reduce([]) do |sum, subject|
           sum += name_to_fos(subject)
           sum
         end
-        { "id" => id,
-          "types" => types,
-          "doi" => doi_from_url(id),
-          "url" => meta.fetch("UR", nil),
-          "titles" => meta.fetch("T1", nil).present? ? [{ "title" => meta.fetch("T1", nil) }] : nil,
-          "creators" => get_authors(author),
-          "publisher" => meta.fetch("PB", "(:unav)"),
-          "container" => container,
-          "related_identifiers" => related_identifiers,
-          "dates" => dates,
-          "publication_year" => publication_year,
-          "descriptions" => meta.fetch("AB", nil).present? ? [{ "description" => sanitize(meta.fetch("AB")), "descriptionType" => "Abstract" }] : nil,
-          "subjects" => subjects,
-          "language" => meta.fetch("LA", nil),
-          "state" => state
-        }.merge(read_options)
+        { 'id' => id,
+          'types' => types,
+          'doi' => doi_from_url(id),
+          'url' => meta.fetch('UR', nil),
+          'titles' => meta.fetch('T1', nil).present? ? [{ 'title' => meta.fetch('T1', nil) }] : nil,
+          'creators' => get_authors(author),
+          'publisher' => meta.fetch('PB', '(:unav)'),
+          'container' => container,
+          'related_identifiers' => related_identifiers,
+          'dates' => dates,
+          'publication_year' => publication_year,
+          'descriptions' => if meta.fetch('AB', nil).present?
+                              [{ 'description' => sanitize(meta.fetch('AB')),
+                                 'descriptionType' => 'Abstract' }]
+                            end,
+          'subjects' => subjects,
+          'language' => meta.fetch('LA', nil),
+          'state' => state }.merge(read_options)
       end
       def ris_meta(string: nil)
-        h = Hash.new { |h,k| h[k] = [] }
-        string.split("\n").reduce(h) do |sum, line|
-          k, v = line.split("-",2)
+        h = Hash.new { |h, k| h[k] = [] }
+        string.split("\n").each_with_object(h) do |line, _sum|
+          k, v = line.split('-', 2)
           h[k.strip] << v.to_s.strip
-          sum
-        end.map { |k,v| [k, v.unwrap] }.to_h.compact
+        end.transform_values(&:unwrap).compact
       end
     end
   end