RubyGems - relaton-nist - Versions diffs - 1.7.4 → 1.9.2 - Mend

relaton-nist 1.7.4 → 1.9.2

Files changed (23) hide show

checksums.yaml +4 -4
data/.github/workflows/rake.yml +1 -11
data/.gitignore +1 -0
data/.rubocop.yml +1 -1
data/README.adoc +19 -0
data/bin/rspec +29 -0
data/grammars/basicdoc.rng +165 -20
data/grammars/biblio.rng +5 -6
data/grammars/isodoc.rng +532 -16
data/grammars/nist.rng +9 -0
data/grammars/reqt.rng +31 -2
data/lib/relaton_nist/data_fetcher.rb +221 -0
data/lib/relaton_nist/hit.rb +3 -1
data/lib/relaton_nist/hit_collection.rb +71 -58
data/lib/relaton_nist/nist_bibliographic_item.rb +1 -1
data/lib/relaton_nist/nist_bibliography.rb +16 -6
data/lib/relaton_nist/processor.rb +5 -0
data/lib/relaton_nist/scrapper.rb +198 -265
data/lib/relaton_nist/version.rb +1 -1
data/lib/relaton_nist/xml_parser.rb +1 -1
data/lib/relaton_nist.rb +1 -0
data/relaton_nist.gemspec +3 -5
metadata +9 -7

data/lib/relaton_nist/nist_bibliographic_item.rb CHANGED Viewed

@@ -67,7 +67,7 @@ module RelatonNist
     # @return [RelatonNist::GbBibliographicItem]
     def self.from_hash(hash)
       item_hash = RelatonNist::HashConverter.hash_to_bib(hash)
-      new **item_hash
+      new(**item_hash)
     end
     # @param opts [Hash]

data/lib/relaton_nist/nist_bibliography.rb CHANGED Viewed

@@ -14,9 +14,9 @@ module RelatonNist
       # @param text [String]
       # @return [RelatonNist::HitCollection]
       def search(text, year = nil, opts = {})
-        HitCollection.new text, year, opts
-      rescue OpenURI::HTTPError, SocketError, OpenSSL::SSL::SSLError
-        raise RelatonBib::RequestError, "Could not access https://www.nist.gov"
+        HitCollection.search text, year, opts
+      rescue OpenURI::HTTPError, SocketError, OpenSSL::SSL::SSLError => e
+        raise RelatonBib::RequestError, e.message
       end
       # @param code [String] the NIST standard Code to look up (e..g "8200")
@@ -174,7 +174,17 @@ module RelatonNist
         }
         ref = matches[:code] ? "#{matches[:serie]} #{matches[:code]}" : code
         result = search(ref, year, opts)
-        result.select { |i| search_filter i, matches, code }
+        selected_result = result.select { |i| search_filter i, matches, code }
+        return selected_result if selected_result.any? || !matches[:code]
+        search full_ref(matches)
+      end
+      def full_ref(matches)
+        ref = "#{matches[:serie]} #{matches[:code]}"
+        ref += long_to_short(matches[:prt1], matches[:prt2]).to_s
+        ref += long_to_short(matches[:vol1], matches[:vol2]).to_s
+        ref
       end
       def match(regex, code)
@@ -192,11 +202,11 @@ module RelatonNist
           (?<code>[0-9-]{3,}[A-Z]?)
           (?<prt1>pt\d+)?
           (?<vol1>v\d+)?
-          (?<ver1>ver[\d\.]+)?
+          (?<ver1>ver[\d.]+)?
           (?<rev1>r\d+)?
           (\s(?<prt2>Part\s\d+))?
           (\s(?<vol2>Vol\.\s\d+))?
-          (\s(?<ver2>(Ver\.|Version)\s[\d\.]+))?
+          (\s(?<ver2>(Ver\.|Version)\s[\d.]+))?
           (\s(?<rev2>Rev\.\s\d+))?
           (\s(?<add>Add)endum)?
         }x =~ item.hit[:code]

data/lib/relaton_nist/processor.rb CHANGED Viewed

@@ -7,6 +7,7 @@ module RelatonNist
       @prefix = "NIST"
       @defaultprefix = %r{^(NIST|NISTGCR|ITL Bulletin|JPCRD|NISTIR|CSRC|FIPS)(/[^\s])?\s}
       @idtype = "NIST"
+      @datasets = %w[nist-tech-pubs]
     end
     # @param code [String]
@@ -17,6 +18,10 @@ module RelatonNist
       ::RelatonNist::NistBibliography.get(code, date, opts)
     end
+    def fetch_data(_source, opts)
+      DataFetcher.fetch(**opts)
+    end
     # @param xml [String]
     # @return [RelatonNist::GbBibliographicItem]
     def from_xml(xml)

data/lib/relaton_nist/scrapper.rb CHANGED Viewed

@@ -11,23 +11,17 @@ module RelatonNist
       # @param hit_data [Hash]
       # @return [Hash]
       def parse_page(hit_data)
-        item_data = if hit_data[:json]
-                      from_json hit_data
-                    else
-                      from_csrs hit_data
-                    end
-        # doctype = "standard"
+        item_data = from_json hit_data
         titles = fetch_titles(hit_data)
         unless /^(SP|NISTIR|FIPS) /.match? item_data[:docid][0].id
-          # doctype = id_cleanup(item_data[:docid][0].id)
           item_data[:docid][0] = RelatonBib::DocumentIdentifier.new(
-            id: titles[0][:content].upcase, type: "NIST"
+            id: titles[0][:content].upcase, type: "NIST",
           )
         end
         item_data[:fetched] = Date.today.to_s
         item_data[:type] = "standard"
         item_data[:title] = titles
-        item_data[:doctype] = "standard" # doctype
+        item_data[:doctype] = "standard"
         NistBibliographicItem.new(**item_data)
       end
@@ -44,7 +38,7 @@ module RelatonNist
           edition: fetch_edition(json),
           language: [json["language"]],
           script: [json["script"]],
-          docstatus: fetch_status(json, hit_data[:status]),
+          docstatus: fetch_status(json), # hit_data[:status]),
           copyright: fetch_copyright(json["published-date"]),
           relation: fetch_relations_json(json),
           place: ["Gaithersburg, MD"],
@@ -53,119 +47,58 @@ module RelatonNist
         }
       end
-      def from_csrs(hit_data)
-        doc = get_page hit_data[:url]
-        {
-          # id: fetch_id(doc),
-          link: fetch_link(doc),
-          docid: fetch_docid(doc),
-          date: fetch_dates(doc, hit_data[:release_date]),
-          contributor: fetch_contributors(doc),
-          edition: fetch_edition(hit_data[:code]),
-          language: ["en"],
-          script: ["Latn"],
-          abstract: fetch_abstract(doc),
-          docstatus: fetch_status(doc, hit_data[:status]),
-          copyright: fetch_copyright(doc),
-          relation: fetch_relations(doc),
-          series: fetch_series(doc),
-          keyword: fetch_keywords(doc),
-          commentperiod: fetch_commentperiod(doc),
-        }
-      end
       # rubocop:enable Metrics/AbcSize, Metrics/MethodLength
-      # Strip status from doc id
-      # @param id String
-      # @return String
-      # def id_cleanup(id)
-      #   id.sub(/ \(WITHDRAWN\)/, "").sub(/ \(([^) ]+ )?DRAFT\)/i, "")
-      # end
-      # Get page.
-      # @param path [String] page's path
-      # @return [Array<Nokogiri::HTML::Document, String>]
-      def get_page(url)
-        uri = URI url
-        resp = Net::HTTP.get_response(uri)
-        %r{(?<=newLocation = 'https://' \+ window.location.hostname \+ ')(?<path>[^']+)} =~ resp.body
-        if path
-          uri = URI HitCollection::DOMAIN + path
-          resp = Net::HTTP.get_response(uri)
-        end
-        Nokogiri::HTML(resp.body)
-      rescue SocketError, Timeout::Error, Errno::EINVAL, Errno::ECONNRESET,
-             EOFError, Net::HTTPBadResponse, Net::HTTPHeaderSyntaxError,
-             Net::ProtocolError, OpenSSL::SSL::SSLError
-        raise RelatonBib::RequestError, "Could not access #{url}"
-      end
       # Fetch docid.
-      # @param doc [Nokogiri::HTML::Document, String]
+      # @param docid [String]
       # @return [Array<RelatonBib::DocumentIdentifier>]
-      def fetch_docid(doc)
-        item_ref = if doc.is_a? String then doc
-                   else
-                     doc.at(
-                       "//div[contains(@class, 'publications-detail')]/h3"
-                     )&.text&.strip&.sub(/(?<=\w)\([^\)]+\)$/) do |m|
-                       " " + m.upcase
-                     end&.squeeze(" ")&.gsub(/&#13;|\n|\r/, "")
-                   end
-        item_ref ||= "?"
-        item_ref.sub! /\sAddendum$/, "-Add"
+      def fetch_docid(docid)
+        item_ref = docid
+        # item_ref ||= "?"
+        item_ref.sub!(/\sAddendum$/, "-Add")
         [RelatonBib::DocumentIdentifier.new(id: item_ref, type: "NIST")]
       end
-      # Fetch id.
-      # @param doc [Nokogiri::HTML::Document]
-      # @return [String]
-      # def fetch_id(doc)
-      #   doc.at("//div[contains(@class, 'publications-detail')]/h3").text.
-      #     strip.gsub(/\s/, "")
-      # end
       # Fetch status.
-      # @param doc [Nokogiri::HTML::Document, Hash]
-      # @param status [String]
+      # @param doc [Hash]
       # @return [RelatonNist::DocumentStatus]
-      def fetch_status(doc, status)
-        if doc.is_a? Hash
-          stage = doc["status"]
-          subst = doc["substage"]
-          iter = doc["iteration"] == "initial" ? 1 : doc["iteration"]
-        else
-          case status
-          when "draft (obsolete)"
-            stage = "draft-public"
-            subst = "withdrawn"
-          when "retired draft"
-            stage = "draft-public"
-            subst = "retired"
-          when "withdrawn"
-            stage = "final"
-            subst = "withdrawn"
-          when /^draft/
-            stage = "draft-public"
-            subst = "active"
-          else
-            stage = status
-            subst = "active"
-          end
-          iter = nil
-          if stage.include? "draft"
-            iter = 1
-            history = doc.xpath("//span[@id='pub-history-container']/a"\
-                                "|//span[@id='pub-history-container']/span")
-            history.each_with_index do |h, idx|
-              next if h.name == "a"
-              iter = idx + 1 if idx.positive?
-              break
-            end
-          end
-        end
+      def fetch_status(doc) # , status)
+        # if doc.is_a? Hash
+        stage = doc["status"]
+        subst = doc["substage"]
+        iter = doc["iteration"] == "initial" ? 1 : doc["iteration"]
+        # else
+        #   case status
+        #   when "draft (obsolete)"
+        #     stage = "draft-public"
+        #     subst = "withdrawn"
+        #   when "retired draft"
+        #     stage = "draft-public"
+        #     subst = "retired"
+        #   when "withdrawn"
+        #     stage = "final"
+        #     subst = "withdrawn"
+        #   when /^draft/
+        #     stage = "draft-public"
+        #     subst = "active"
+        #   else
+        #     stage = status
+        #     subst = "active"
+        #   end
+        #   iter = nil
+        #   if stage.include? "draft"
+        #     iter = 1
+        #     history = doc.xpath("//span[@id='pub-history-container']/a"\
+        #                         "|//span[@id='pub-history-container']/span")
+        #     history.each_with_index do |h, idx|
+        #       next if h.name == "a"
+        #       iter = idx + 1 if idx.positive?
+        #       break
+        #     end
+        #   end
+        # end
         RelatonNist::DocumentStatus.new stage: stage, substage: subst, iteration: iter.to_s
       end
@@ -179,49 +112,49 @@ module RelatonNist
       end
       # Fetch dates
-      # @param doc [Nokogiri::HTML::Document]
+      # @param doc [Hash]
       # @param release_date [Date]
       # @return [Array<Hash>]
       def fetch_dates(doc, release_date) # rubocop:disable Metrics/AbcSize,Metrics/MethodLength
         dates = [{ type: "published", on: release_date.to_s }]
-        if doc.is_a? Hash
-          issued = RelatonBib.parse_date doc["issued-date"]
-          updated = RelatonBib.parse_date doc["updated-date"]
-          dates << { type: "updated", on: updated.to_s } if updated
-          obsoleted = RelatonBib.parse_date doc["obsoleted-date"]
-          dates << { type: "obsoleted", on: obsoleted.to_s } if obsoleted
-        else
-          d = doc.at("//span[@id='pub-release-date']")&.text&.strip
-          issued = RelatonBib.parse_date d
-        end
+        # if doc.is_a? Hash
+        issued = RelatonBib.parse_date doc["issued-date"]
+        updated = RelatonBib.parse_date doc["updated-date"]
+        dates << { type: "updated", on: updated.to_s } if updated
+        obsoleted = RelatonBib.parse_date doc["obsoleted-date"]
+        dates << { type: "obsoleted", on: obsoleted.to_s } if obsoleted
+        # else
+        #   d = doc.at("//span[@id='pub-release-date']")&.text&.strip
+        #   issued = RelatonBib.parse_date d
+        # end
         dates << { type: "issued", on: issued.to_s }
         dates
       end
       # rubocop:disable Metrics/AbcSize, Metrics/MethodLength
-      # @param doc [Nokogiri::HTML::Document, Hash]
+      # @param doc [Hash]
       # @return [Array<RelatonBib::ContributionInfo>]
       def fetch_contributors(doc)
         contribs = []
-        if doc.is_a? Hash
-          contribs += contributors_json(
-            doc["authors"], "author", doc["language"], doc["script"]
-          )
-          contribs + contributors_json(
-            doc["editors"], "editor", doc["language"], doc["script"]
-          )
-        else
-          name = "National Institute of Standards and Technology"
-          org = RelatonBib::Organization.new(
-            name: name, url: "www.nist.gov", abbreviation: "NIST",
-          )
-          contribs << RelatonBib::ContributionInfo.new(entity: org, role: [type: "publisher"])
-          authors = doc.at('//h4[.="Author(s)"]/following-sibling::p')
-          contribs += contributors(authors, "author")
-          editors = doc.at('//h4[.="Editor(s)"]/following-sibling::p')
-          contribs + contributors(editors, "editor")
-        end
+        # if doc.is_a? Hash
+        contribs += contributors_json(
+          doc["authors"], "author", doc["language"], doc["script"]
+        )
+        contribs + contributors_json(
+          doc["editors"], "editor", doc["language"], doc["script"]
+        )
+        # else
+        #   name = "National Institute of Standards and Technology"
+        #   org = RelatonBib::Organization.new(
+        #     name: name, url: "www.nist.gov", abbreviation: "NIST",
+        #   )
+        #   contribs << RelatonBib::ContributionInfo.new(entity: org, role: [type: "publisher"])
+        #   authors = doc.at('//h4[.="Author(s)"]/following-sibling::p')
+        #   contribs += contributors(authors, "author")
+        #   editors = doc.at('//h4[.="Editor(s)"]/following-sibling::p')
+        #   contribs + contributors(editors, "editor")
+        # end
       end
       # @param doc [Array<Hash>]
@@ -256,37 +189,37 @@ module RelatonNist
       # @param doc [Nokogiri::HTML::Element, Array<Hash>]
       # @param role [String]
       # @return [Array<RelatonBib::ContributionInfo>]
-      def contributors(doc, role, lang = "en", script = "Latn")
-        return [] if doc.nil?
-        doc.text.split(", ").map do |contr|
-          /(?<an>.+?)(\s+\((?<abbrev>.+?)\))?$/ =~ contr.strip
-          if abbrev && an.downcase !~ /(task|force|group)/ && an.split.size.between?(2, 3)
-            fullname = RelatonBib::FullName.new(
-              completename: RelatonBib::LocalizedString.new(an, lang, script)
-            )
-            case abbrev
-            when "NIST"
-              org_name = "National Institute of Standards and Technology"
-              url = "www.nist.gov"
-            when "MITRE"
-              org_name = abbrev
-              url = "www.mitre.org"
-            else
-              org_name = abbrev
-              url = nil
-            end
-            org = RelatonBib::Organization.new name: org_name, url: url, abbreviation: abbrev
-            affiliation = RelatonBib::Affiliation.new organization: org
-            entity = RelatonBib::Person.new(
-              name: fullname, affiliation: [affiliation],
-            )
-          else
-            entity = RelatonBib::Organization.new name: an, abbreviation: abbrev
-          end
-          RelatonBib::ContributionInfo.new entity: entity, role: [type: role]
-        end
-      end
+      # def contributors(doc, role, lang = "en", script = "Latn")
+      #   return [] if doc.nil?
+      #   doc.text.split(", ").map do |contr|
+      #     /(?<an>.+?)(\s+\((?<abbrev>.+?)\))?$/ =~ contr.strip
+      #     if abbrev && an.downcase !~ /(task|force|group)/ && an.split.size.between?(2, 3)
+      #       fullname = RelatonBib::FullName.new(
+      #         completename: RelatonBib::LocalizedString.new(an, lang, script)
+      #       )
+      #       case abbrev
+      #       when "NIST"
+      #         org_name = "National Institute of Standards and Technology"
+      #         url = "www.nist.gov"
+      #       when "MITRE"
+      #         org_name = abbrev
+      #         url = "www.mitre.org"
+      #       else
+      #         org_name = abbrev
+      #         url = nil
+      #       end
+      #       org = RelatonBib::Organization.new name: org_name, url: url, abbreviation: abbrev
+      #       affiliation = RelatonBib::Affiliation.new organization: org
+      #       entity = RelatonBib::Person.new(
+      #         name: fullname, affiliation: [affiliation],
+      #       )
+      #     else
+      #       entity = RelatonBib::Organization.new name: an, abbreviation: abbrev
+      #     end
+      #     RelatonBib::ContributionInfo.new entity: entity, role: [type: role]
+      #   end
+      # end
       # rubocop:enable Metrics/CyclomaticComplexity, Metrics/AbcSize, Metrics/MethodLength
       # @param name [Hash]
@@ -313,16 +246,16 @@ module RelatonNist
         [RelatonBib::LocalizedString.new(part, lang, script)]
       end
-      # @param doc [String, Hash]
+      # @param doc [Hash]
       # @return [String, NilClass]
       def fetch_edition(doc)
-        if doc.is_a? Hash
-          return unless doc["edition"]
+        # if doc.is_a? Hash
+        return unless doc["edition"]
-          rev = doc["edition"]
-        else
-          return unless /(?<=Rev\.\s)(?<rev>\d+)/ =~ doc
-        end
+        rev = doc["edition"]
+        # else
+        #   return unless /(?<=Rev\.\s)(?<rev>\d+)/ =~ doc
+        # end
         "Revision #{rev}"
       end
@@ -330,17 +263,17 @@ module RelatonNist
       # Fetch abstracts.
       # @param doc [Nokigiri::HTML::Document]
       # @return [Array<Hash>]
-      def fetch_abstract(doc)
-        abstract_content = doc.xpath(
-          '//div[contains(@class, "pub-abstract-callout")]/div[1]/p',
-        ).text
-        [{
-          content: abstract_content,
-          language: "en",
-          script: "Latn",
-          format: "text/plain",
-        }]
-      end
+      # def fetch_abstract(doc)
+      #   abstract_content = doc.xpath(
+      #     '//div[contains(@class, "pub-abstract-callout")]/div[1]/p',
+      #   ).text
+      #   [{
+      #     content: abstract_content,
+      #     language: "en",
+      #     script: "Latn",
+      #     format: "text/plain",
+      #   }]
+      # end
       # Fetch copyright.
       # @param doc [Nokogiri::HTL::Document, String]
@@ -348,30 +281,30 @@ module RelatonNist
       def fetch_copyright(doc)
         name = "National Institute of Standards and Technology"
         url = "www.nist.gov"
-        d = if doc.is_a? String then doc
-            else
-              doc.at("//span[@id='pub-release-date']")&.text&.strip
-            end
-        from = d&.match(/\d{4}/)&.to_s
+        # d = if doc.is_a? String then doc
+        #     else
+        #       doc.at("//span[@id='pub-release-date']")&.text&.strip
+        #     end
+        from = doc&.match(/\d{4}/)&.to_s
         [{ owner: [{ name: name, abbreviation: "NIST", url: url }], from: from }]
       end
       # rubocop:disable Metrics/MethodLength, Metrics/AbcSize
       # Fetch links.
-      # @param doc [Nokogiri::HTML::Document, Hash]
+      # @param doc [Hash]
       # @return [Array<Hash>]
       def fetch_link(doc)
         links = []
-        if doc.is_a? Hash
-          links << { type: "uri", content: doc["uri"] } if doc["uri"]
-          doi = "https://doi.org/" + doc["doi"] if doc["doi"]
-        else
-          pub = doc.at "//p/strong[contains(., 'Publication:')]"
-          pdf = pub&.at "./following-sibling::a[.=' Local Download']"
-          doi = pub&.at("./following-sibling::a[contains(.,'(DOI)')]")&.attr :href
-          links << { type: "pdf", content: pdf[:href] } if pdf
-        end
+        # if doc.is_a? Hash
+        links << { type: "uri", content: doc["uri"] } if doc["uri"]
+        doi = "https://doi.org/" + doc["doi"] if doc["doi"]
+        # else
+        #   pub = doc.at "//p/strong[contains(., 'Publication:')]"
+        #   pdf = pub&.at "./following-sibling::a[.=' Local Download']"
+        #   doi = pub&.at("./following-sibling::a[contains(.,'(DOI)')]")&.attr :href
+        #   links << { type: "pdf", content: pdf[:href] } if pdf
+        # end
         links << { type: "doi", content: doi } if doi
         links
       end
@@ -380,19 +313,19 @@ module RelatonNist
       # Fetch relations.
       # @param doc [Nokogiri::HTML::Document]
       # @return [Array<RelatonNist::DocumentRelation>]
-      def fetch_relations(doc)
-        relations = doc.xpath('//span[@id="pub-supersedes-container"]/a').map do |r|
-          doc_relation "supersedes", r.text, DOMAIN + r[:href]
-        end
-        relations += doc.xpath('//span[@id="pub-part-container"]/a').map do |r|
-          doc_relation "partOf", r.text, DOMAIN + r[:href]
-        end
-        relations + doc.xpath('//span[@id="pub-related-container"]/a').map do |r|
-          doc_relation "updates", r.text, DOMAIN + r[:href]
-        end
-      end
+      # def fetch_relations(doc)
+      #   relations = doc.xpath('//span[@id="pub-supersedes-container"]/a').map do |r|
+      #     doc_relation "supersedes", r.text, DOMAIN + r[:href]
+      #   end
+      #   relations += doc.xpath('//span[@id="pub-part-container"]/a').map do |r|
+      #     doc_relation "partOf", r.text, DOMAIN + r[:href]
+      #   end
+      #   relations + doc.xpath('//span[@id="pub-related-container"]/a').map do |r|
+      #     doc_relation "updates", r.text, DOMAIN + r[:href]
+      #   end
+      # end
       # rubocop:enable Metrics/AbcSize
       def fetch_relations_json(doc)
@@ -425,62 +358,62 @@ module RelatonNist
       # @param doc [Nokogiri::HTML::Document]
       # @return [Array<RelatonBib::Series>]
-      def fetch_series(doc)
-        series = doc.xpath "//span[@id='pub-history-container']/a"\
-          "|//span[@id='pub-history-container']/span"
-        series.map.with_index do |s, idx|
-          next if s.name == "span"
-          iter = if idx.zero? then "I"
-                 else idx + 1
-                 end
-          content = s.text.match(/^[^\(]+/).to_s.strip.squeeze " "
-          ref = case s.text
-                when /^Draft/
-                  content.match(/(?<=Draft\s).+/).to_s + " (#{iter}PD)"
-                when /\(Draft\)/ then content + " (#{iter}PD)"
-                else content
-                end
-          fref = RelatonBib::FormattedRef.new(
-            content: ref, language: "en", script: "Latn", format: "text/plain",
-          )
-          RelatonBib::Series.new(formattedref: fref)
-        end.select { |s| s }
-      end
+      # def fetch_series(doc)
+      #   series = doc.xpath "//span[@id='pub-history-container']/a"\
+      #     "|//span[@id='pub-history-container']/span"
+      #   series.map.with_index do |s, idx|
+      #     next if s.name == "span"
+      #     iter = if idx.zero? then "I"
+      #            else idx + 1
+      #            end
+      #     content = s.text.match(/^[^\(]+/).to_s.strip.squeeze " "
+      #     ref = case s.text
+      #           when /^Draft/
+      #             content.match(/(?<=Draft\s).+/).to_s + " (#{iter}PD)"
+      #           when /\(Draft\)/ then content + " (#{iter}PD)"
+      #           else content
+      #           end
+      #     fref = RelatonBib::FormattedRef.new(
+      #       content: ref, language: "en", script: "Latn", format: "text/plain",
+      #     )
+      #     RelatonBib::Series.new(formattedref: fref)
+      #   end.select { |s| s }
+      # end
       # rubocop:enable Metrics/MethodLength, Metrics/AbcSize
-      # @param doc [Nokogiri::HTML::Document, Hash]
+      # @param doc [Hash]
       # @return [Array<RelatonNist::Keyword>]
       def fetch_keywords(doc)
-        kws = if doc.is_a? Hash
-                doc["keywords"]
-              else
-                doc.xpath "//span[@id='pub-keywords-container']/span"
-              end
-        kws.map { |kw| kw.is_a?(String) ? kw : kw.text }
+        # kws = if doc.is_a? Hash
+        #         doc["keywords"]
+        #       else
+        #         doc.xpath "//span[@id='pub-keywords-container']/span"
+        #       end
+        doc["keywords"].map { |kw| kw.is_a?(String) ? kw : kw.text }
       end
       # rubocop:disable Metrics/AbcSize
       # @param doc [Nokogiri::HTML::Document]
       # @return [RelatonNist::CommentPeriod, NilClass]
-      def fetch_commentperiod(doc)
-        cp = doc.at "//span[@id='pub-comments-due']"
-        return unless cp
+      # def fetch_commentperiod(doc)
+      #   cp = doc.at "//span[@id='pub-comments-due']"
+      #   return unless cp
-        to = Date.strptime cp.text.strip, "%B %d, %Y"
+      #   to = Date.strptime cp.text.strip, "%B %d, %Y"
-        d = doc.at("//span[@id='pub-release-date']").text.strip
-        from = Date.strptime(d, "%B %Y").to_s
+      #   d = doc.at("//span[@id='pub-release-date']").text.strip
+      #   from = Date.strptime(d, "%B %Y").to_s
-        ex = doc.at "//strong[contains(.,'The comment closing date has been "\
-        "extended to')]"
-        ext = ex&.text&.match(/\w+\s\d{2},\s\d{4}/).to_s
-        extended = ext.empty? ? nil : Date.strptime(ext, "%B %d, %Y")
-        CommentPeriod.new from: from, to: to, extended: extended
-      end
+      #   ex = doc.at "//strong[contains(.,'The comment closing date has been "\
+      #   "extended to')]"
+      #   ext = ex&.text&.match(/\w+\s\d{2},\s\d{4}/).to_s
+      #   extended = ext.empty? ? nil : Date.strptime(ext, "%B %d, %Y")
+      #   CommentPeriod.new from: from, to: to, extended: extended
+      # end
       # rubocop:enable Metrics/AbcSize
       # @param json [Hash]