RubyGems - metanorma-standoc - Versions diffs - 1.10.5 → 1.11.0 - Mend

metanorma-standoc 1.10.5 → 1.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (66)

checksums.yaml +4 -4
data/README.adoc +19 -23
data/Rakefile +1 -1
data/lib/asciidoctor/standoc/base.rb +14 -17
data/lib/asciidoctor/standoc/basicdoc.rng +21 -4
data/lib/asciidoctor/standoc/blocks.rb +26 -23
data/lib/asciidoctor/standoc/blocks_notes.rb +17 -22
data/lib/asciidoctor/standoc/cleanup.rb +46 -12
data/lib/asciidoctor/standoc/cleanup_block.rb +5 -70
data/lib/asciidoctor/standoc/cleanup_image.rb +6 -7
data/lib/asciidoctor/standoc/cleanup_inline.rb +44 -102
data/lib/asciidoctor/standoc/cleanup_maths.rb +5 -6
data/lib/asciidoctor/standoc/cleanup_ref.rb +5 -0
data/lib/asciidoctor/standoc/cleanup_reqt.rb +51 -33
data/lib/asciidoctor/standoc/cleanup_section_names.rb +5 -5
data/lib/asciidoctor/standoc/cleanup_symbols.rb +48 -0
data/lib/asciidoctor/standoc/cleanup_table.rb +68 -0
data/lib/asciidoctor/standoc/cleanup_terms.rb +38 -78
data/lib/asciidoctor/standoc/cleanup_terms_designations.rb +162 -0
data/lib/asciidoctor/standoc/cleanup_text.rb +5 -2
data/lib/asciidoctor/standoc/cleanup_xref.rb +107 -0
data/lib/asciidoctor/standoc/converter.rb +15 -0
data/lib/asciidoctor/standoc/inline.rb +7 -5
data/lib/asciidoctor/standoc/isodoc.rng +435 -78
data/lib/asciidoctor/standoc/lists.rb +15 -15
data/lib/asciidoctor/standoc/macros.rb +14 -43
data/lib/asciidoctor/standoc/macros_note.rb +45 -0
data/lib/asciidoctor/standoc/macros_plantuml.rb +29 -14
data/lib/asciidoctor/standoc/macros_terms.rb +82 -20
data/lib/asciidoctor/standoc/ref_sect.rb +24 -17
data/lib/asciidoctor/standoc/reqt.rb +2 -2
data/lib/asciidoctor/standoc/reqt.rng +23 -2
data/lib/asciidoctor/standoc/term_lookup_cleanup.rb +50 -11
data/lib/asciidoctor/standoc/terms.rb +21 -3
data/lib/asciidoctor/standoc/utils.rb +36 -23
data/lib/asciidoctor/standoc/validate.rb +45 -27
data/lib/asciidoctor/standoc/validate_section.rb +5 -2
data/lib/metanorma/standoc/version.rb +1 -1
data/metanorma-standoc.gemspec +1 -1
data/spec/asciidoctor/base_spec.rb +4 -36
data/spec/asciidoctor/blank_spec.rb +37 -0
data/spec/asciidoctor/blocks_spec.rb +296 -47
data/spec/asciidoctor/cleanup_blocks_spec.rb +1018 -0
data/spec/asciidoctor/cleanup_sections_spec.rb +153 -12
data/spec/asciidoctor/cleanup_spec.rb +179 -1265
data/spec/asciidoctor/cleanup_terms_spec.rb +990 -0
data/spec/asciidoctor/inline_spec.rb +38 -2
data/spec/asciidoctor/lists_spec.rb +6 -6
data/spec/asciidoctor/macros_plantuml_spec.rb +37 -2
data/spec/asciidoctor/macros_spec.rb +226 -138
data/spec/asciidoctor/refs_spec.rb +4 -26
data/spec/asciidoctor/section_spec.rb +18 -18
data/spec/asciidoctor/validate_spec.rb +109 -1
data/spec/assets/xref_error.adoc +1 -0
data/spec/fixtures/datamodel_description_sections_tree.xml +327 -326
data/spec/spec_helper.rb +6 -7
data/spec/vcr_cassettes/dated_iso_ref_joint_iso_iec.yml +51 -51
data/spec/vcr_cassettes/dated_iso_ref_joint_iso_iec1.yml +13 -13
data/spec/vcr_cassettes/isobib_get_123.yml +13 -13
data/spec/vcr_cassettes/isobib_get_123_1.yml +26 -26
data/spec/vcr_cassettes/isobib_get_123_1_fr.yml +34 -34
data/spec/vcr_cassettes/isobib_get_123_2001.yml +12 -12
data/spec/vcr_cassettes/isobib_get_124.yml +13 -13
data/spec/vcr_cassettes/rfcbib_get_rfc8341.yml +16 -16
data/spec/vcr_cassettes/separates_iev_citations_by_top_level_clause.yml +51 -49
metadata +13 -5

data/lib/asciidoctor/standoc/cleanup_image.rb CHANGED Viewed

@@ -15,9 +15,8 @@ module Asciidoctor
       def svgmap_moveattrs(xmldoc)
         xmldoc.xpath("//svgmap").each do |s|
           f = s.at(".//figure") or next
-          if (t = s.at("./name")) && !f.at("./name")
+          (t = s.at("./name")) && !f.at("./name") and
             f.children.first.previous = t.remove
-          end
           if s["id"] && guid?(f["id"])
             f["id"] = s["id"]
             s.delete("id")
@@ -26,13 +25,13 @@ module Asciidoctor
         end
       end
-      def svgmap_moveattrs1(s, f)
+      def svgmap_moveattrs1(svgmap, figure)
         %w(unnumbered number subsequence keep-with-next
-           keep-lines-together).each do |a|
-          next if f[a] || !s[a]
+           keep-lines-together tag multilingual-rendering).each do |a|
+          next if figure[a] || !svgmap[a]
-          f[a] = s[a]
-          s.delete(a)
+          figure[a] = svgmap[a]
+          svgmap.delete(a)
         end
       end

data/lib/asciidoctor/standoc/cleanup_inline.rb CHANGED Viewed

@@ -1,4 +1,5 @@
 require "metanorma-utils"
+require "digest"
 module Asciidoctor
   module Standoc
@@ -55,114 +56,30 @@ module Asciidoctor
         end
       end
-      # extending localities to cover ISO referencing
-      LOCALITY_REGEX_STR = <<~REGEXP.freeze
-        ^((?<locality>section|clause|part|paragraph|chapter|page|
-                      table|annex|figure|example|note|formula|list|time|anchor|
-                      locality:[^ \\t\\n\\r:,;=]+)(\\s+|=)
-               (?<ref>[^"][^ \\t\\n,:-]*|"[^"]+")
-                 (-(?<to>[^"][^ \\t\\n,:-]*|"[^"]"))?|
-          (?<locality2>whole|locality:[^ \\t\\n\\r:,;=]+))(?<punct>[,:;]?)\\s*
-         (?<text>.*)$
-      REGEXP
-      LOCALITY_RE = Regexp.new(LOCALITY_REGEX_STR.gsub(/\s/, ""),
-                               Regexp::IGNORECASE | Regexp::MULTILINE)
-      def tq(text)
-        text.sub(/^"/, "").sub(/"$/, "")
-      end
-      def extract_localities(elem)
-        f = elem&.children&.first or return
-        f.text? or return
-        head = f.remove.text
-        tail = elem&.children&.remove
-        extract_localities1(elem, head)
-        tail and elem << tail
-      end
-      def extract_localities1(elem, text)
-        b = elem.add_child("<localityStack/>").first if LOCALITY_RE.match text
-        while (m = LOCALITY_RE.match text)
-          ref = m[:ref] ? "<referenceFrom>#{tq m[:ref]}</referenceFrom>" : ""
-          refto = m[:to] ? "<referenceTo>#{tq m[:to]}</referenceTo>" : ""
-          loc = m[:locality]&.downcase || m[:locality2]&.downcase
-          b.add_child("<locality type='#{loc}'>#{ref}#{refto}</locality>")
-          text = m[:text]
-          b = elem.add_child("<localityStack/>").first if m[:punct] == ";"
-        end
-        elem.add_child(text) if text
-      end
-      def xref_to_eref(elem)
-        elem["bibitemid"] = elem["target"]
-        unless elem["citeas"] = @anchors&.dig(elem["target"], :xref)
-          @internal_eref_namespaces.include?(elem["type"]) or
-            @log.add("Crossreferences", elem,
-                     "#{elem['target']} does not have a corresponding "\
-                     "anchor ID in the bibliography!")
-        end
-        elem.delete("target")
-        extract_localities(elem) unless elem.children.empty?
-      end
-      def xref_cleanup(xmldoc)
-        xmldoc.xpath("//xref").each do |x|
-          /:/.match(x["target"]) and xref_to_internal_eref(x)
-          next unless x.name == "xref"
-          if refid? x["target"]
-            x.name = "eref"
-            xref_to_eref(x)
-          else x.delete("type")
-          end
-        end
-      end
-      def xref_to_internal_eref(elem)
-        a = elem["target"].split(":", 3)
-        unless a.size < 2 || a[0].empty? || a[1].empty?
-          elem["target"] = "#{a[0]}_#{a[1]}"
-          a.size > 2 and
-            elem.children = %{anchor="#{a[2..-1].join}",#{elem&.children&.text}}
-          elem["type"] = a[0]
-          @internal_eref_namespaces << a[0]
-          elem.name = "eref"
-          xref_to_eref(elem)
-        end
-      end
-      def quotesource_cleanup(xmldoc)
-        xmldoc.xpath("//quote/source | //terms/source").each do |x|
-          xref_to_eref(x)
+      def concept_cleanup(xmldoc)
+        xmldoc.xpath("//concept[not(termxref)]").each do |x|
+          term = x.at("./refterm")
+          term&.remove if term&.text&.empty?
+          concept_cleanup1(x)
         end
       end
-      def origin_cleanup(xmldoc)
-        xmldoc.xpath("//origin/concept[termref]").each do |x|
-          t = x.at("./termref")
-          x.replace(t)
-        end
-        xmldoc.xpath("//origin").each do |x|
-          x["citeas"] = @anchors&.dig(x["bibitemid"], :xref) or
-            @log.add("Crossreferences", x,
-                     "#{x['bibitemid']} does not have a corresponding anchor "\
-                     "ID in the bibliography!")
-          extract_localities(x) unless x.children.empty?
+      def concept_cleanup1(elem)
+        elem.children.remove if elem&.children&.text&.strip&.empty?
+        key_extract_locality(elem)
+        if /:/.match?(elem["key"]) then concept_termbase_cleanup(elem)
+        elsif refid? elem["key"] then concept_eref_cleanup(elem)
+        else concept_xref_cleanup(elem)
         end
+        elem.delete("key")
       end
-      def concept_cleanup(xmldoc)
-        xmldoc.xpath("//concept[not(termxref)]").each do |x|
+      def related_cleanup(xmldoc)
+        xmldoc.xpath("//related[not(termxref)]").each do |x|
           term = x.at("./refterm")
-          term&.remove if term&.text&.empty?
-          x.children.remove if x&.children&.text&.strip&.empty?
-          key_extract_locality(x)
-          if /:/.match?(x["key"]) then concept_termbase_cleanup(x)
-          elsif refid? x["key"] then concept_eref_cleanup(x)
-          else concept_xref_cleanup(x)
-          end
-          x.delete("key")
+          term.replace("<preferred>#{term_expr(term.children.to_xml)}"\
+                       "</preferred>")
+          concept_cleanup1(x)
         end
       end
@@ -203,11 +120,13 @@ module Asciidoctor
       end
       IDREF = "//*/@id | //review/@from | //review/@to | "\
-        "//callout/@target | //citation/@bibitemid | //eref/@bibitemid".freeze
+              "//callout/@target | //citation/@bibitemid | "\
+              "//eref/@bibitemid".freeze
       def anchor_cleanup(elem)
         anchor_cleanup1(elem)
         xreftarget_cleanup(elem)
+        contenthash_id_cleanup(elem)
       end
       def anchor_cleanup1(elem)
@@ -233,6 +152,29 @@ module Asciidoctor
           end
         end
       end
+      def guid?(str)
+        /^_[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/
+          .match?(str)
+      end
+      def contenthash_id_cleanup(doc)
+        ids = doc.xpath("//*[@id]").each_with_object({}) do |x, m|
+          next unless guid?(x["id"])
+          m[x["id"]] = contenthash(x)
+          x["id"] = m[x["id"]]
+        end
+        [%w(review from), %(review to), %(callout target), %(eref bibitemid),
+         %(citation bibitemid), %(xref target), %(xref to)].each do |a|
+          doc.xpath("//#{a[0]}").each { |x| ids[a[1]] and x[a[1]] = ids[a[1]] }
+        end
+      end
+      def contenthash(elem)
+        Digest::MD5.hexdigest("#{elem.path}////#{elem.text}")
+          .sub(/^(.{8})(.{4})(.{4})(.{4})(.{12})$/, "_\\1-\\2-\\3-\\4-\\5")
+      end
     end
   end
 end

data/lib/asciidoctor/standoc/cleanup_maths.rb CHANGED Viewed

@@ -69,13 +69,12 @@ module Asciidoctor
         return false if char.length > 1
         if /\p{Greek}/.match?(char)
-          /\p{Lower}/.match(char) && !mathml_mi_italics[:lowergreek] ||
-            /\p{Upper}/.match(char) && !mathml_mi_italics[:uppergreek]
+          (/\p{Lower}/.match(char) && !mathml_mi_italics[:lowergreek]) ||
+            (/\p{Upper}/.match(char) && !mathml_mi_italics[:uppergreek])
         elsif /\p{Latin}/.match?(char)
-          /\p{Lower}/.match(char) && !mathml_mi_italics[:lowerroman] ||
-            /\p{Upper}/.match(char) && !mathml_mi_italics[:upperroman]
-        else
-          false
+          (/\p{Lower}/.match(char) && !mathml_mi_italics[:lowerroman]) ||
+            (/\p{Upper}/.match(char) && !mathml_mi_italics[:upperroman])
+        else false
         end
       end

data/lib/asciidoctor/standoc/cleanup_ref.rb CHANGED Viewed

@@ -84,6 +84,11 @@ module Asciidoctor
         biblio_reorder(xmldoc)
         biblio_nested(xmldoc)
         biblio_renumber(xmldoc)
+        biblio_no_ext(xmldoc)
+      end
+      def biblio_no_ext(xmldoc)
+        xmldoc.xpath("//bibitem/ext").each(&:remove)
       end
       def biblio_nested(xmldoc)

data/lib/asciidoctor/standoc/cleanup_reqt.rb CHANGED Viewed

@@ -3,37 +3,61 @@ module Asciidoctor
     module Cleanup
       def requirement_cleanup(xmldoc)
         requirement_metadata(xmldoc)
-        requirement_descriptions(xmldoc)
         requirement_inherit(xmldoc)
+        requirement_descriptions(xmldoc)
       end
       REQRECPER = "//requirement | //recommendation | //permission".freeze
       def requirement_inherit(xmldoc)
         xmldoc.xpath(REQRECPER).each do |r|
-          ins = r.at("./classification") ||
-            r.at("./description | ./measurementtarget | ./specification | "\
-                 "./verification | ./import | ./description | ./requirement | "\
-                 "./recommendation | ./permission | ./component")
+          ins = requirement_inherit_insert(r)
           r.xpath("./*//inherit").each { |i| ins.previous = i }
         end
       end
+      def requirement_inherit_insert(reqt)
+        ins = reqt.at("./classification") || reqt.at(
+          "./description | ./measurementtarget | ./specification | "\
+          "./verification | ./import | ./description | ./component | "\
+          "./requirement | ./recommendation | ./permission",
+        ) and return ins
+        requirement_inherit_insert1(reqt)
+      end
+      def requirement_inherit_insert1(reqt)
+        if t = reqt.at("./title")
+          t.next = " "
+          t.next
+        else
+          if reqt.children.empty? then reqt.add_child(" ")
+          else reqt.children.first.previous = " "
+          end
+          reqt.children.first
+        end
+      end
       def requirement_descriptions(xmldoc)
         xmldoc.xpath(REQRECPER).each do |r|
+          r.xpath(".//p[not(./*)][normalize-space(.)='']").each(&:remove)
           r.children.each do |e|
-            unless e.element? && (reqt_subpart(e.name) ||
-                %w(requirement recommendation permission).include?(e.name))
-              next if e.text.strip.empty?
-              t = Nokogiri::XML::Element.new("description", r)
-              e.before(t)
-              t.children = e.remove
-            end
+            requirement_description_wrap(r, e)
           end
           requirement_description_cleanup1(r)
         end
       end
+      def requirement_description_wrap(reqt, text)
+        return if text.element? && (reqt_subpart(text.name) ||
+                %w(requirement recommendation
+                   permission).include?(text.name)) ||
+          text.text.strip.empty?
+        t = Nokogiri::XML::Element.new("description", reqt)
+        text.before(t)
+        t.children = text.remove
+      end
       def requirement_description_cleanup1(reqt)
         while d = reqt.at("./description[following-sibling::*[1]"\
                           "[self::description]]")
@@ -48,45 +72,39 @@ module Asciidoctor
       def requirement_metadata(xmldoc)
         xmldoc.xpath(REQRECPER).each do |r|
           dl = r&.at("./dl[@metadata = 'true']")&.remove or next
-          requirement_metadata1(r, dl)
+          requirement_metadata1(r, dl, r.at("./title"))
         end
       end
-      def requirement_metadata1(reqt, dlist)
-        unless ins = reqt.at("./title")
+      def requirement_metadata1_tags
+        %w(label subject inherit)
+      end
+      def requirement_metadata1(reqt, dlist, ins)
+        unless ins
           reqt.children.first.previous = " "
           ins = reqt.children.first
         end
-        %w(label subject inherit).each do |a|
-          ins = reqt_dl_to_elems(ins, reqt, dlist, a)
+        %w(obligation model type).each do |a|
+          dl_to_attrs(reqt, dlist, a)
         end
-        reqt_dl_to_classif(ins, reqt, dlist)
-      end
-      def reqt_dl_to_elems(ins, reqt, dlist, name)
-        if a = reqt.at("./#{name}[last()]")
-          ins = a
+        requirement_metadata1_tags.each do |a|
+          ins = dl_to_elems(ins, reqt, dlist, a)
         end
-        dlist.xpath("./dt[text()='#{name}']").each do |e|
-          val = e.at("./following::dd/p") || e.at("./following::dd")
-          val.name = name
-          ins.next = val
-          ins = ins.next
-        end
-        ins
+        reqt_dl_to_classif(ins, reqt, dlist)
       end
       def reqt_dl_to_classif(ins, reqt, dlist)
-        if a = reqt.at("./classification[last()]")
-          ins = a
-        end
+        if a = reqt.at("./classification[last()]") then ins = a end
         dlist.xpath("./dt[text()='classification']").each do |e|
           val = e.at("./following::dd/p") || e.at("./following::dd")
           req_classif_parse(val.text).each do |r|
             ins.next = "<classification><tag>#{r[0]}</tag>"\
                        "<value>#{r[1]}</value></classification>"
+            ins = ins.next
           end
         end
+        ins
       end
     end
   end

data/lib/asciidoctor/standoc/cleanup_section_names.rb CHANGED Viewed

@@ -78,12 +78,12 @@ module Asciidoctor
       def sections_variant_title_cleanup(xml)
         path = SECTION_CONTAINERS.map { |x| "./ancestor::#{x}" }.join(" | ")
         xml.xpath("//p[@variant_title]").each do |p|
+          p.name = "variant-title"
+          p.delete("id")
+          p.delete("variant_title")
           p.xpath("(#{path})[last()]").each do |sect|
-            p.name = "variant-title"
-            p.delete("id")
-            if ins = sect.at("./title") then ins.next = p
-            else sect.children.first.previous = p
-            end
+            ins = sect.at("./title") and ins.next = p or
+              sect.children.first.previous = p
           end
         end
       end

data/lib/asciidoctor/standoc/cleanup_symbols.rb ADDED Viewed

@@ -0,0 +1,48 @@
+module Asciidoctor
+  module Standoc
+    module Cleanup
+      # Indices sort after letter but before any following
+      # letter (x, x_m, x_1, xa); we use colon to force that sort order.
+      # Numbers sort *after* letters; we use thorn to force that sort order.
+      def symbol_key(sym)
+        key = sym.dup
+        key.traverse do |n|
+          n.name == "math" and
+            n.replace(grkletters(MathML2AsciiMath.m2a(n.to_xml)))
+        end
+        ret = Nokogiri::XML(key.to_xml)
+        HTMLEntities.new.decode(ret.text.downcase)
+          .gsub(/[\[\]{}<>()]/, "").gsub(/\s/m, "")
+          .gsub(/[[:punct:]]|[_^]/, ":\\0").gsub(/`/, "")
+          .gsub(/[0-9]+/, "þ\\0")
+      end
+      def grkletters(text)
+        text.gsub(/\b(alpha|beta|gamma|delta|epsilon|zeta|eta|theta|iota|kappa|
+                      lambda|mu|nu|xi|omicron|pi|rho|sigma|tau|upsilon|phi|chi|
+                      psi|omega)\b/xi, "&\\1;")
+      end
+      def extract_symbols_list(dlist)
+        dl_out = []
+        dlist.xpath("./dt | ./dd").each do |dtd|
+          if dtd.name == "dt"
+            dl_out << { dt: dtd.remove, key: symbol_key(dtd) }
+          else
+            dl_out.last[:dd] = dtd.remove
+          end
+        end
+        dl_out
+      end
+      def symbols_cleanup(docxml)
+        docxml.xpath("//definitions/dl").each do |dl|
+          dl_out = extract_symbols_list(dl)
+          dl_out.sort! { |a, b| a[:key] <=> b[:key] || a[:dt] <=> b[:dt] }
+          dl.children = dl_out.map { |d| d[:dt].to_s + d[:dd].to_s }.join("\n")
+        end
+        docxml
+      end
+    end
+  end
+end

data/lib/asciidoctor/standoc/cleanup_table.rb ADDED Viewed

@@ -0,0 +1,68 @@
+module Asciidoctor
+  module Standoc
+    module Cleanup
+      def dl1_table_cleanup(xmldoc)
+        q = "//table/following-sibling::*[1][self::dl]"
+        xmldoc.xpath(q).each do |s|
+          s["key"] == "true" and s.previous_element << s.remove
+        end
+      end
+      # move Key dl after table footer
+      def dl2_table_cleanup(xmldoc)
+        q = "//table/following-sibling::*[1][self::p]"
+        xmldoc.xpath(q).each do |s|
+          if s.text =~ /^\s*key[^a-z]*$/i && s&.next_element&.name == "dl"
+            s.next_element["key"] = "true"
+            s.previous_element << s.next_element.remove
+            s.remove
+          end
+        end
+      end
+      def insert_thead(table)
+        thead = table.at("./thead")
+        return thead unless thead.nil?
+        if tname = table.at("./name")
+          thead = tname.add_next_sibling("<thead/>").first
+          return thead
+        end
+        table.children.first.add_previous_sibling("<thead/>").first
+      end
+      def header_rows_cleanup(xmldoc)
+        xmldoc.xpath("//table[@headerrows]").each do |s|
+          thead = insert_thead(s)
+          (thead.xpath("./tr").size...s["headerrows"].to_i).each do
+            row = s.at("./tbody/tr")
+            row.parent = thead
+          end
+          thead.xpath(".//td").each { |n| n.name = "th" }
+          s.delete("headerrows")
+        end
+      end
+      def table_cleanup(xmldoc)
+        dl1_table_cleanup(xmldoc)
+        dl2_table_cleanup(xmldoc)
+        notes_table_cleanup(xmldoc)
+        header_rows_cleanup(xmldoc)
+      end
+      # move notes into table
+      def notes_table_cleanup(xmldoc)
+        nomatches = false
+        until nomatches
+          nomatches = true
+          xmldoc.xpath("//table/following-sibling::*[1]"\
+                       "[self::note[not(@keep-separate = 'true')]]").each do |n|
+            n.delete("keep-separate")
+            n.previous_element << n.remove
+            nomatches = false
+          end
+        end
+      end
+    end
+  end
+end