RubyGems - isodoc - Versions diffs - 0.4.5 → 0.5.5 - Mend

isodoc 0.4.5 → 0.5.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31)

checksums.yaml +4 -4
data/bin/rspec +18 -0
data/isodoc.gemspec +1 -1
data/lib/isodoc.rb +34 -5
data/lib/isodoc/blocks.rb +62 -50
data/lib/isodoc/cleanup.rb +34 -10
data/lib/isodoc/html.rb +31 -16
data/lib/isodoc/i18n-en.yaml +72 -0
data/lib/isodoc/i18n-fr.yaml +65 -0
data/lib/isodoc/i18n-zh-Hans.yaml +64 -0
data/lib/isodoc/i18n.rb +90 -0
data/lib/isodoc/inline.rb +25 -18
data/lib/isodoc/iso2wordhtml.rb +30 -7
data/lib/isodoc/lists.rb +29 -9
data/lib/isodoc/metadata.rb +54 -38
data/lib/isodoc/notes.rb +32 -32
data/lib/isodoc/postprocessing.rb +65 -46
data/lib/isodoc/references.rb +63 -29
data/lib/isodoc/section.rb +94 -44
data/lib/isodoc/table.rb +19 -19
data/lib/isodoc/terms.rb +5 -6
data/lib/isodoc/utils.rb +48 -5
data/lib/isodoc/version.rb +1 -1
data/lib/isodoc/xref_gen.rb +87 -75
data/spec/isodoc/blocks_spec.rb +618 -0
data/spec/isodoc/lists_spec.rb +227 -0
data/spec/isodoc/section_spec.rb +419 -0
data/spec/isodoc/table_spec.rb +135 -0
data/spec/isodoc/xref_spec.rb +1073 -0
data/spec/spec_helper.rb +26 -0
metadata +17 -6

data/lib/isodoc/utils.rb CHANGED

@@ -1,5 +1,3 @@
-#require "uuidtools"
 module IsoDoc
   class Convert
     def ns(xpath)
@@ -11,7 +9,7 @@ module IsoDoc
     def insert_tab(out, n)
       out.span **attr_code(style: "mso-tab-count:#{n}") do |span|
-        [1..n].each { |i| span << "&#xA0; " }
+        [1..n].each { span << "&#xA0; " }
       end
     end
@@ -31,7 +29,7 @@ module IsoDoc
       STAGE_ABBRS[stage.to_sym] || "??"
     end
-    NOKOHEAD = <<~HERE
+    NOKOHEAD = <<~HERE.freeze
     <!DOCTYPE html SYSTEM
     "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
     <html xmlns="http://www.w3.org/1999/xhtml">
@@ -39,7 +37,6 @@ module IsoDoc
     <body> </body> </html>
     HERE
     # block for processing XML document fragments as XHTML,
     # to allow for HTMLentities
     def noko(&block)
@@ -76,5 +73,51 @@ module IsoDoc
     def from_xhtml(xml)
       xml.to_xml.sub(%r{ xmlns="http://www.w3.org/1999/xhtml"}, "")
     end
+    CLAUSE_ANCESTOR =
+      ".//ancestor::*[local-name() = 'subsection' or "\
+      "local-name() = 'foreword' or "\
+      "local-name() = 'introduction' or local-name() = 'terms' or "\
+      "local-name() = 'clause' or local-name() = 'references' or "\
+      "local-name() = 'annex']/@id".freeze
+    def get_clause_id(node)
+      clause = node.xpath(CLAUSE_ANCESTOR)
+      clause&.last&.text || nil
+    end
+    NOTE_CONTAINER_ANCESTOR =
+      ".//ancestor::*[local-name() = 'subsection' or "\
+      "local-name() = 'foreword' or "\
+      "local-name() = 'introduction' or local-name() = 'terms' or "\
+      "local-name() = 'clause' or local-name() = 'references' or "\
+      "local-name() = 'annex' or local-name() = 'formula' or "\
+      "local-name() = 'table' or local-name() = 'example' or "\
+      "local-name() = 'figure']/@id".freeze
+    def get_note_container_id(node)
+      container = node.xpath(NOTE_CONTAINER_ANCESTOR)
+      container&.last&.text || nil
+    end
+    def sentence_join(array)
+      return "" if array.nil? || array.empty?
+      if array.length == 1
+        array[0]
+      else
+        l10n("#{array[0..-2].join(', ')} #{@and_lbl} #{array.last}")
+      end
+    end
+    # avoid `; avoid {{ (Liquid Templates); avoid [[ (Javascript)
+    def extract_delims(text)
+      @openmathdelim = "(#("
+      @closemathdelim = ")#)"
+      while text.include?(@openmathdelim) || text.include?(@closemathdelim)
+        @openmathdelim += "("
+        @closemathdelim += ")"
+      end
+      [@openmathdelim, @closemathdelim]
+    end
   end
 end

data/lib/isodoc/version.rb CHANGED

@@ -1,3 +1,3 @@
 module IsoDoc
-  VERSION = "0.4.5".freeze
+  VERSION = "0.5.5".freeze
 end

data/lib/isodoc/xref_gen.rb CHANGED

@@ -1,9 +1,5 @@
-#require "isodoc/utils"
 module IsoDoc
   class Convert
-    #include ::IsoDoc::Utils
     @anchors = {}
     def get_anchors
@@ -24,46 +20,78 @@ module IsoDoc
       section_names(d.at(ns("//clause[title = 'Scope']")), "1", 1)
       section_names(d.at(ns(
         "//references[title = 'Normative References']")), "2", 1)
-      section_names(d.at(ns("//terms")), "3", 1)
+      section_names(d.at(ns("//sections/terms")), "3", 1)
       middle_section_asset_names(d)
     end
     def middle_section_asset_names(d)
       middle_sections = "//clause[title = 'Scope'] | "\
-        "//references[title = 'Normative References'] | //terms | "\
-        "//symbols-abbrevs | //clause[parent::sections]"
+        "//foreword | //introduction | "\
+        "//references[title = 'Normative References'] | //sections/terms | "\
+        "//sections/symbols-abbrevs | //clause[parent::sections]"
       sequential_asset_names(d.xpath(ns(middle_sections)))
     end
-    def clause_names(docxml,sect_num)
+    def clause_names(docxml, sect_num)
       q = "//clause[parent::sections][not(xmlns:title = 'Scope')]"
       docxml.xpath(ns(q)).each_with_index do |c, i|
         section_names(c, (i + sect_num).to_s, 1)
       end
     end
+    def termnote_label(n)
+      @termnote_lbl.gsub(/%/, n.to_s)
+    end
     def termnote_anchor_names(docxml)
       docxml.xpath(ns("//term[termnote]")).each do |t|
         t.xpath(ns("./termnote")).each_with_index do |n, i|
-          @anchors[n["id"]] = { label: "Note #{i + 1} to entry",
-                                xref: "#{@anchors[t["id"]][:xref]},"\
-                                "Note #{i + 1}" }
+          @anchors[n["id"]] =
+            { label: termnote_label(i + 1),
+              xref: l10n("#{@anchors[t['id']][:xref]}, "\
+                         "#{@note_xref_lbl} #{i + 1}") }
         end
       end
     end
-    def table_note_anchor_names(docxml)
-      docxml.xpath(ns("//table[note]")).each do |t|
-        t.xpath(ns("./note")).each_with_index do |n, i|
-          @anchors[n["id"]] = { label: "NOTE #{i + 1}",
-                                xref: "#{@anchors[t["id"]][:xref]},"\
-                                "Note #{i + 1}" }
+    SECTIONS_XPATH =
+      "//foreword | //introduction | //sections/terms | //annex | "\
+      "//sections/clause | //references[not(ancestor::references)]".freeze
+    CHILD_NOTES_XPATH =
+      "./*[not(self::xmlns:subsection)]//xmlns:note | ./xmlns:note".freeze
+    def note_anchor_names(sections)
+      sections.each do |s|
+        notes = s.xpath(CHILD_NOTES_XPATH)
+        notes.each_with_index do |n, i|
+          next if @anchors[n["id"]]
+          next if n["id"].nil?
+          idx = notes.size == 1 ? "" : " #{i + 1}"
+          @anchors[n["id"]] = anchor_struct(idx, s, @note_xref_lbl)
+        end
+        note_anchor_names(s.xpath(ns("./subsection")))
+      end
+    end
+    CHILD_EXAMPLES_XPATH =
+      "./*[not(self::xmlns:subsection)]//xmlns:example | "\
+      "./xmlns:example".freeze
+    def example_anchor_names(sections)
+      sections.each do |s|
+        notes = s.xpath(CHILD_EXAMPLES_XPATH)
+        notes.each_with_index do |n, i|
+          next if @anchors[n["id"]]
+          idx = notes.size == 1 ? "" : " #{i + 1}"
+          @anchors[n["id"]] = anchor_struct(idx, s, @example_xref_lbl)
         end
+        example_anchor_names(s.xpath(ns("./subsection")))
       end
     end
     def middle_anchor_names(docxml)
-      symbols_abbrevs = docxml.at(ns("//symbols-abbrevs"))
+      symbols_abbrevs = docxml.at(ns("//sections/symbols-abbrevs"))
       sect_num = 4
       if symbols_abbrevs
         section_names(symbols_abbrevs, sect_num.to_s, 1)
@@ -78,59 +106,65 @@ module IsoDoc
       initial_anchor_names(docxml)
       middle_anchor_names(docxml)
       back_anchor_names(docxml)
-      table_note_anchor_names(docxml)
+      # preempt clause notes with all other types of note
+      note_anchor_names(docxml.xpath(ns("//table | //example | //formula | "\
+                                        "//figure")))
+      note_anchor_names(docxml.xpath(ns(SECTIONS_XPATH)))
+      example_anchor_names(docxml.xpath(ns(SECTIONS_XPATH)))
     end
     def sequential_figure_names(clause)
       i = j = 0
       clause.xpath(ns(".//figure")).each do |t|
-        label = "Figure #{i}" + ( j.zero? ? "" : "-#{j}" )
-        if t.parent.name == "figure"
-          j += 1
+        if t.parent.name == "figure" then j += 1
         else
           j = 0
           i += 1
         end
-        label = "Figure #{i}" + ( j.zero? ? "" : "-#{j}" )
-        @anchors[t["id"]] = { label: label, xref: label }
+        label = i.to_s + (j.zero? ? "" : "-#{j}")
+        @anchors[t["id"]] = anchor_struct(label, nil, @figure_lbl)
       end
     end
+    def anchor_struct(lbl, container, elem)
+      ret = { label: lbl.to_s }
+      ret[:xref] =
+        elem == "Formula" ? l10n("#{elem} (#{lbl})") : l10n("#{elem} #{lbl}")
+      ret[:xref].gsub!(/ $/, "")
+      ret[:container] = get_clause_id(container) unless container.nil?
+      ret
+    end
     def sequential_asset_names(clause)
       clause.xpath(ns(".//table")).each_with_index do |t, i|
-        @anchors[t["id"]] = { label: "Table #{i + 1}",
-                              xref: "Table #{i + 1}" }
+        @anchors[t["id"]] = anchor_struct(i + 1, nil, @table_lbl)
       end
       sequential_figure_names(clause)
       clause.xpath(ns(".//formula")).each_with_index do |t, i|
-        @anchors[t["id"]] = { label: (i + 1).to_s,
-                              xref: "Formula #{i + 1}" }
+        @anchors[t["id"]] = anchor_struct(i + 1, t, @formula_lbl)
       end
     end
     def hierarchical_figure_names(clause, num)
       i = j = 0
       clause.xpath(ns(".//figure")).each do |t|
-        if t.parent.name == "figure"
-          j += 1
+        if t.parent.name == "figure" then j += 1
         else
           j = 0
           i += 1
         end
-        label = "Figure #{num}.#{i}" + ( j.zero? ? "" : "-#{j}" )
-        @anchors[t["id"]] = { label: label, xref: label }
+        label = "#{num}.#{i}" + (j.zero? ? "" : "-#{j}")
+        @anchors[t["id"]] = anchor_struct(label, nil, @figure_lbl)
       end
     end
     def hierarchical_asset_names(clause, num)
       clause.xpath(ns(".//table")).each_with_index do |t, i|
-        @anchors[t["id"]] = { label: "Table #{num}.#{i + 1}",
-                              xref: "Table #{num}.#{i + 1}" }
+        @anchors[t["id"]] = anchor_struct("#{num}.#{i + 1}", nil, @table_lbl)
       end
       hierarchical_figure_names(clause, num)
       clause.xpath(ns(".//formula")).each_with_index do |t, i|
-        @anchors[t["id"]] = { label: "#{num}.#{i + 1}",
-                              xref: "Formula #{num}.#{i + 1}" }
+        @anchors[t["id"]] = anchor_struct("#{num}.#{i + 1}", t, @formula_lbl)
       end
     end
@@ -141,30 +175,32 @@ module IsoDoc
       end
     end
-    def section_names(clause, num, level)
-      @anchors[clause["id"]] = { label: num, xref: "Clause #{num}",
-                                 level: level }
-      clause.xpath(ns("./subsection | ./term")).each_with_index do |c, i|
-        section_names1(c, "#{num}.#{i + 1}", level + 1)
+    def section_names(clause, num, lvl)
+      return if clause.nil?
+      @anchors[clause["id"]] =
+        { label: num, xref: l10n("#{@clause_lbl} #{num}"), level: lvl }
+      clause.xpath(ns("./subsection | ./term  | ./terms | ./symbols-abbrevs")).
+        each_with_index do |c, i|
+        section_names1(c, "#{num}.#{i + 1}", lvl + 1)
       end
     end
     def section_names1(clause, num, level)
-      @anchors[clause["id"]] =
-        { label: num, level: level,
-          xref: clause.name == "term" ? num : "Clause #{num}" }
-      clause.xpath(ns("./subsection ")).
+      @anchors[clause["id"]] =
+        { label: num, level: level, xref: num }
+      # subclauses are not prefixed with "Clause"
+      clause.xpath(ns("./subsection | ./terms | ./term | ./symbols-abbrevs")).
         each_with_index do |c, i|
         section_names1(c, "#{num}.#{i + 1}", level + 1)
       end
     end
     def annex_names(clause, num)
-      obligation = "(Informative)"
-      obligation = "(Normative)" if clause["subtype"] == "normative"
-      label = "<b>Annex #{num}</b><br/>#{obligation}"
-      @anchors[clause["id"]] = { label: label,
-                                 xref: "Annex #{num}", level: 1 }
+      obl = l10n("(#{@inform_annex_lbl})")
+      obl = l10n("(#{@norm_annex_lbl})") if clause["obligation"] == "normative"
+      label = l10n("<b>#{@annex_lbl} #{num}</b><br/>#{obl}")
+      @anchors[clause["id"]] =
+        { label: label, xref: "#{@annex_lbl} #{num}", level: 1 }
       clause.xpath(ns("./subsection")).each_with_index do |c, i|
         annex_names1(c, "#{num}.#{i + 1}", 2)
       end
@@ -172,34 +208,10 @@ module IsoDoc
     end
     def annex_names1(clause, num, level)
-      @anchors[clause["id"]] = { label: num,
-                                 xref: num,
-                                 level: level }
+      @anchors[clause["id"]] = { label: num, xref: num, level: level }
       clause.xpath(ns(".//subsection")).each_with_index do |c, i|
         annex_names1(c, "#{num}.#{i + 1}", level + 1)
       end
     end
-    def format_ref(ref, isopub)
-      return "ISO #{ref}" if isopub
-      return "[#{ref}]" if /^\d+$/.match?(ref) && !/^\[.*\]$/.match?(ref)
-      ref
-    end
-    def reference_names(ref)
-      isopub = ref.at(ns(ISO_PUBLISHER_XPATH))
-      docid = ref.at(ns("./docidentifier"))
-      return ref_names(ref) unless docid
-      date = ref.at(ns("./date[@type = 'published']"))
-      reference = format_ref(docid.text, isopub)
-      reference += ": #{date.text}" if date && isopub
-      @anchors[ref["id"]] = { xref: reference }
-    end
-    def ref_names(ref)
-      linkend = ref.text
-      linkend.gsub!(/[\[\]]/, "") unless /^\[\d+\]$/.match? linkend
-      @anchors[ref["id"]] = { xref: linkend }
-    end
   end
 end

data/spec/isodoc/blocks_spec.rb ADDED

@@ -0,0 +1,618 @@
+require "spec_helper"
+RSpec.describe IsoDoc do
+  it "processes unlabelled notes" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <note>
+  <p id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83f">These results are based on a study carried out on three different types of kernel.</p>
+</note>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="" class="Note">
+                   <p class="Note">NOTE<span style="mso-tab-count:1">&#160; </span>These results are based on a study carried out on three different types of kernel.</p>
+                 </div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes labelled notes" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <note id="note1">
+  <p id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83f">These results are based on a study carried out on three different types of kernel.</p>
+</note>
+    <note id="note2">
+  <p id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83a">These results are based on a study carried out on three different types of kernel.</p>
+</note>
+    </foreword>
+    </iso-standard>
+INPUT
+       <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="note1" class="Note">
+                   <p class="Note">NOTE  1<span style="mso-tab-count:1">&#160; </span>These results are based on a study carried out on three different types of kernel.</p>
+                 </div>
+                 <div id="note2" class="Note">
+                   <p class="Note">NOTE  2<span style="mso-tab-count:1">&#160; </span>These results are based on a study carried out on three different types of kernel.</p>
+                 </div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes multi-para notes" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <note>
+  <p id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83f">These results are based on a study carried out on three different types of kernel.</p>
+  <p id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83a">These results are based on a study carried out on three different types of kernel.</p>
+</note>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="" class="Note">
+                   <p class="Note">NOTE<span style="mso-tab-count:1">&#160; </span>These results are based on a study carried out on three different types of kernel.</p>
+                   <p class="Note" id="_f06fd0d1-a203-4f3d-a515-0bdba0f8d83a">These results are based on a study carried out on three different types of kernel.</p>
+                 </div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes non-para notes" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <note>
+    <dl>
+    <dt>A</dt>
+    <dd><p>B</p></dd>
+    </dl>
+    <ul>
+    <li>C</li></ul>
+</note>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="" class="Note"><p class="Note">NOTE<span style="mso-tab-count:1">&#160; </span></p>
+           <dl><dt><p class="Note">A</p></dt><dd><p class="Note">B</p></dd></dl>
+           <ul>
+           <li>C</li></ul>
+       </div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes figures" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <figure id="figureA-1">
+  <name>Split-it-right sample divider</name>
+  <image src="rice_images/rice_image1.png" id="_8357ede4-6d44-4672-bac4-9a85e82ab7f0" imagetype="PNG"/>
+  <dl>
+  <dt>A</dt>
+  <dd><p>B</p></dd>
+  </dl>
+</figure>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="figureA-1" class="figure">
+         <img src="rice_images/rice_image1.png"/>
+         <p><b>Key</b></p><dl><dt><p>A</p></dt><dd><p>B</p></dd></dl>
+       <p class="FigureTitle" align="center"><b>Figure 1&#160;&#8212; Split-it-right sample divider</b></p></div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes examples" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <example id="samplecode">
+  <p>Hello</p>
+</example>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <table id="samplecode" class="example">
+                   <tr>
+                     <td width="110pt" valign="top" style="width:82.8pt;padding:.75pt .75pt .75pt .75pt">EXAMPLE</td>
+                     <td valign="top">
+         <p>Hello</p>
+       </td>
+                   </tr>
+                 </table>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes sequences of examples" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <example id="samplecode">
+  <p>Hello</p>
+</example>
+    <example id="samplecode2>
+  <p>Hello</p>
+</example>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <table id="samplecode" class="example">
+                   <tr>
+                     <td width="110pt" valign="top" style="width:82.8pt;padding:.75pt .75pt .75pt .75pt">EXAMPLE  1</td>
+                     <td valign="top">
+         <p>Hello</p>
+       </td>
+                   </tr>
+                 </table>
+                 <table id="samplecode2&gt;   " class="example">
+                   <tr>
+                     <td width="110pt" valign="top" style="width:82.8pt;padding:.75pt .75pt .75pt .75pt">EXAMPLE  2</td>
+                     <td valign="top"/>
+                   </tr>
+                 </table>
+                 <p>Hello</p>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes sourcecode" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <sourcecode id="samplecode">
+    <name>Ruby code</name>
+  puts x
+</sourcecode>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <p id="samplecode" class="Sourcecode"><br/>&#160;&#160;&#160;&#160;<br/>&#160;&#160;puts&#160;x<br/><p class="FigureTitle" align="center"><b>Ruby code</b></p></p>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes sourcecode with annotations" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <sourcecode id="_">puts "Hello, world." <callout target="A">1</callout>
+       %w{a b c}.each do |x|
+         puts x <callout target="B">2</callout>
+       end<annotation id="A">
+         <p id="_">This is one callout</p>
+       </annotation><annotation id="B">
+         <p id="_">This is another callout</p>
+       </annotation></sourcecode>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <p id="_" class="Sourcecode">puts&#160;"Hello,&#160;world."&#160; &lt;1&gt;<br/>&#160;&#160;&#160;%w{a&#160;b&#160;c}.each&#160;do&#160;|x|<br/>&#160;&#160;&#160;&#160;&#160;puts&#160;x&#160; &lt;2&gt;<br/>&#160;&#160;&#160;end<span class="zzMoveToFollowing">&lt;1&gt; </span>
+            <p class="Sourcecode" id="_">This is one callout</p>
+          <span class="zzMoveToFollowing">&lt;2&gt; </span>
+            <p class="Sourcecode" id="_">This is another callout</p>
+          </p>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes admonitions" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <admonition id="_70234f78-64e5-4dfc-8b6f-f3f037348b6a" type="caution">
+  <p id="_e94663cc-2473-4ccc-9a72-983a74d989f2">Only use paddy or parboiled rice for the determination of husked rice yield.</p>
+</admonition>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div class="Admonition"><title>CAUTION</title>
+         <p id="_e94663cc-2473-4ccc-9a72-983a74d989f2">Only use paddy or parboiled rice for the determination of husked rice yield.</p>
+       </div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes formulae" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <formula id="_be9158af-7e93-4ee2-90c5-26d31c181934">
+  <stem type="AsciiMath">r = 1 %</stem>
+<dl id="_e4fe94fe-1cde-49d9-b1ad-743293b7e21d">
+  <dt>
+    <stem type="AsciiMath">r</stem>
+  </dt>
+  <dd>
+    <p id="_1b99995d-ff03-40f5-8f2e-ab9665a69b77">is the repeatability limit.</p>
+  </dd>
+</dl></formula>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div id="_be9158af-7e93-4ee2-90c5-26d31c181934" class="formula"><span class="stem">(#(r = 1 %)#)</span><span style="mso-tab-count:1">&#160; </span>(1)</div>
+                 <p>where</p>
+                 <dl>
+                   <dt>
+           <span class="stem">(#(r)#)</span>
+         </dt>
+                   <dd>
+           <p id="_1b99995d-ff03-40f5-8f2e-ab9665a69b77">is the repeatability limit.</p>
+         </dd>
+                 </dl>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes paragraph alignments" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <p align="left" id="_08bfe952-d57f-4150-9c95-5d52098cc2a8">Vache Equipment<br/>
+Fictitious<br/>
+World
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <p id="_08bfe952-d57f-4150-9c95-5d52098cc2a8" align="left" style="text-align:left">Vache Equipment<br/>
+       Fictitious<br/>
+       World
+           </p>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes blockquotes" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <foreword>
+    <quote id="_044bd364-c832-4b78-8fea-92242402a1d1">
+  <source type="inline" bibitemid="ISO7301" citeas="ISO 7301: 2011"><locality type="clause"><referenceFrom>1</referenceFrom></locality></source>
+  <author>ISO</author>
+  <p id="_d4fd0a61-f300-4285-abe6-602707590e53">This International Standard gives the minimum specifications for rice (<em>Oryza sativa</em> L.) which is subject to international trade. It is applicable to the following types: husked rice and milled rice, parboiled or not, intended for direct human consumption. It is neither applicable to other products derived from rice, nor to waxy rice (glutinous rice).</p>
+</quote>
+    </foreword>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <br clear="all" style="mso-special-character:line-break;page-break-before:always"/>
+               <div>
+                 <h1 class="ForewordTitle">Foreword</h1>
+                 <div class="Quote" id="_044bd364-c832-4b78-8fea-92242402a1d1">
+         <p id="_d4fd0a61-f300-4285-abe6-602707590e53">This International Standard gives the minimum specifications for rice (<i>Oryza sativa</i> L.) which is subject to international trade. It is applicable to the following types: husked rice and milled rice, parboiled or not, intended for direct human consumption. It is neither applicable to other products derived from rice, nor to waxy rice (glutinous rice).</p>
+       <p class="QuoteAttribution">&#8212; ISO, <a href="#ISO7301">ISO 7301: 2011, Clause 1</a></p></div>
+               </div>
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+  it "processes term domains" do
+    expect(IsoDoc::Convert.new({}).convert_file(<<~"INPUT", "test", true)).to be_equivalent_to <<~"OUTPUT"
+    <iso-standard xmlns="http://riboseinc.com/isoxml">
+    <sections>
+    <terms>
+    <term id="_extraneous_matter"><preferred>extraneous matter</preferred><admitted>EM</admitted>
+<domain>rice</domain>
+<definition><p id="_318b3939-be09-46c4-a284-93f9826b981e">organic and inorganic components other than whole or broken kernels</p></definition>
+</term>
+    </terms>
+    </sections>
+    </iso-standard>
+    INPUT
+           <html xmlns:epub="http://www.idpf.org/2007/ops">
+         <head>
+           <title>test</title>
+           <body lang="EN-US" link="blue" vlink="#954F72">
+             <div class="WordSection1">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection2">
+               <p>&#160;</p>
+             </div>
+             <br clear="all" class="section"/>
+             <div class="WordSection3">
+               <p class="zzSTDTitle1"/>
+               <div><h1>3.<span style="mso-tab-count:1">&#160; </span>Terms and Definitions</h1><p>For the purposes of this document,
+           the following terms and definitions apply.</p>
+       <p>ISO and IEC maintain terminological databases for use in
+       standardization at the following addresses:</p>
+       <ul>
+       <li> <p>ISO Online browsing platform: available at
+         <a href="http://www.iso.org/obp">http://www.iso.org/obp</a></p> </li>
+       <li> <p>IEC Electropedia: available at
+         <a href="http://www.electropedia.org">http://www.electropedia.org</a>
+       </p> </li> </ul>
+       <p class="TermNum" id="_extraneous_matter">3.1</p><p class="Terms">extraneous matter</p><p class="AltTerms">EM</p>
+       <p id="_318b3939-be09-46c4-a284-93f9826b981e">&lt;rice&gt; organic and inorganic components other than whole or broken kernels</p>
+       </div>
+             </div>
+           </body>
+         </head>
+       </html>
+    OUTPUT
+  end
+end