RubyGems - polytexnic - Versions diffs - 0.5.0 - Mend

polytexnic 0.5.0

Files changed (125) hide show

checksums.yaml +7 -0
data/.gitignore +37 -0
data/.pull_requests/1371777257 +0 -0
data/.pull_requests/1371927975 +0 -0
data/.pull_requests/1372804345 +0 -0
data/.pull_requests/1374784075 +0 -0
data/.pull_requests/1375304853 +0 -0
data/.pull_requests/1375408308 +0 -0
data/.pull_requests/1375409462 +0 -0
data/.pull_requests/1375410668 +0 -0
data/.pull_requests/1375472132 +0 -0
data/.pull_requests/1375485496 +0 -0
data/.pull_requests/1375487548 +0 -0
data/.pull_requests/1375492835 +0 -0
data/.pull_requests/1375497765 +0 -0
data/.pull_requests/1375559547 +0 -0
data/.pull_requests/1375589063 +0 -0
data/.pull_requests/1375841786 +0 -0
data/.pull_requests/1376352634 +0 -0
data/.pull_requests/1376353299 +0 -0
data/.pull_requests/1376449284 +0 -0
data/.pull_requests/1376452696 +0 -0
data/.pull_requests/1376454166 +0 -0
data/.pull_requests/1376532291 +0 -0
data/.pull_requests/1376625487 +0 -0
data/.pull_requests/1376690108 +0 -0
data/.pull_requests/1376699046 +0 -0
data/.pull_requests/1376707642 +0 -0
data/.pull_requests/1377230284 +0 -0
data/.pull_requests/1379118478 +0 -0
data/.pull_requests/1379123150 +0 -0
data/.pull_requests/1380221847 +0 -0
data/.pull_requests/1380589654 +0 -0
data/.pull_requests/1380673142 +0 -0
data/.pull_requests/1380850800 +0 -0
data/.pull_requests/1381001264 +0 -0
data/.pull_requests/1381005204 +0 -0
data/.pull_requests/1381103022 +0 -0
data/.pull_requests/1381252832 +0 -0
data/.pull_requests/1381276624 +0 -0
data/.pull_requests/1381344234 +0 -0
data/.pull_requests/1381385297 +0 -0
data/.pull_requests/1381427498 +0 -0
data/.pull_requests/1381429761 +0 -0
data/.pull_requests/1381873684 +0 -0
data/.pull_requests/1382045490 +0 -0
data/.pull_requests/1382056384 +0 -0
data/.pull_requests/1382405223 +0 -0
data/.pull_requests/1382478400 +0 -0
data/.pull_requests/1382479780 +0 -0
data/.pull_requests/1382485483 +0 -0
data/.pull_requests/1382569911 +0 -0
data/.pull_requests/1382646199 +0 -0
data/.pull_requests/1382649778 +0 -0
data/.pull_requests/1382660987 +0 -0
data/.pull_requests/1382743927 +0 -0
data/.pull_requests/1382840347 +0 -0
data/.pull_requests/1383077676 +0 -0
data/.pull_requests/1383086948 +0 -0
data/.pull_requests/1383161978 +0 -0
data/.pull_requests/1383263695 +0 -0
data/.pull_requests/1383274008 +0 -0
data/.pull_requests/1383327328 +0 -0
data/.rspec +2 -0
data/.ruby-gemset +1 -0
data/.ruby-version +1 -0
data/Gemfile +15 -0
data/Guardfile +15 -0
data/LICENSE.txt +22 -0
data/README.md +21 -0
data/Rakefile +2 -0
data/lib/polytexnic/literal.rb +299 -0
data/lib/polytexnic/postprocessor.rb +28 -0
data/lib/polytexnic/postprocessors/html.rb +1139 -0
data/lib/polytexnic/postprocessors/latex.rb +18 -0
data/lib/polytexnic/postprocessors/polytex.rb +44 -0
data/lib/polytexnic/preprocessor.rb +23 -0
data/lib/polytexnic/preprocessors/html.rb +349 -0
data/lib/polytexnic/preprocessors/latex.rb +43 -0
data/lib/polytexnic/preprocessors/polytex.rb +127 -0
data/lib/polytexnic/utils.rb +176 -0
data/lib/polytexnic/version.rb +3 -0
data/lib/polytexnic.rb +92 -0
data/notes/pandoc.md +41 -0
data/polytexnic.gemspec +28 -0
data/polytexnic_commands.sty +5 -0
data/precompiled_binaries/tralics +0 -0
data/spec/fixtures/code_listing.tex +14 -0
data/spec/fixtures/figures.tex +8 -0
data/spec/fixtures/inline_math.html +4 -0
data/spec/fixtures/inline_math.tex +3 -0
data/spec/fixtures/math_environments.html +50 -0
data/spec/fixtures/math_environments.tex +56 -0
data/spec/fixtures/section_xrefs.tex +9 -0
data/spec/fixtures/sidebar.tex +10 -0
data/spec/fixtures/tables.tex +8 -0
data/spec/fixtures/verbatim_environments.html +11 -0
data/spec/fixtures/verbatim_environments.tex +13 -0
data/spec/integration_spec.rb +34 -0
data/spec/markdown_to_polytex_spec.rb +192 -0
data/spec/resemble_matcher_spec.rb +69 -0
data/spec/spec_helper.rb +38 -0
data/spec/support/resemble_matcher.rb +100 -0
data/spec/to_html/asides_spec.rb +42 -0
data/spec/to_html/chapters_and_sections_spec.rb +268 -0
data/spec/to_html/characters_and_punctuation_spec.rb +138 -0
data/spec/to_html/codelistings_spec.rb +70 -0
data/spec/to_html/core_spec.rb +227 -0
data/spec/to_html/eqref_spec.rb +32 -0
data/spec/to_html/footnote_spec.rb +164 -0
data/spec/to_html/graphics_and_figures_spec.rb +358 -0
data/spec/to_html/lists_spec.rb +103 -0
data/spec/to_html/literal_environments/code_spec.rb +141 -0
data/spec/to_html/literal_environments/math_spec.rb +255 -0
data/spec/to_html/literal_environments/unicode_spec.rb +12 -0
data/spec/to_html/literal_environments/verbatim_spec.rb +168 -0
data/spec/to_html/quotations_and_verse_spec.rb +86 -0
data/spec/to_html/table_of_contents_spec.rb +93 -0
data/spec/to_html/table_spec.rb +269 -0
data/spec/to_html/text_formatting_spec.rb +50 -0
data/spec/to_latex_spec.rb +197 -0
data/tasks/bin/ruby_tests +41 -0
data/tasks/run_tests_with_both_rubies.rake +5 -0
data/tmp/.gitkeep +0 -0
metadata +286 -0

data/lib/polytexnic/postprocessors/latex.rb ADDED Viewed

@@ -0,0 +1,18 @@
+require 'polytexnic/literal'
+module Polytexnic
+  module Postprocessor
+    module Latex
+      # Restores literal environments (verbatim, code, math, etc.).
+      def replace_hashes(polytex)
+        puts polytex if debug?
+        polytex.tap do
+          literal_cache.each do |key, value|
+            polytex.gsub!(key, escape_backslashes(value))
+          end
+        end
+      end
+    end
+  end
+end

data/lib/polytexnic/postprocessors/polytex.rb ADDED Viewed

@@ -0,0 +1,44 @@
+# encoding=utf-8
+module Polytexnic
+  module Postprocessor
+    module Polytex
+      # Removes references to the hypertarget package.
+      # TODO: Support hypertarget
+      # This isn't a priority, as you get most of what you need
+      # with hyperref.
+      def remove_hypertarget
+        @source.gsub!(/\\hypertarget.*$/, '')
+      end
+      # Fixes a kramdown verbatim bug.
+      # When converting code, kramdown outputs
+      # "\begin{verbatim}foo" instead of
+      # "\begin{verbatim}\nfoo".
+      def fix_verbatim_bug
+        @source.gsub!(/\\begin\{verbatim\}/) { |s| s + "\n" }
+      end
+      # Writes the PolyTeX code environments based on the code cache.
+      # I.e., code that looks like
+      # {lang="ruby"}
+      #     def foo
+      #       "bar"
+      #     end
+      # becomes
+      # %= lang:ruby
+      # \begin{code}
+      # def foo
+      #   "bar"
+      # end
+      # \end{code}
+      # which reduces syntax highlighting to a previously solved problem.
+      def write_polytex_code
+        code_cache.each do |key, (code, lang, in_codelisting)|
+          latex = "%= lang:#{lang}\n\\begin{code}\n#{code}\n\\end{code}"
+          @source.gsub!(key, latex)
+        end
+      end
+    end
+  end
+end

data/lib/polytexnic/preprocessor.rb ADDED Viewed

@@ -0,0 +1,23 @@
+# encoding=utf-8
+require 'polytexnic/literal'
+require 'polytexnic/preprocessors/html'
+require 'polytexnic/preprocessors/latex'
+require 'polytexnic/preprocessors/polytex'
+module Polytexnic
+  module Preprocessor
+    include Literal
+    include Html
+    include Latex
+    include Polytex
+    # Preprocesses the input based on output format.
+    def preprocess(format)
+      case format
+      when :html    then to_xml
+      when :latex   then to_processed_latex
+      when :polytex then to_polytex
+      end
+    end
+  end
+end

data/lib/polytexnic/preprocessors/html.rb ADDED Viewed

@@ -0,0 +1,349 @@
+# encoding=utf-8
+module Polytexnic
+  module Preprocessor
+    module Html
+      # Converts HTML to XML.
+      # The heart of the process is using Tralics to convert the input PolyTeX
+      # to XML. The raw PolyTeX needs to be processed first to make everything
+      # go smoothly, but after that the steps to producing the corresponding
+      # XML is straightforward.
+      def to_xml
+        polytex = process_for_tralics(@polytex)
+        doc = Nokogiri::XML(tralics_xml(polytex))
+        add_document_tag(doc)
+        @xml = doc.to_xml
+      end
+      private
+        # Processes the input PolyTeX for Tralics.
+        # The key steps are creating a clean document safe for making global
+        # substitutions (gsubs), and then making a bunch of gsubs.
+        def process_for_tralics(polytex)
+          clean_document(polytex).tap do |output|
+            process_spaces(output)
+            remove_commands(output)
+            hyperrefs(output)
+            title_fields(output)
+            maketitle(output)
+            label_names(output)
+            image_names(output)
+            restore_eq_labels(output)
+            convert_figure_centering(output)
+            convert_longtable(output)
+            mark_environments(output)
+            make_tabular_alignment_cache(output)
+          end
+        end
+        # Returns a clean document with cached literal environments.
+        # This is a key step: we cache literal environments that should be
+        # passed through the pipeline with no changes (verbatim, code, etc.).
+        # The result is a document that can safely be transformed using
+        # global substitutions.
+        def clean_document(polytex)
+          doc = cache_unicode(cache_literal(add_commands(polytex)))
+          inline_verbatim(doc)
+          cache_hrefs(doc)
+          remove_comments(doc)
+          double_backslashes(cache_display_inline_math(doc))
+        end
+        # Prepares spaces to be passed through the pipeline.
+        # Handles thin spaces ('\,') and normal spaces ('\ '), as well as
+        # end-of-sentence spaces.
+        # The document is modified in place. The return value is that of the
+        # final gsub! (nil when it made no substitution), so callers should
+        # not rely on it.
+        def process_spaces(doc)
+          doc.gsub!(/\\,/, xmlelement('thinspace'))
+          # Match an end of sentence character, while also recognizing
+          # things like (Or otherwise.) and ``Yes, indeed!'' as being the
+          # ends of sentences.
+          end_of_sentence = '[.?!](?:\)|\'+)?'
+          # Handle a forced normal space '\ '.
+          doc.gsub!(/(#{end_of_sentence})\\ /) do
+            $1 + xmlelement('normalspace')
+          end
+          # Sentence-ending punctuation directly after a capital letter is
+          # skipped (presumably so initials and acronyms aren't treated as
+          # sentence ends; the '\@' override below covers the exceptions).
+          not_a_capital = '[^A-Z]'
+          # Case of "foo. A"
+          doc.gsub!(/(#{not_a_capital})(#{end_of_sentence})[ ]+([^\s])/) do
+            $1 + $2 + xmlelement('intersentencespace') + ' ' + $3
+          end
+          # Case of "foo.\n A"
+          doc.gsub!(/(#{not_a_capital})(#{end_of_sentence})\n[ ]+([^\s])/) do
+            $1 + $2 + xmlelement('intersentencespace') + ' ' + $3
+          end
+          # Case of "foo.\nA"
+          doc.gsub!(/(#{not_a_capital})(#{end_of_sentence})\n([^\n])/) do
+            $1 + $2 + xmlelement('intersentencespace') + ' ' + $3
+          end
+          # Handle the manual override to force an inter-sentence space, '\@',
+          # as in 'Superman II\@. A new sentence'.
+          doc.gsub!(/\\@\. /, '.' + xmlelement('intersentencespace') + ' ')
+        end
+        # Removes commands that might screw up Tralics.
+        def remove_commands(doc)
+          # Determine if we're using footnote symbols.
+          symbols_cmd = '\renewcommand{\thefootnote}{\fnsymbol{footnote}}'
+          @footnote_symbols = !!doc.match(/^\s*#{Regexp.escape(symbols_cmd)}/)
+          doc.gsub!(/^\s*\\renewcommand.*$/, '')
+        end
+        # Returns true if we should use footnote symbols in place of numbers.
+        # Simply reads the @footnote_symbols flag assigned by remove_commands;
+        # presumably nil (falsy) if that method hasn't run yet.
+        def footnote_symbols?
+          @footnote_symbols
+        end
+        # Handles \verb environments.
+        # LaTeX supports an inline verbatim environment using
+        #   \verb+<stuff>+
+        # The + is arbitrary; any non-letter character is fine as long as it
+        # doesn't appear in <stuff>, so this code has exactly the same effect:
+        #   \verb!<stuff>!
+        #   \verb@<stuff>@
+        #   \verb8<stuff>8
+        # My preference is to use + or - if available.
+        def inline_verbatim(doc)
+          doc.gsub!(/\\verb([^A-Za-z])(.*?)\1/) do
+            key = digest($2)
+            literal_cache[key] = $2
+            xmlelement('inlineverbatim') { key }
+          end
+        end
+        # Removes commented-out lines.
+        def remove_comments(output)
+          output.gsub!(/[^\\]%.*$/, '')
+        end
+        # Converts LaTeX double backslashes to HTML breaks.
+        def double_backslashes(string)
+          lines = []
+          in_table = false
+          string.split("\n").each do |line|
+            in_table ||= (line =~ /^\s*\\begin{(?:tabular|longtable)}/)
+            line.gsub!('\\\\', xmlelement('backslashbreak')) unless in_table
+            lines << line
+            in_table = (in_table && line !~ /^\s*\\end{tabular}/)
+          end
+          lines.join("\n")
+        end
+        # Adds some default commands.
+        def add_commands(polytex)
+          line(custom_commands) + tralics_commands + polytex
+        end
+        # Pads a string with newlines.
+        def line(string)
+          "\n#{string}\n"
+        end
+        # Handles title fields.
+        def title_fields(string)
+          %w{title subtitle author date}.each do |field|
+            string.gsub! /\\#{field}\{(.*)\}/ do |s|
+              maketitle_elements[field] = $1
+              ''
+            end
+          end
+        end
+        # Replaces maketitle with an XML element.
+        def maketitle(string)
+          string.gsub! /\\maketitle/ do |s|
+            xmlelement('maketitle')
+          end
+        end
+        # Preserves label names.
+        # Tralics doesn't keep the names of labels, e.g., 'cha:foobar' in
+        # '\label{cha:foobar}'. But Tralics supplies a wide variety of
+        # pseudo-LaTeX commands to add arbitrary XML elements to the final
+        # document. In this case, the \xbox command does the trick. See
+        # http://www-sop.inria.fr/marelle/tralics/doc-x.html
+        # for more information.
+        def label_names(string)
+          string.gsub! /\\label\{(.*?)\}/ do |s|
+            label = $1.gsub(':', '-').gsub('_', underscore_digest)
+            "#{s}\n\\xbox{data-label}{#{label}}"
+          end
+        end
+        # Handles image names with underscores.
+        # This is a terrible kludge, and it's annoying that it's
+        # apparently necessary.
+        def image_names(string)
+          string.gsub! /\\image\{(.*?)\}/ do |s|
+            escaped_filename = $1.gsub('_', underscore_digest)
+            "\\image{#{escaped_filename}}"
+          end
+          string.gsub! /\\imagebox\{(.*?)\}/ do |s|
+            escaped_filename = $1.gsub('_', underscore_digest)
+            "\\imagebox{#{escaped_filename}}"
+          end
+        end
+        # Restores the equation labels.
+        def restore_eq_labels(output)
+          math_label_cache.each do |key, label|
+            output.gsub!(key, label)
+          end
+        end
+        # Handles centering in figures.
+        # The way we handle generic \begin{center}...\end{center} doesn't
+        # work in figures for some reason. Luckily, the preferred method
+        # is to use \centering anyway, so this kludge is actually better LaTeX.
+        def convert_figure_centering(output)
+          @in_figure = false
+          centered = output.split("\n").map do |line|
+            if line =~ /^\s*\\begin\{figure\}/
+              @in_figure = true
+              line
+            elsif @in_figure && line =~ /^\s*\\begin\{center\}/
+              '\centering'
+            elsif @in_figure && line =~ /^\s*\\end\{center\}/
+              ''
+            elsif @in_figure && line =~ /^\s*\\end\{figure\}/
+              @in_figure = false
+              line
+            else
+              line
+            end
+          end.join("\n")
+          output.replace(centered)
+        end
+        # Converts the longtable environment to simple tabular.
+        # This is mainly because kramdown outputs longtables by default,
+        # but as a side-effect you can also use longtables in PolyTeX
+        # input documents.
+        def convert_longtable(output)
+          output.gsub!('\begin{longtable}', '\begin{tabular}')
+          output.gsub!('\end{longtable}',   '\end{tabular}')
+        end
+        # Marks environments with their types.
+        # Tralics strips some information when processing LaTeX, such as
+        # whether a particular div defines a chapter. We remedy this by
+        # using the \AddAttToCurrent pseudo-LaTeX command to mark such
+        # environments with their types.
+        # The string is modified in place by a fixed sequence of
+        # substitutions: chapters, codelistings, asides, quotations and
+        # verse, and finally centering.
+        def mark_environments(string)
+          # Marks chapters with a 'chapter' type.
+          # Also handles \chapter*.
+          string.gsub! /^\s*\\chapter\*?\{(.*)\}/ do |s|
+            "#{s}\n\\AddAttToCurrent{type}{chapter}"
+          end
+          # Wrap codelistings in a 'codelisting' element.
+          string.gsub! /\\begin{codelisting}/ do |s|
+            "\\begin{xmlelement*}{codelisting}\n#{s}"
+          end
+          string.gsub! /\\end{codelisting}/ do |s|
+            "#{s}\n\\end{xmlelement*}"
+          end
+          # Wrap asides in an 'aside' element.
+          string.gsub! /\\begin{aside}/ do |s|
+            "\\begin{xmlelement*}{aside}\n#{s}"
+          end
+          string.gsub! /\\end{aside}/ do |s|
+            "#{s}\n\\end{xmlelement*}"
+          end
+          # Replace quotations and verse with corresponding XML elements.
+          # Unlike codelistings and asides, the original \begin/\end commands
+          # are dropped rather than wrapped.
+          string.gsub! /\\begin{quote}/ do |s|
+            quotation = '\AddAttToCurrent{class}{quotation}'
+            "\\begin{xmlelement*}{blockquote}\n#{quotation}"
+          end
+          string.gsub! /\\end{quote}/ do |s|
+            "\\end{xmlelement*}"
+          end
+          string.gsub! /\\begin{verse}/ do |s|
+            "\\begin{xmlelement*}{blockquote}\n\\AddAttToCurrent{class}{verse}"
+          end
+          string.gsub! /\\end{verse}/ do |s|
+            "\\end{xmlelement*}"
+          end
+          # Handle \begin{center}...\end{center}
+          string.gsub! /\\begin{center}/, '\begin{xmlelement*}{center}'
+          string.gsub! /\\end{center}/,   '\end{xmlelement*}'
+          # Handle \centering
+          string.gsub! /\\centering/, '\AddAttToCurrent{class}{center}'
+          # The \image conversion below is disabled (commented-out code).
+          # # Handle \image
+          # string.gsub! /\\image/, '\includegraphics'
+        end
+        # Collects alignment information for tabular environments.
+        # We suck out all the stuff like 'l|l|lr' in
+        # \begin{tabular}{l|l|lr}
+        # The reason is that we need to work around a couple of bugs in Tralics.
+        # I've tried in vain to figure out WTF is going on in the Tralics
+        # source, but it's easy enough in Ruby so I'm throwing it in here.
+        def make_tabular_alignment_cache(output)
+          alignment_regex = /^\s*\\begin{tabular}{((?:\|*[lcr]+\|*)+)}/
+          @tabular_alignment_cache = output.scan(alignment_regex).flatten
+        end
+        # Returns the XML produced by the Tralics program.
+        # There is a lot of ugly file manipulation here, but it's fundamentally
+        # straightforward. The heart of it is
+        #
+        #   system("#{tralics} -nomathml #{file.path} > log/tralics.log")
+        #
+        # which writes the converted PolyTeX file as XML, which then gets
+        # read in and lightly processed.
+        def tralics_xml(polytex)
+          file = Tempfile.new(['polytex', '.tex'])
+          puts polytex if debug?
+          file.write(polytex)
+          file.close
+          Dir.mkdir 'log' unless File.directory?('log')
+          system("#{tralics} -nomathml #{file.path} > log/tralics.log")
+          dirname = File.dirname(file.path)
+          xml_filename = File.basename(file.path, '.tex') + '.xml'
+          raw_xml = File.read(File.join(dirname, xml_filename))
+          xml = clean_xml(raw_xml)
+          puts xml if debug?
+          xml
+        ensure
+          xmlfile = file.path.sub('.tex', '.xml')
+          logfile = file.path.sub('.tex', '.log')
+          [xmlfile, logfile].each do |file|
+            File.delete(file) if File.exist?(file)
+          end
+          file.delete
+        end
+        # Wraps the whole document in <document></document>.
+        # Fragmentary documents come wrapped in 'unknown' tags.
+        # Full documents are wrapped in 'std' tags.
+        # Change either to 'document' for consistency.
+        def add_document_tag(doc)
+          %w[unknown std].each do |parent_tag|
+            node = doc.at_css(parent_tag)
+            node.name = 'document' unless node.nil?
+          end
+        end
+        # Cleans up the raw XML read back from Tralics.
+        # At present the only cleanup applied is the Nokogiri ellipsis
+        # workaround. Returns the cleaned XML.
+        def clean_xml(raw_xml)
+          nokogiri_ellipsis_workaround(raw_xml)
+        end
+        # Fixes a Nokogiri bug.
+        # As of this writing, the latest version of Nokogiri (1.5.6) doesn't
+        # handle the horizontal ellipsis character '&#133;' correctly in Ruby 2.
+        # The kludgy solution is to replace it with '…' in the raw XML,
+        # which does work.
+        def nokogiri_ellipsis_workaround(raw_xml)
+          raw_xml.gsub('&#133;', '…')
+        end
+    end
+  end
+end

data/lib/polytexnic/preprocessors/latex.rb ADDED Viewed

@@ -0,0 +1,43 @@
+module Polytexnic
+  module Preprocessor
+    module Latex
+      def to_processed_latex
+        @polytex = polish_tables(process_asides(clean_latex_document))
+      end
+      # Returns LaTeX with hashed versions of literal environments.
+      # Literal environments are hashed and passed through the pipeline
+      # so that we can process things like refs to hyperrefs using gsubs.
+      # Delegates to cache_literal, passing @polytex and the :latex format.
+      def clean_latex_document
+        cache_literal(@polytex, :latex)
+      end
+      def polish_tables(text)
+        text.tap do
+          text.gsub!(/^\s*(\\begin\{table\})/) do
+            "#{$1}\n\\begin{center}\n\\small\n"
+          end
+          text.gsub!(/^\s*(\\end\{table\})/) { "\\end{center}\n#{$1}" }
+        end
+      end
+      # Processes aside environments.
+      # In order to get nice framed & shaded aside boxes, we need to
+      # transform the default aside into a new environment.
+      def process_asides(text)
+        # Transform asides with headings and labels.
+        aside_regex = /\\begin{aside}\n\s*
+                       \\heading{(.*?)}\s*
+                       \\label{(.*?)}\n
+                       (.*?)
+                       \\end{aside}/mx
+        text.tap do
+          text.gsub!(aside_regex) do
+            %(\\begin{shaded_aside}{#{$1}}{#{$2}}\n#{$3}\n\\end{shaded_aside})
+          end
+        end
+      end
+    end
+  end
+end

data/lib/polytexnic/preprocessors/polytex.rb ADDED Viewed

@@ -0,0 +1,127 @@
+# encoding=utf-8
+module Polytexnic
+  module Preprocessor
+    module Polytex
+      # Converts Markdown to PolyTeX.
+      # We adopt a unified approach: rather than convert "Markdown" (I use
+      # the term loosely*) directly to HTML, we convert it to PolyTeX and
+      # then run everything through the PolyTeX pipeline. Happily, kramdown
+      # comes equipped with a `to_latex` method that does most of the heavy
+      # lifting. The ouput isn't as clean as that produced by Pandoc (our
+      # previous choice), but it comes with significant advantages: (1) It's
+      # written in Ruby, available as a gem, so its use eliminates an external
+      # dependency. (2) It's the foundation for the "Markdown" interpreter
+      # used by Leanpub, so by using it ourselves we ensure greater
+      # compatibility with Leanpub books.
+      #
+      # * <rant>The number of mutually incompatible markup languages going
+      # by the name "Markdown" is truly mind-boggling. Most of them add things
+      # to John Gruber's original Markdown language in an ever-expanding
+      # attempt to bolt on the functionality needed to write longer documents.
+      # At this point, I fear that "Markdown" has become little more than a
+      # marketing term.</rant>
+      def to_polytex
+        require 'Kramdown'
+        cleaned_markdown = cache_code_environments
+        cleaned_markdown.tap do |markdown|
+          convert_code_inclusion(markdown)
+        end
+        math_cache = cache_math(cleaned_markdown)
+        # Override the header ordering, which starts with 'section' by default.
+        lh = 'chapter,section,subsection,subsubsection,paragraph,subparagraph'
+        kramdown = Kramdown::Document.new(cleaned_markdown, latex_headers: lh)
+        @source = restore_inclusion(restore_math(kramdown.to_latex, math_cache))
+      end
+      # Caches the code environments found in @source.
+      # Walks @source line by line and handles three kinds of code blocks:
+      # (1) a {lang="..."} line followed by lines indented four spaces,
+      # (2) plain ``` code fences, and (3) ```lang code fences.
+      # For (1) and (3) the code is stored in code_cache under its digest as
+      # [code, language], and the digest takes the block's place in the
+      # output. For (2) the fenced lines are re-emitted indented by four
+      # spaces. Returns the resulting text; @source itself isn't changed here.
+      def cache_code_environments
+        output = []
+        lines = @source.split("\n")
+        indentation = ' ' * 4
+        while (line = lines.shift)
+          if line =~ /\{lang="(.*?)"\}/
+            language = $1
+            code = []
+            # Collect the indented lines, with the indentation stripped.
+            while (line = lines.shift) && line.match(/^#{indentation}(.*)$/) do
+              code << $1
+            end
+            code = code.join("\n")
+            key = digest(code)
+            code_cache[key] = [code, language]
+            output << key
+            # `line` is the first line that wasn't indented (it ended the loop
+            # above), or nil at the end of the input; keep it in the output.
+            output << line
+          elsif line =~ /^```\s*$/        # basic code fences
+            # The closing fence ends the loop and is dropped.
+            while (line = lines.shift) && !line.match(/^```\s*$/)
+              output << indentation + line
+            end
+            output << "\n"
+          elsif line =~ /^```(\w+)\s*$/   # syntax-highlighted code fences
+            language = $1
+            code = []
+            while (line = lines.shift) && !line.match(/^```\s*$/) do
+              code << line
+            end
+            code = code.join("\n")
+            key = digest(code)
+            code_cache[key] = [code, language]
+            output << key
+          else
+            output << line
+          end
+        end
+        output.join("\n")
+      end
+      # Caches Leanpub-style math.
+      # Leanpub uses the notation {$$}...{/$$} for both inline and block math,
+      # with the only difference being the presences of newlines:
+      #     {$$} x^2 {/$$}  % inline
+      # and
+      #     {$$}
+      #     x^2             % block
+      #     {/$$}
+      # I personally hate this notation and convention, but anyone who really
+      # cares should just use PolyTeX instead of Markdown.
+      def cache_math(text)
+        cache = {}
+        text.gsub!(/\{\$\$\}\n(.*?)\n\{\/\$\$\}/) do
+          key = digest($1)
+          cache[[:block, key]] = $1
+          key
+        end
+        text.gsub!(/\{\$\$\}(.*?)\{\/\$\$\}/) do
+          key = digest($1)
+          cache[[:inline, key]] = $1
+          key
+        end
+        cache
+      end
+      # Restores the Markdown math.
+      # This is easy because we're running everything through our LaTeX
+      # pipeline.
+      def restore_math(text, cache)
+        cache.each do |(kind, key), value|
+          case kind
+          when :inline
+            open  = '\('
+            close =  '\)'
+          when :block
+            open  = '\[' + "\n"
+            close = "\n" + '\]'
+          end
+          text.gsub!(key, open + value + close)
+        end
+        text
+      end
+    end
+    # Adds support for <<(path/to/code) inclusion.
+    def convert_code_inclusion(text)
+      text.gsub!(/^\s*<<(\(.*?\))/) { "<!-- inclusion= <<#{$1}-->" }
+    end
+    def restore_inclusion(text)
+      text.gsub(/% <!-- inclusion= (.*?)-->/) { "%= #{$1}" }
+    end
+  end
+end