RubyGems - latexmath - Versions diffs - 0.1.0 → 0.1.1 - Mend

latexmath 0.1.0 → 0.1.1

Files changed (32) hide show

checksums.yaml +4 -4
data/.editorconfig +14 -0
data/.github/workflows/test.yml +80 -0
data/.gitignore +10 -0
data/.rubocop.yml +132 -0
data/Gemfile +6 -3
data/Gemfile.lock +44 -3
data/README.adoc +28 -0
data/Rakefile +29 -3
data/bin/console +3 -3
data/exe/latexmath +8 -0
data/latexmath.gemspec +17 -14
data/lib/latexmath.rb +80 -10
data/lib/latexmath/aggregator.rb +351 -0
data/lib/latexmath/converter.rb +421 -0
data/lib/latexmath/equation.rb +3 -30
data/lib/latexmath/ext.rb +9 -0
data/lib/latexmath/latexml_requirement.rb +11 -12
data/lib/latexmath/requirement.rb +2 -3
data/lib/latexmath/symbol.rb +43 -0
data/lib/latexmath/tokenizer.rb +81 -0
data/lib/latexmath/version.rb +1 -1
data/lib/latexmath/xml/builder.rb +4 -0
data/lib/latexmath/xml/element.rb +25 -0
data/lib/unimathsymbols.js.erb +4 -0
data/lib/unimathsymbols.txt +2864 -0
data/opal/latexmath-opal.rb +40 -0
data/opal/ox.rb +64 -0
data/opal/pseudoenumerator.rb +19 -0
metadata +73 -15
data/.travis.yml +0 -6
data/README.md +0 -40

@@ -1,22 +1,92 @@
-require "latexmath/version"
-require "latexmath/latexml_requirement"
-require "latexmath/equation"
-require "htmlentities"
-require "unicode2latex"
+require 'byebug' unless RUBY_ENGINE == 'opal'
+require 'json'
+require 'htmlentities'
+require 'ox'
+require_relative 'latexmath/ext'
+require_relative 'latexmath/version'
+#require_relative 'latexmath/latexml_requirement'
+require_relative 'latexmath/aggregator'
+require_relative 'latexmath/converter'
+require_relative 'latexmath/symbol'
+require_relative 'latexmath/tokenizer'
+require_relative 'latexmath/xml/element'
+require_relative 'latexmath/equation'
 module Latexmath
-  class Error < StandardError; end
-  # Your code goes here...
+  MATRICES = [ # Matrix-like commands; each is registered in COMMANDS below as 'mtable' with one parameter.
+    '\\matrix',
+    '\\matrix*',
+    '\\pmatrix',
+    '\\pmatrix*',
+    '\\bmatrix',
+    '\\bmatrix*',
+    '\\Bmatrix',
+    '\\Bmatrix*',
+    '\\vmatrix',
+    '\\vmatrix*',
+    '\\Vmatrix',
+    '\\Vmatrix*',
+    '\\array',
+    '\\split',
+    '\\substack'
+  ].freeze
-  Requirements = {
-    latexml: LatexmlRequirement.new
+  SPACES = ['\\,', '\\:', '\\;', '\\\\'].freeze # Each is registered in COMMANDS below as 'mspace' with width 0.167em.
+  STYLES = {
+    '\\bf' => 'mathbf'
+  }.freeze
+  LIMITS = ['\\lim', '\\sup', '\\inf', '\\max', '\\min'].freeze # Each is registered in COMMANDS below as 'munder' with one parameter.
+  COMMANDS = { # Not frozen: the statements after this literal add further entries.
+    # command: [params_count, mathml_equivalent, attributes]
+    '_' => [2, 'msub', {}],
+    '^' => [2, 'msup', {}],
+    '_^' => [3, 'msubsup', {}],
+    '\\frac' => [2, 'mfrac', {}],
+    '\\sqrt' => [1, 'msqrt', {}],
+    '\\root' => [2, 'mroot', {}],
+    '\\binom' => [2, 'mfrac', { "linethickness": '0' }], # "linethickness": is a Symbol key (:linethickness)
+    '\\left' => [ # NOTE(review): attributes are an array of pairs here but a hash elsewhere - confirm the consumer accepts both
+      1,
+      'mo',
+      [%w[stretchy true], %w[fence true], %w[form prefix]]
+    ],
+    '\\right' => [
+      1,
+      'mo',
+      [%w[stretchy true], %w[fence true], %w[form postfix]]
+    ],
+    '\\overline' => [1, 'mover', {}],
+    '\\bar' => [1, 'mover', {}],
+    '\\underline' => [1, 'munder', {}],
+    '\\limits' => [3, 'munderover', {}],
+    '\\overrightarrow' => [1, 'mover', {}]
   }
+  COMMANDS['\\quad'] = [0, 'mo', { "mathvariant": 'italic', separator: 'true' }]
+  COMMANDS['\\qquad'] = [0, 'mo', { "mathvariant": 'italic', separator: 'true' }]
+  SPACES.each do |space| # NOTE(review): every spacing command gets the same width, including '\\\\' - confirm intended
+    COMMANDS[space] = [0, 'mspace', { "width": '0.167em' }]
+  end
+  MATRICES.each do |matrix|
+    COMMANDS[matrix] = [1, 'mtable', {}]
+  end
+  LIMITS.each do |limit|
+    COMMANDS[limit] = [1, 'munder', {}]
+  end
+  Requirements = { # Empty now that the latexml entry is commented out.
+    #latexml: LatexmlRequirement.new
+  }.freeze
   def self.parse(string)
-    lxm_input = Unicode2LaTeX.unicode2latex(HTMLEntities.new.decode(string))
+    lxm_input = HTMLEntities.new.decode(string) # Only HTML entities are decoded; the unicode2latex step is gone.
     # parse
     Equation.new(lxm_input)
   end
+  class Error < StandardError; end # StandardError subclass in the Latexmath namespace.
 end

data/lib/latexmath/aggregator.rb ADDED

@@ -0,0 +1,351 @@
+module Latexmath
+  class Aggregator
+    OPERATORS = '+-*/=[]_^{}()'.freeze # Used as a character set: process_sub_sup calls include? on it.
+    OPENING_BRACES = '{'.freeze
+    CLOSING_BRACES = '}'.freeze
+    OPENING_BRACKET = '['.freeze
+    CLOSING_BRACKET = ']'.freeze
+    OPENING_PARENTHESIS = '('.freeze
+    CLOSING_PARENTHESIS = ')'.freeze
+    BACKSLASH = '\\\\'.freeze # Two backslash characters; #environment and #process_row treat it as the end of a row.
+    AMPERSAND = '&'.freeze
+    DASH = '-'.freeze
+    SUB_SUP = '_^'.freeze # Both a character set for include? checks and the combined sub+superscript marker.
+    SUBSCRIPT = '_'.freeze
+    SUPERSCRIPT = '^'.freeze
+    # Added prefix LATEX_ to avoid ruby reserved words
+    LATEX_LEFT = '\\left'.freeze
+    LATEX_RIGHT = '\\right'.freeze
+    LATEX_OVER = '\\over'.freeze
+    LATEX_HLINE = '\\hline'.freeze
+    LATEX_BEGIN = '\\begin'.freeze # Matched with start_with?, so it covers tokens such as "\\begin{matrix}".
+    LATEX_FRAC = '\\frac'.freeze
+    LATEX_ROOT = '\\root'.freeze
+    LATEX_SQRT = '\\sqrt'.freeze
+    def initialize(tokens) # tokens: the collection #aggregate consumes by default; it is read with #shift.
+      @tokens = tokens
+    end
+    def aggregate(tokens = @tokens) # Folds the flat token stream into a nested array; shifts tokens off the input as it goes.
+      aggregated = []
+      loop do
+        begin
+          token = next_item_or_group(tokens)
+          raise StopIteration if token.nil? # defensive: next_item_or_group itself raises when tokens run out
+          if token.is_a?(Array) # a nested group is appended whole
+            aggregated << token
+          elsif token == OPENING_BRACKET
+            previous = nil
+            previous = aggregated[-1] if aggregated.any?
+            begin
+              g = group(tokens, opening: OPENING_BRACKET, closing: CLOSING_BRACKET)
+              if previous == LATEX_SQRT # \sqrt[...]: becomes \root, then the following item, then the bracket group
+                root = tokens.shift
+                raise StopIteration if root.nil?
+                if root == OPENING_BRACES
+                  begin
+                    root = group(tokens)
+                  rescue EmptyGroupError
+                    root = '' # \sqrt[n]{} keeps an empty string as the following item
+                  end
+                end
+                aggregated[-1] = LATEX_ROOT
+                aggregated << root
+              end
+              aggregated << g
+            rescue EmptyGroupError
+              next if previous == LATEX_SQRT # an empty [] right after \sqrt is dropped
+              aggregated += [OPENING_BRACKET, CLOSING_BRACKET] # otherwise the empty brackets are kept as two tokens
+            end
+          elsif LIMITS.include?(token)
+            raise StopIteration if tokens.shift.nil? # discards the token after the operator (presumably '_' - confirm)
+            a = next_item_or_group(tokens)
+            aggregated += [token, a]
+          elsif token == '\\limits'
+            previous = aggregated.pop # \limits takes the item collected just before it as its first operand
+            raise StopIteration if tokens.shift.nil? # discards one token before each operand (presumably '_' / '^' - confirm)
+            a = next_item_or_group(tokens)
+            raise StopIteration if tokens.shift.nil?
+            b = next_item_or_group(tokens)
+            aggregated += [token, previous, a, b]
+          elsif token && SUB_SUP.include?(token)
+            aggregated = process_sub_sup(aggregated, token, tokens)
+          elsif token.start_with?(LATEX_BEGIN) || MATRICES.include?(token)
+            aggregated += environment(token, tokens)
+          elsif token == LATEX_OVER # a \over b: everything collected so far is the numerator
+            numerator = aggregated
+            aggregated = []
+            aggregated << LATEX_FRAC
+            aggregated << numerator
+            aggregated << aggregate(tokens) # the rest of the stream becomes the denominator
+          else
+            aggregated << token
+          end
+        rescue EmptyGroupError # an empty {} is kept as two literal brace tokens
+          aggregated += [OPENING_BRACES, CLOSING_BRACES]
+          next
+        rescue StopIteration # Latexmath::StopIteration, not the core class, so Kernel#loop does not swallow it
+          aggregated << token unless token.nil? # keep the current token if one had already been read
+          break
+        end
+      end
+      aggregated
+    end
+    def environment(token, tokens) # Reads an environment/matrix body from tokens; returns ["\\env", content] or ["\\env", alignment, content].
+      env = if token.start_with?(LATEX_BEGIN)
+              token[7..-2] # drops the first 7 characters ("\begin{") and the last one
+            else
+              token[1..token.size] # drops the leading backslash
+      end
+      alignment = nil
+      content = []
+      row = []
+      has_rowline = false
+      loop do
+        begin
+          token = next_item_or_group(tokens)
+          raise StopIteration if token.nil?
+          if token.is_a? Array
+            begin
+              if env == 'array' && token.all? { |x| 'lcr|'.include?(x) } # every element is a substring of 'lcr|': column spec
+                alignment = token
+              else
+                row << process_row(token)
+              end
+            rescue TypeError # include? was given a non-String element, so the group is ordinary content
+              row << token
+            end
+          elsif token == "\\end{#{env}}"
+            break
+          elsif token == AMPERSAND
+            row << token
+          elsif token == BACKSLASH # end of row
+            row = group_columns(row) if row.include?(AMPERSAND)
+            row.insert(0, LATEX_HLINE) if has_rowline # an \hline seen since the last row goes at the front of this row
+            content << row
+            row = []
+            has_rowline = false
+          elsif token == LATEX_HLINE
+            has_rowline = true
+          elsif token == OPENING_BRACKET && content.empty? # a [...] before any completed row is read as the alignment
+            begin
+              alignment = group(tokens, opening: OPENING_BRACKET, closing: CLOSING_BRACKET)
+            rescue EmptyGroupError
+              next
+            end
+          elsif token == DASH
+            next_token = tokens.shift
+            raise StopIteration if next_token.nil?
+            row << if next_token == "\\end{#{env}}" # NOTE(review): the \end token is consumed here but the loop does not break - confirm intended
+                    token
+                  else
+                    [token, next_token]
+                  end
+          elsif SUB_SUP.include?(token)
+            row = process_sub_sup(row, token, tokens)
+          elsif token.start_with?(LATEX_BEGIN)
+            row += environment(token, tokens)
+          else
+            row << token
+          end
+        rescue EmptyGroupError # an empty {} becomes an empty cell
+          row << []
+          next
+        rescue StopIteration # input ended without \end{env}: keep what was read
+          break
+        end
+      end
+      if row.any? # flush the last row, which has no trailing row separator
+        row = group_columns(row) if row.include?(AMPERSAND)
+        row.insert(0, LATEX_HLINE) if has_rowline
+        content << row
+      end
+      content = content.pop while content.size == 1 && content.first.is_a?(Array) # unwrap single-element nesting
+      return ["\\#{env}", alignment.join, content] if alignment
+      ["\\#{env}", content]
+    end
+    def group(tokens, opening: OPENING_BRACES, closing: CLOSING_BRACES, delimiter: nil) # Collects one group from tokens and returns it aggregated.
+      g = []
+      if delimiter # \left mode: the group starts with \left and the token that follows it
+        g << delimiter
+        g << tokens.shift
+      end
+      loop do
+        begin
+          token = tokens.shift
+          raise StopIteration if token.nil?
+          if token == closing && delimiter.nil? # in \left mode the closing token is ordinary content
+            break if g.any?
+            raise EmptyGroupError # closing token met before any content
+          elsif token == opening
+            begin
+              g << group(tokens) # NOTE(review): nested groups always use the default braces, even when opening is '[' - confirm
+            rescue EmptyGroupError
+              g += [[]]
+            end
+          elsif token == LATEX_LEFT
+            g << group(tokens, delimiter: token)
+          elsif token == LATEX_RIGHT # keep \right and the token after it, then finish
+            g << token
+            _token = tokens.shift
+            raise StopIteration if _token.nil?
+            g << _token
+            break
+          else
+            g << token
+          end
+        rescue StopIteration # input ran out: the group ends with what was collected
+          break
+        end
+      end
+      if delimiter
+        right = g.index(LATEX_RIGHT)
+        raise ExtraLeftOrMissingRight if right.nil?
+        content = g[2..right - 1] # everything between the opening delimiter and \right
+        g_ = g
+        g_ = g[0..1] + [aggregate(content)] + g[right..g.size] if content.any? # aggregate only the inner content
+        return g_
+      end
+      aggregate(g)
+    end
+    def group_columns(row)
+      grouped = [[]]
+      row.each do |item|
+        if item == AMPERSAND
+          grouped << []
+        else
+          grouped[-1] << item
+        end
+      end
+      grouped.map { |item| item.size > 1 ? item : item.pop }
+    end
+    def next_item_or_group(tokens)
+      token = tokens.shift
+      raise StopIteration if token.nil?
+      return group(tokens) if token == OPENING_BRACES
+      return group(tokens, delimiter: token) if token == LATEX_LEFT
+      token
+    end
+    def find_opening_parenthesis(tokens)
+      closing = 0
+      tokens.map.with_index { |x, i| [i, x] }.reverse.each do |index, token|
+        if token == CLOSING_PARENTHESIS
+          closing += 1
+        elsif token == OPENING_PARENTHESIS
+          return index if closing == 0
+          closing -= 1
+        end
+      end
+      raise ExtraLeftOrMissingRight
+    end
+    def process_row(tokens)
+      row = []
+      content = []
+      tokens.each do |token|
+        if token == AMPERSAND
+          next
+        elsif token == BACKSLASH
+          content << row if row.any?
+          row = []
+        else
+          row << token
+        end
+      end
+      content << row if row.any?
+      content = content.pop while content.size == 1 && content.first.is_a?(Array)
+      content
+    end
+    def process_sub_sup(aggregated, token, tokens)
+      begin
+        previous = aggregated.pop
+        raise IndexError if previous.nil?
+        if previous.is_a?(String) && OPERATORS.include?(previous)
+          if (previous == CLOSING_PARENTHESIS) && aggregated.include?(OPENING_PARENTHESIS)
+            index = find_opening_parenthesis(aggregated)
+            aggregated = aggregated[0, index] + [token] + [aggregated[index..aggregated.size] + [previous]]
+          else
+            aggregated += [previous, token]
+          end
+          return aggregated
+        end
+        begin
+          next_token = next_item_or_group(tokens)
+          if aggregated.size >= 2
+            if aggregated[-2] == SUBSCRIPT && token == SUPERSCRIPT
+              aggregated[-2] = SUB_SUP
+              aggregated += [previous, next_token]
+            elsif (aggregated[-2] == SUPERSCRIPT) && (token == SUBSCRIPT)
+              aggregated[-2] = SUB_SUP
+              aggregated += [next_token, previous]
+            else
+              aggregated += [token, previous, next_token]
+            end
+          else
+            aggregated += [token, previous, next_token]
+          end
+        rescue EmptyGroupError
+          aggregated += [token, previous, []]
+        end
+      rescue IndexError
+        next_token = next_item_or_group(tokens)
+        aggregated += [token, '', next_token]
+      end
+      aggregated
+    end
+  end
+  class EmptyGroupError < StandardError; end # Raised by Aggregator#group when the closing token arrives before any content.
+  class ExtraLeftOrMissingRight < StandardError; end # Raised when a \left group has no \right, or a ')' has no matching '('.
+  class MissingSuperScriptOrSubscript < StandardError; end # Not raised anywhere within this file.
+  class StopIteration < StandardError; end # Latexmath::StopIteration, separate from Ruby's core StopIteration; signals that tokens ran out.
+end