RubyGems - latexmath - Versions diffs - 0.1.0 → 0.1.5 - Mend

latexmath 0.1.0 → 0.1.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33)

checksums.yaml +4 -4
data/.editorconfig +14 -0
data/.github/workflows/test.yml +80 -0
data/.gitignore +11 -0
data/.rubocop.yml +129 -0
data/Gemfile +6 -3
data/Gemfile.lock +44 -3
data/README.adoc +28 -0
data/Rakefile +93 -4
data/bin/console +3 -3
data/exe/latexmath +8 -0
data/latexmath.gemspec +17 -14
data/lib/latexmath.rb +76 -10
data/lib/latexmath/aggregator.rb +351 -0
data/lib/latexmath/constants/symbols.rb +3936 -0
data/lib/latexmath/converter.rb +424 -0
data/lib/latexmath/equation.rb +3 -30
data/lib/latexmath/ext.rb +9 -0
data/lib/latexmath/symbol.rb +21 -0
data/lib/latexmath/tokenizer.rb +82 -0
data/lib/latexmath/version.rb +1 -1
data/lib/latexmath/xml/builder.rb +4 -0
data/lib/latexmath/xml/element.rb +25 -0
data/lib/unimathsymbols.js.erb +4 -0
data/lib/unimathsymbols.txt +2864 -0
data/opal/latexmath-opal.rb +40 -0
data/opal/ox.rb +64 -0
data/opal/pseudoenumerator.rb +19 -0
metadata +74 -17
data/.travis.yml +0 -6
data/README.md +0 -40
data/lib/latexmath/latexml_requirement.rb +0 -84
data/lib/latexmath/requirement.rb +0 -12

data/bin/console CHANGED

@@ -1,7 +1,7 @@
 #!/usr/bin/env ruby
-require "bundler/setup"
-require "latexmath"
+require 'bundler/setup'
+require 'latexmath'
 # You can add fixtures and/or initialization code here to make experimenting
 # with your gem easier. You can also use a different console, if you like.
@@ -10,5 +10,5 @@ require "latexmath"
 # require "pry"
 # Pry.start
-require "irb"
+require 'irb'
 IRB.start(__FILE__)

data/exe/latexmath ADDED

@@ -0,0 +1,8 @@
+#!/usr/bin/env ruby
+require_relative '../lib/latexmath'
+latex = File.read(ARGV[0])
+tokens = Latexmath::Tokenizer.new(latex).tokenize
+aggr = Latexmath::Aggregator.new(tokens).aggregate
+puts Latexmath::Converter.new(aggr).convert

data/latexmath.gemspec CHANGED

@@ -1,31 +1,34 @@
 require_relative 'lib/latexmath/version'
 Gem::Specification.new do |spec|
-  spec.name          = "latexmath"
+  spec.name          = 'latexmath'
   spec.version       = Latexmath::VERSION
   spec.authors       = ['Ribose Inc.']
   spec.email         = ['open.source@ribose.com']
-  spec.summary       = %q{Converts LaTeX math into MathML.}
-  spec.description   = %q{Converts LaTeX math into MathML.}
-  spec.homepage      = "https://github.com/metanorma/latexmath"
-  spec.license       = "BSD-2-Clause"
+  spec.summary       = 'Converts LaTeX math into MathML.'
+  spec.description   = 'Converts LaTeX math into MathML.'
+  spec.homepage      = 'https://github.com/plurimath/latexmath'
+  spec.license       = 'BSD-2-Clause'
-  spec.required_ruby_version = Gem::Requirement.new(">= 2.3.0")
+  spec.required_ruby_version = Gem::Requirement.new('>= 2.3.0')
-  spec.metadata["homepage_uri"] = spec.homepage
-  spec.metadata["source_code_uri"] = "https://github.com/metanorma/latexmath"
-  spec.metadata["changelog_uri"] = "https://github.com/metanorma/latexmath/blob/master/CHANGELOG.md."
+  spec.metadata['homepage_uri'] = spec.homepage
+  spec.metadata['source_code_uri'] = 'https://github.com/plurimath/latexmath'
+  spec.metadata['changelog_uri'] = 'https://github.com/plurimath/latexmath/blob/master/CHANGELOG.md.'
   # Specify which files should be added to the gem when it is released.
   # The `git ls-files -z` loads the files in the RubyGem that have been added into git.
-  spec.files         = Dir.chdir(File.expand_path('..', __FILE__)) do
+  spec.files = Dir.chdir(File.expand_path(__dir__)) do
     `git ls-files -z`.split("\x0").reject { |f| f.match(%r{^(test|spec|features)/}) }
   end
-  spec.bindir        = "exe"
+  spec.bindir        = 'exe'
   spec.executables   = spec.files.grep(%r{^exe/}) { |f| File.basename(f) }
-  spec.require_paths = ["lib"]
+  spec.require_paths = ['lib']
-  spec.add_dependency "unicode2latex", "~> 0.0.1"
-  spec.add_dependency "htmlentities", "~> 4.3"
+  spec.add_dependency 'htmlentities', '~> 4.3'
+  spec.add_dependency 'ox', '~> 2.13'
+  spec.add_development_dependency 'equivalent-xml'
+  spec.add_development_dependency 'execjs'
+  spec.add_development_dependency 'opal'
 end

data/lib/latexmath.rb CHANGED

@@ -1,22 +1,88 @@
-require "latexmath/version"
-require "latexmath/latexml_requirement"
-require "latexmath/equation"
-require "htmlentities"
-require "unicode2latex"
+#require 'byebug' unless RUBY_ENGINE == 'opal'
+require 'json'
+require 'htmlentities'
+require 'ox'
+require_relative 'latexmath/ext'
+require_relative 'latexmath/version'
+require_relative 'latexmath/constants/symbols'
+require_relative 'latexmath/aggregator'
+require_relative 'latexmath/converter'
+require_relative 'latexmath/symbol'
+require_relative 'latexmath/tokenizer'
+require_relative 'latexmath/xml/element'
+require_relative 'latexmath/equation'
 module Latexmath
-  class Error < StandardError; end
-  # Your code goes here...
+  MATRICES = [
+    '\\matrix',
+    '\\matrix*',
+    '\\pmatrix',
+    '\\pmatrix*',
+    '\\bmatrix',
+    '\\bmatrix*',
+    '\\Bmatrix',
+    '\\Bmatrix*',
+    '\\vmatrix',
+    '\\vmatrix*',
+    '\\Vmatrix',
+    '\\Vmatrix*',
+    '\\array',
+    '\\split',
+    '\\substack'
+  ].freeze
+  SPACES = ['\\,', '\\:', '\\;', '\\\\'].freeze
+  STYLES = {
+    '\\bf' => 'mathbf'
+  }.freeze
-  Requirements = {
-    latexml: LatexmlRequirement.new
+  LIMITS = ['\\lim', '\\sup', '\\inf', '\\max', '\\min'].freeze
+  COMMANDS = {
+    # command: [params_count, mathml_equivalent, attributes]
+    '_' => [2, 'msub', {}],
+    '^' => [2, 'msup', {}],
+    '_^' => [3, 'msubsup', {}],
+    '\\frac' => [2, 'mfrac', {}],
+    '\\sqrt' => [1, 'msqrt', {}],
+    '\\root' => [2, 'mroot', {}],
+    '\\binom' => [2, 'mfrac', { "linethickness": '0' }],
+    '\\left' => [
+      1,
+      'mo',
+      [%w[stretchy true], %w[fence true], %w[form prefix]]
+    ],
+    '\\right' => [
+      1,
+      'mo',
+      [%w[stretchy true], %w[fence true], %w[form postfix]]
+    ],
+    '\\overline' => [1, 'mover', {}],
+    '\\bar' => [1, 'mover', {}],
+    '\\underline' => [1, 'munder', {}],
+    '\\limits' => [3, 'munderover', {}],
+    '\\overrightarrow' => [1, 'mover', {}]
   }
+  COMMANDS['\\quad'] = [0, 'mo', { "mathvariant": 'italic', separator: 'true' }]
+  COMMANDS['\\qquad'] = [0, 'mo', { "mathvariant": 'italic', separator: 'true' }]
+  SPACES.each do |space|
+    COMMANDS[space] = [0, 'mspace', { "width": '0.167em' }]
+  end
+  MATRICES.each do |matrix|
+    COMMANDS[matrix] = [1, 'mtable', {}]
+  end
+  LIMITS.each do |limit|
+    COMMANDS[limit] = [1, 'munder', {}]
+  end
   def self.parse(string)
-    lxm_input = Unicode2LaTeX.unicode2latex(HTMLEntities.new.decode(string))
+    lxm_input = HTMLEntities.new.decode(string)
     # parse
     Equation.new(lxm_input)
   end
+  class Error < StandardError; end
 end

data/lib/latexmath/aggregator.rb ADDED

@@ -0,0 +1,351 @@
+module Latexmath
+  class Aggregator
+    OPERATORS = '+-*/=[]_^{}()'.freeze
+    OPENING_BRACES = '{'.freeze
+    CLOSING_BRACES = '}'.freeze
+    OPENING_BRACKET = '['.freeze
+    CLOSING_BRACKET = ']'.freeze
+    OPENING_PARENTHESIS = '('.freeze
+    CLOSING_PARENTHESIS = ')'.freeze
+    BACKSLASH = '\\\\'.freeze
+    AMPERSAND = '&'.freeze
+    DASH = '-'.freeze
+    SUB_SUP = '_^'.freeze
+    SUBSCRIPT = '_'.freeze
+    SUPERSCRIPT = '^'.freeze
+    # Added prefix LATEX_ to avoid ruby reserved words
+    LATEX_LEFT = '\\left'.freeze
+    LATEX_RIGHT = '\\right'.freeze
+    LATEX_OVER = '\\over'.freeze
+    LATEX_HLINE = '\\hline'.freeze
+    LATEX_BEGIN = '\\begin'.freeze
+    LATEX_FRAC = '\\frac'.freeze
+    LATEX_ROOT = '\\root'.freeze
+    LATEX_SQRT = '\\sqrt'.freeze
+    def initialize(tokens)
+      @tokens = tokens
+    end
+    def aggregate(tokens = @tokens)
+      aggregated = []
+      loop do
+        begin
+          token = next_item_or_group(tokens)
+          raise StopIteration if token.nil?
+          if token.is_a?(Array)
+            aggregated << token
+          elsif token == OPENING_BRACKET
+            previous = nil
+            previous = aggregated[-1] if aggregated.any?
+            begin
+              g = group(tokens, opening: OPENING_BRACKET, closing: CLOSING_BRACKET)
+              if previous == LATEX_SQRT
+                root = tokens.shift
+                raise StopIteration if root.nil?
+                if root == OPENING_BRACES
+                  begin
+                    root = group(tokens)
+                  rescue EmptyGroupError
+                    root = ''
+                  end
+                end
+                aggregated[-1] = LATEX_ROOT
+                aggregated << root
+              end
+              aggregated << g
+            rescue EmptyGroupError
+              next if previous == LATEX_SQRT
+              aggregated += [OPENING_BRACKET, CLOSING_BRACKET]
+            end
+          elsif LIMITS.include?(token)
+            raise StopIteration if tokens.shift.nil?
+            a = next_item_or_group(tokens)
+            aggregated += [token, a]
+          elsif token == '\\limits'
+            previous = aggregated.pop
+            raise StopIteration if tokens.shift.nil?
+            a = next_item_or_group(tokens)
+            raise StopIteration if tokens.shift.nil?
+            b = next_item_or_group(tokens)
+            aggregated += [token, previous, a, b]
+          elsif token && SUB_SUP.include?(token)
+            aggregated = process_sub_sup(aggregated, token, tokens)
+          elsif token.start_with?(LATEX_BEGIN) || MATRICES.include?(token)
+            aggregated += environment(token, tokens)
+          elsif token == LATEX_OVER
+            numerator = aggregated
+            aggregated = []
+            aggregated << LATEX_FRAC
+            aggregated << numerator
+            aggregated << aggregate(tokens)
+          else
+            aggregated << token
+          end
+        rescue EmptyGroupError
+          aggregated += [OPENING_BRACES, CLOSING_BRACES]
+          next
+        rescue StopIteration
+          aggregated << token unless token.nil?
+          break
+        end
+      end
+      aggregated
+    end
+    def environment(token, tokens)
+      env = if token.start_with?(LATEX_BEGIN)
+              token[7..-2]
+            else
+              token[1..token.size]
+      end
+      alignment = nil
+      content = []
+      row = []
+      has_rowline = false
+      loop do
+        begin
+          token = next_item_or_group(tokens)
+          raise StopIteration if token.nil?
+          if token.is_a? Array
+            begin
+              if env == 'array' && token.all? { |x| 'lcr|'.include?(x) }
+                alignment = token
+              else
+                row << process_row(token)
+              end
+            rescue TypeError
+              row << token
+            end
+          elsif token == "\\end{#{env}}"
+            break
+          elsif token == AMPERSAND
+            row << token
+          elsif token == BACKSLASH
+            row = group_columns(row) if row.include?(AMPERSAND)
+            row.insert(0, LATEX_HLINE) if has_rowline
+            content << row
+            row = []
+            has_rowline = false
+          elsif token == LATEX_HLINE
+            has_rowline = true
+          elsif token == OPENING_BRACKET && content.empty?
+            begin
+              alignment = group(tokens, opening: OPENING_BRACKET, closing: CLOSING_BRACKET)
+            rescue EmptyGroupError
+              next
+            end
+          elsif token == DASH
+            next_token = tokens.shift
+            raise StopIteration if next_token.nil?
+            row << if next_token == "\\end{#{env}}"
+                    token
+                  else
+                    [token, next_token]
+                  end
+          elsif SUB_SUP.include?(token)
+            row = process_sub_sup(row, token, tokens)
+          elsif token.start_with?(LATEX_BEGIN)
+            row += environment(token, tokens)
+          else
+            row << token
+          end
+        rescue EmptyGroupError
+          row << []
+          next
+        rescue StopIteration
+          break
+        end
+      end
+      if row.any?
+        row = group_columns(row) if row.include?(AMPERSAND)
+        row.insert(0, LATEX_HLINE) if has_rowline
+        content << row
+      end
+      content = content.pop while content.size == 1 && content.first.is_a?(Array)
+      return ["\\#{env}", alignment.join, content] if alignment
+      ["\\#{env}", content]
+    end
+    def group(tokens, opening: OPENING_BRACES, closing: CLOSING_BRACES, delimiter: nil)
+      g = []
+      if delimiter
+        g << delimiter
+        g << tokens.shift
+      end
+      loop do
+        begin
+          token = tokens.shift
+          raise StopIteration if token.nil?
+          if token == closing && delimiter.nil?
+            break if g.any?
+            raise EmptyGroupError
+          elsif token == opening
+            begin
+              g << group(tokens)
+            rescue EmptyGroupError
+              g += [[]]
+            end
+          elsif token == LATEX_LEFT
+            g << group(tokens, delimiter: token)
+          elsif token == LATEX_RIGHT
+            g << token
+            _token = tokens.shift
+            raise StopIteration if _token.nil?
+            g << _token
+            break
+          else
+            g << token
+          end
+        rescue StopIteration
+          break
+        end
+      end
+      if delimiter
+        right = g.index(LATEX_RIGHT)
+        raise ExtraLeftOrMissingRight if right.nil?
+        content = g[2..right - 1]
+        g_ = g
+        g_ = g[0..1] + [aggregate(content)] + g[right..g.size] if content.any?
+        return g_
+      end
+      aggregate(g)
+    end
+    def group_columns(row)
+      grouped = [[]]
+      row.each do |item|
+        if item == AMPERSAND
+          grouped << []
+        else
+          grouped[-1] << item
+        end
+      end
+      grouped.map { |item| item.size > 1 ? item : item.pop }
+    end
+    def next_item_or_group(tokens)
+      token = tokens.shift
+      raise StopIteration if token.nil?
+      return group(tokens) if token == OPENING_BRACES
+      return group(tokens, delimiter: token) if token == LATEX_LEFT
+      token
+    end
+    def find_opening_parenthesis(tokens)
+      closing = 0
+      tokens.map.with_index { |x, i| [i, x] }.reverse.each do |index, token|
+        if token == CLOSING_PARENTHESIS
+          closing += 1
+        elsif token == OPENING_PARENTHESIS
+          return index if closing == 0
+          closing -= 1
+        end
+      end
+      raise ExtraLeftOrMissingRight
+    end
+    def process_row(tokens)
+      row = []
+      content = []
+      tokens.each do |token|
+        if token == AMPERSAND
+          next
+        elsif token == BACKSLASH
+          content << row if row.any?
+          row = []
+        else
+          row << token
+        end
+      end
+      content << row if row.any?
+      content = content.pop while content.size == 1 && content.first.is_a?(Array)
+      content
+    end
+    def process_sub_sup(aggregated, token, tokens)
+      begin
+        previous = aggregated.pop
+        raise IndexError if previous.nil?
+        if previous.is_a?(String) && OPERATORS.include?(previous)
+          if (previous == CLOSING_PARENTHESIS) && aggregated.include?(OPENING_PARENTHESIS)
+            index = find_opening_parenthesis(aggregated)
+            aggregated = aggregated[0, index] + [token] + [aggregated[index..aggregated.size] + [previous]]
+          else
+            aggregated += [previous, token]
+          end
+          return aggregated
+        end
+        begin
+          next_token = next_item_or_group(tokens)
+          if aggregated.size >= 2
+            if aggregated[-2] == SUBSCRIPT && token == SUPERSCRIPT
+              aggregated[-2] = SUB_SUP
+              aggregated += [previous, next_token]
+            elsif (aggregated[-2] == SUPERSCRIPT) && (token == SUBSCRIPT)
+              aggregated[-2] = SUB_SUP
+              aggregated += [next_token, previous]
+            else
+              aggregated += [token, previous, next_token]
+            end
+          else
+            aggregated += [token, previous, next_token]
+          end
+        rescue EmptyGroupError
+          aggregated += [token, previous, []]
+        end
+      rescue IndexError
+        next_token = next_item_or_group(tokens)
+        aggregated += [token, '', next_token]
+      end
+      aggregated
+    end
+  end
+  class EmptyGroupError < StandardError; end
+  class ExtraLeftOrMissingRight < StandardError; end
+  class MissingSuperScriptOrSubscript < StandardError; end
+  class StopIteration < StandardError; end
+end