RubyGems - markup_parser - Versions diffs - 0.0.1 - Mend

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

data/.gitignore +17 -0
data/Gemfile +4 -0
data/Rakefile +2 -0
data/lib/markup_parser.rb +11 -0
data/lib/markup_parser/default.rb +109 -0
data/lib/markup_parser/html.rb +13 -0
data/lib/markup_parser/markdown.rb +116 -0
data/lib/markup_parser/rdoc.rb +26 -0
data/lib/markup_parser/version.rb +3 -0
data/markup_parser.gemspec +19 -0
metadata +69 -0

data/.gitignore ADDED Viewed

@@ -0,0 +1,17 @@
+*.gem
+*.rbc
+.bundle
+.config
+.yardoc
+Gemfile.lock
+InstalledFiles
+_yardoc
+coverage
+doc/
+lib/bundler/man
+pkg
+rdoc
+spec/reports
+test/tmp
+test/version_tmp
+tmp

data/Gemfile ADDED Viewed

@@ -0,0 +1,4 @@
+# Fetch gems over TLS; the plain-http endpoint allows tampering in transit.
+source 'https://rubygems.org'
+# Specify your gem's dependencies in markup_parser.gemspec
+gemspec

data/Rakefile ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ #!/usr/bin/env rake
2	+ require "bundler/gem_tasks"

data/lib/markup_parser.rb ADDED Viewed

@@ -0,0 +1,11 @@
+require "markup_parser/version"
+module MarkupParser
+  puts "\n**************\nMarkupParser loaded\n**************\n"
+  self.parser_path = File.join(File.dirname(__FILE__), 'markup_parser')
+  def self.parsers
+    @parsers ||= Dir.glob( File.join(@parser_path, '*.rb') ).collect {|f| File.basename(f, '.rb') } - ["default"]
+  end
+end

data/lib/markup_parser/default.rb ADDED Viewed

@@ -0,0 +1,109 @@
+module MarkupParser
+  class Default
+    puts "\n**************\nMarkupParser::Default loaded\n**************\n"
+    attr_reader :original_text, :nokoguri_parser, :html_text, :lexer_proc
+    def initialize(text='', &lexer)
+      @original_text = hot_fixes(text)
+      @lexer_proc = lexer || default_lexer
+    end
+    # Returns the fully stylized and sanitized HTML
+    def to_html
+      begin
+        nokoguri_parser.to_xhtml(:save_with => Nokogiri::XML::Node::SaveOptions::AS_XHTML)
+      rescue => e
+        puts "
+        \n******************
+        Error in #{self.class}#to_html.
+        Reason: #{e.message}.
+        Putting error message into the output.
+        ******************\n"
+        return "<p class='parse_error'>Error in parsing in #{self.class}: #{e.message}.</p>"
+      end
+    end
+    # Instantiates a Nokoguri::HTML fragment parser
+    def nokoguri_parser
+      begin
+        @nokoguri_parser ||= Nokogiri::HTML::DocumentFragment.parse(html_text)
+      rescue => e
+        puts "
+        \n******************
+        Error in #{self.class}#nokoguri_parser.
+        Reason: #{e.message}.
+        Putting error message into the output.
+        ******************\n"
+        @nokoguri_parser = Nokogiri::HTML::DocumentFragment.parse("<p class='parse_error'>Error in parsing in #{self.class}: #{e.message}.</p>")
+      end
+    end
+    # Instantiates the html_text via this markup parser
+    def html_text
+      begin
+        @html_text ||= parse(@original_text)
+      rescue => e
+          puts "
+          \n******************
+          Error in #{self.class}#html_text.
+          Reason: #{e.message}.
+          Putting error message into the output.
+          ******************\n"
+          @html_text = "<p class='parse_error'>Error in parsing in #{self.class}: #{e.message}.</p>"
+      end
+    end
+    # Stylizes the code blocks in the html_text.
+    # Uses either a passed in lexer Proc or the default_lexer
+    def stylize_code_blocks
+        nokoguri_parser.search('pre').each do |node|
+          begin
+            next unless lang = node['lang']
+            text = node.inner_text
+            html = @lexer_proc.call(text, lang)
+            node.replace(html)
+          rescue => e
+            puts "
+            \n******************
+            Error in parsing <pre lang=''> block.
+            Reason: #{e.message}.
+            Continueing code block parsing.
+            ******************\n"
+          end
+        end
+      self
+    end
+    private
+    # Default Lexer Proc
+    def default_lexer
+      Proc.new {|code, lang| Uv.parse(code, "xhtml", lang, false, "railscasts") }
+    end
+    ######################################################################
+    # TO BE OVERRIDDEN
+    # Markup specific Parser invokation
+    def parse(text)
+      text
+    end
+    # Performs hotfixes on a per-markup basis
+    def hot_fixes(text)
+      text
+    end
+    ######################################################################
+  end
+end

data/lib/markup_parser/html.rb ADDED Viewed

@@ -0,0 +1,13 @@
+module MarkupParser
+  class Html < MarkupParser::Default
+    puts "\n**************\nMarkupParser::Html loaded\n**************\n"
+    private
+    # Performs my html hotfixes
+    def hot_fixes(text)
+      text
+    end
+  end
+end

data/lib/markup_parser/markdown.rb ADDED Viewed

@@ -0,0 +1,116 @@
+module MarkupParser
+  class Markdown < MarkupParser::Default
+    puts "\n**************\nMarkupParser::Markdown loaded\n**************\n"
+    # HTML renderer with Ultraviolet Code Lexer
+    class UvHtmlRender < Redcarpet::Render::HTML
+      puts "\n**************\nMarkupParser::Markdown::UvHtmlRender loaded\n**************\n"
+      def block_code(code, language)
+        Uv.parse(code, "xhtml", language, false, "railscasts")
+      end
+    end
+    # Only loads the Markdown parser once
+    def self.html_parser_with_code_lexer
+      @@html_parser_with_code_lexer ||= Redcarpet::Markdown.new(UvHtmlRender, OPTIONS)
+    end
+    # Only loads the Markdown parser once
+    def self.html_parser
+      @@parser_with_code_blocks ||= Redcarpet::Markdown.new(Redcarpet::Render::HTML, OPTIONS)
+    end
+    # Selected Markdown Options
+    OPTIONS = {
+      autolink: true, #parse links even when they are not enclosed in `<>` characters. Autolinks for the http, https and ftp
+                 #protocols will be automatically detected. Email addresses are also handled, and http links without protocol, but
+                 #starting with `www.`
+      no_intraemphasis: true, #will stop underscores within words from being treated as the start or end of emphasis blocks
+                        #and will therefore stop Ruby method or variable names with underscores in them from triggering the emphasis
+      lax_html_blocks: true,  #HTML blocks do not require to be surrounded by an empty line as in the Markdown standard.
+      strikethrough: true, #parse strikethrough, PHP-Markdown style Two `~` characters mark the start of a strikethrough, e.g. `this is ~~good~~ bad`
+      fenced_code_blocks: true, #renders fenced code (```) and (~~~)
+      tables: true, #parse tables, PHP-Markdown style
+    }
+    # Returns the fully stylized HTML for this markdown text
+    def html_text
+      @html_text ||= parser.render(@original_text)
+    end
+    # Sets the parser to include as code lexer
+    def stylize_code_blocks
+      @parser = Markdown.html_parser_with_code_lexer
+      self
+    end
+    private
+    # Instantiates the parser for this Markdown instance.
+    # Defaults to @@html_parser
+    def parser
+      @parser ||= Markdown.html_parser
+    end
+    # Hacks parse to return this instence's parser for a later call
+    def parse(text)
+      parser
+    end
+    # Performs my markdown hotfixes
+    def hot_fixes(text)
+      text.standardize_newlines!
+      text.convert_tabs_to_spaces!
+      text.correct_gh_code_syntax!
+      text
+    end
+  end
+end
+# Adds classes to String class...
+class String
+  # Corrects the gh code block syntax mistake where one would write '~~~ .ruby'
+  # and the correct code should be '~~~ruby'
+  def correct_gh_code_syntax!
+    self.gsub!(/~~~\s\.([a-zA-Z]*)/, '~~~\1')
+  end
+  # Corrects the ol list elements: which only except the syntax: '1. ...'.
+  # Corrected syntaxes: '1)'
+  def correct_ol_list_parenth!
+    self.gsub!(/(\s*)(\d)\)/,'\1\2.')
+  end
+  # Converts tabs (\t) to 2 spaces
+  def convert_tabs_to_spaces!
+    self.gsub!(/\t/, "  ")
+  end
+  # Standardize line endings
+  def standardize_newlines!
+    self.gsub!("\r\n", "\n")
+    self.gsub!("\r", "\n")
+  end
+  # Corrects the newlines by stripping the leading whitespace.
+  # NOTE: this is a hack to workaround the strange Gollum editor indentation behavior
+  def sub_newlines!
+    self.gsub!(/([\r\n|\n])[\ ]*(.)/,'\1\2')
+  end
+end

data/lib/markup_parser/rdoc.rb ADDED Viewed

@@ -0,0 +1,26 @@
+require 'rdoc/markup/to_html'
+module MarkupParser
+  class Rdoc < MarkupParser::Default
+    puts "\n**************\nMarkupParser::Rdoc loaded\n**************\n"
+    private
+    # Returns the fully stylized HTML for this text
+    # Forces UTF-8 encoding since Rdoc seems to return ASCII-8BIT
+    def parse(text)
+      Rdoc.parser.convert(text).force_encoding("UTF-8")
+    end
+    # Memorized Parser
+    def self.parser
+      @@parser ||= RDoc::Markup::ToHtml.new
+    end
+    # Performs my rdoc hotfixes
+    def hot_fixes(text)
+      text
+    end
+  end
+end

data/lib/markup_parser/version.rb ADDED Viewed

@@ -0,0 +1,3 @@
+module MarkupParser
+  # Gem version string; read by markup_parser.gemspec as MarkupParser::VERSION.
+  VERSION = "0.0.1"
+end

data/markup_parser.gemspec ADDED Viewed

@@ -0,0 +1,19 @@
+# -*- encoding: utf-8 -*-
+require File.expand_path('../lib/markup_parser/version', __FILE__)
+Gem::Specification.new do |gem|
+  gem.authors       = ["Quinn"]
+  gem.email         = ["chaffeqa@gmail.com"]
+  gem.description   = %q{Standardized markup parsers to use a single format: an object.  Instantiate a specific markup class with text to output formated Html.  Allows for easy code block highlighting using a Proc; defaults to Uv (ruby Ultraviolet)}
+  gem.summary       = %q{Standardized markup parsers to a single format.  Sole use is for converting markup text to Html. }
+  gem.homepage      = "https://github.com/chaffeqa/markup_parser"
+  gem.executables   = `git ls-files -- bin/*`.split("\n").map{ |f| File.basename(f) }
+  gem.files         = `git ls-files`.split("\n")
+  gem.test_files    = `git ls-files -- {test,spec,features}/*`.split("\n")
+  gem.name          = "markup_parser"
+  gem.require_paths = ["lib"]
+  gem.version       = MarkupParser::VERSION
+  gem.add_dependency "uv"
+end

metadata ADDED Viewed

@@ -0,0 +1,69 @@
+--- !ruby/object:Gem::Specification
+name: markup_parser
+version: !ruby/object:Gem::Version
+  version: 0.0.1
+  prerelease:
+platform: ruby
+authors:
+- Quinn
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2011-09-28 00:00:00.000000000 Z
+dependencies:
+- !ruby/object:Gem::Dependency
+  name: uv
+  requirement: &70102402385260 !ruby/object:Gem::Requirement
+    none: false
+    requirements:
+    - - ! '>='
+      - !ruby/object:Gem::Version
+        version: '0'
+  type: :runtime
+  prerelease: false
+  version_requirements: *70102402385260
+description: ! 'Standardized markup parsers to use a single format: an object.  Instantiate
+  a specific markup class with text to output formated Html.  Allows for easy code
+  block highlighting using a Proc; defaults to Uv (ruby Ultraviolet)'
+email:
+- chaffeqa@gmail.com
+executables: []
+extensions: []
+extra_rdoc_files: []
+files:
+- .gitignore
+- Gemfile
+- Rakefile
+- lib/markup_parser.rb
+- lib/markup_parser/default.rb
+- lib/markup_parser/html.rb
+- lib/markup_parser/markdown.rb
+- lib/markup_parser/rdoc.rb
+- lib/markup_parser/version.rb
+- markup_parser.gemspec
+homepage: https://github.com/chaffeqa/markup_parser
+licenses: []
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  none: false
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0'
+required_rubygems_version: !ruby/object:Gem::Requirement
+  none: false
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0'
+requirements: []
+rubyforge_project:
+rubygems_version: 1.8.10
+signing_key:
+specification_version: 3
+summary: Standardized markup parsers to a single format.  Sole use is for converting
+  markup text to Html.
+test_files: []

markup_parser 0.0.1