RubyGems - rbbcode - Versions diffs - 0.1.11 → 1.0.0 - Mend

rbbcode 0.1.11 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

data/lib/rbbcode/node_extensions.rb +126 -0
data/lib/rbbcode/rbbcode_grammar.treetop +113 -0
data/lib/rbbcode/sanitize.rb +13 -0
data/lib/rbbcode.rb +49 -5
metadata +34 -131
data/.document +0 -5
data/Gemfile +0 -13
data/LICENSE.txt +0 -21
data/README.markdown +0 -126
data/Rakefile +0 -35
data/VERSION +0 -1
data/lib/rbbcode/html_maker.rb +0 -90
data/lib/rbbcode/parser.rb +0 -32
data/lib/rbbcode/schema.rb +0 -309
data/lib/rbbcode/tree_maker.rb +0 -430
data/pkg/rbbcode-0.1.8.gem +0 -0
data/rbbcode.gemspec +0 -82
data/spec/html_maker_spec.rb +0 -92
data/spec/node_spec_helper.rb +0 -117
data/spec/parser_spec.rb +0 -163
data/spec/schema_spec.rb +0 -100
data/spec/spec_helper.rb +0 -17
data/spec/tree_maker_spec.rb +0 -123

data/lib/rbbcode/tree_maker.rb DELETED Viewed

@@ -1,430 +0,0 @@
-require 'pp'
-module RbbCode
-	module CharCodes
-		CR_CODE = 13
-		LF_CODE = 10
-		L_BRACK_CODE = 91
-		R_BRACK_CODE = 93
-		SLASH_CODE = 47
-		LOWER_A_CODE = 97
-		LOWER_Z_CODE = 122
-		UPPER_A_CODE = 65
-		UPPER_Z_CODE = 90
-	end
-	class Node
-		def << (child)
-			@children << child
-		end
-		attr_accessor :children
-		def initialize(parent)
-			@parent = parent
-			@children = []
-		end
-		attr_accessor :parent
-	end
-	class RootNode < Node
-		def initialize
-			@children = []
-		end
-	end
-	class TextNode < Node
-		undef_method '<<'.to_sym
-		undef_method :children
-		def initialize(parent, text)
-			@parent = parent
-			@text = text
-		end
-		attr_accessor :text
-		def to_bb_code
-			@text
-		end
-	end
-	class TagNode < Node
-		def self.from_opening_bb_code(parent, bb_code)
-		  # Strip the leading colon that marks a leaf tag (i.e. "[:name]" becomes "[name]")
-		  if bb_code[1,1] == ':'
-		    bb_code = "[#{bb_code[2..-1]}"
-		  end
-			if equal_index = bb_code.index('=')
-				tag_name = bb_code[1, equal_index - 1]
-				value = bb_code[(equal_index + 1)..-2]
-			else
-				tag_name = bb_code[1..-2]
-				value = nil
-			end
-			new(parent, tag_name, value)
-		end
-		def initialize(parent, tag_name, value = nil)
-			super(parent)
-			@tag_name = tag_name
-			@value = value
-			@preformatted = false
-		end
-		def inner_bb_code
-			@children.inject('') do |output, child|
-				output << child.to_bb_code
-			end
-		end
-		def preformat!
-			@preformatted = true
-		end
-		def preformatted?
-			@preformatted
-		end
-		def to_bb_code
-			if @value.nil?
-				output = "[#{@tag_name}]"
-			else
-				output = "[#{@tag_name}=#{@value}]"
-			end
-			output << inner_bb_code << "[/#{@tag_name}]"
-		end
-		attr_reader :tag_name
-		attr_reader :value
-	end
-	class TreeMaker
-		include CharCodes
-		def initialize(schema)
-			@schema = schema
-		end
-		def make_tree(str)
-			delete_junk_breaks!(
-				delete_invalid_empty_tags!(
-					parse_str(str)
-				)
-			)
-		end
-		protected
-		def ancestor_list(parent)
-			ancestors = []
-			while parent.is_a?(TagNode)
-				ancestors << parent.tag_name
-				parent = parent.parent
-			end
-			ancestors
-		end
-		def break_type(break_str)
-			if break_str.length > 2
-				:paragraph
-			elsif break_str.length == 1
-				:line_break
-			elsif break_str == "\r\n"
-				:line_break
-			else
-				:paragraph
-			end
-		end
-		# Delete empty paragraphs and line breaks at the end of block-level elements
-		def delete_junk_breaks!(node)
-			node.children.reject! do |child|
-				if child.is_a?(TagNode)
-					if !child.children.empty?
-						delete_junk_breaks!(child)
-						false
-					elsif child.tag_name == @schema.paragraph_tag_name
-						# It's an empty paragraph tag
-						true
-					#elsif not node.is_a?(RootNode) and @schema.block_level?(node.tag_name) and child.tag_name == @schema.line_break_tag_name and node.children.last == child
-					elsif @schema.block_level?(node.tag_name) and child.tag_name == @schema.line_break_tag_name and node.children.last == child
-						# It's a line break at the end of the block-level element
-						true
-					else
-						false
-					end
-				else
-					false
-				end
-			end
-			node
-		end
-		# The schema defines some tags that may not be empty. This method removes any such empty tags from the tree.
-		def delete_invalid_empty_tags!(node)
-			node.children.reject! do |child|
-				if child.is_a?(TagNode)
-					if child.children.empty? and !@schema.tag_may_be_empty?(child.tag_name)
-						true
-					else
-						delete_invalid_empty_tags!(child)
-						false
-					end
-				end
-			end
-			node
-		end
-		def parse_str(str)
-			tree = RootNode.new
-			# Initially, we open a paragraph tag. If it turns out that the first thing we encounter
-			# is a block-level element, no problem: the :opening_tag branch below promotes it out of
-			# the paragraph, and the paragraph left empty is removed afterwards by delete_junk_breaks!.
-			current_parent = TagNode.new(tree, @schema.paragraph_tag_name)
-			tree << current_parent
-			current_token = ''
-			current_token_type = :unknown
-			# It may seem naive to use each_byte. What about Unicode? So long as we're using UTF-8, none of the
-			# BB Code control characters will appear as part of multibyte characters, because UTF-8 doesn't allow
-			# the range 0x00-0x7F in multibyte chars. As for the multibyte characters themselves, yes, they will
-			# be temporarily split up as we append bytes onto the text nodes. But as of yet, I haven't found
-			# a way that this could cause a problem. The bytes always come back together again. (It would be a problem
-			# if we tried to count the characters for some reason, but we don't do that.)
-      # AQ: #each_byte doesn't work with ruby 1.9+, but luckily we have #each_char
-      split_method = :each_byte
-      split_method = :each_char if RUBY_VERSION.split('.')[1] > "8"
-			block = Proc.new do |char|
-			  if split_method == :each_char
-			    # ruby 1.9
-			    char_code = char.ord
-		    else
-		      # ruby 1.8
-		      char_code = char
-		      char = char_code.chr
-	      end
-				case current_token_type
-				when :unknown
-					case char
-					when '['
-						current_token_type = :possible_tag
-						current_token << char
-					when "\r", "\n"
-						current_token_type = :break
-						current_token << char
-					else
-						if current_parent.is_a?(RootNode)
-							new_paragraph_tag = TagNode.new(current_parent, @schema.paragraph_tag_name)
-							current_parent << new_paragraph_tag
-							current_parent = new_paragraph_tag
-						end
-						current_token_type = :text
-						current_token << char
-					end
-				when :text
-					case char
-					when "["
-						if @schema.text_valid_in_context?(*ancestor_list(current_parent))
-							current_parent << TextNode.new(current_parent, current_token)
-						end
-						current_token = '['
-						current_token_type = :possible_tag
-					when "\r", "\n"
-						if @schema.text_valid_in_context?(*ancestor_list(current_parent))
-							current_parent << TextNode.new(current_parent, current_token)
-						end
-						current_token = char
-						current_token_type = :break
-					else
-						current_token << char
-					end
-				when :break
-					if char_code == CR_CODE or char_code == LF_CODE
-						current_token << char
-					else
-						if break_type(current_token) == :paragraph
-							while current_parent.is_a?(TagNode) and !@schema.block_level?(current_parent.tag_name) and current_parent.tag_name != @schema.paragraph_tag_name
-								current_parent = current_parent.parent
-							end
-							# The current parent might be a paragraph tag, in which case we should move up one more level.
-							# Otherwise, it might be a block-level element or a root node, in which case we should not move up.
-							if current_parent.is_a?(TagNode) and current_parent.tag_name == @schema.paragraph_tag_name
-								current_parent = current_parent.parent
-							end
-							# Regardless of whether the current parent is a block-level element, we need to open a new paragraph.
-							new_paragraph_node = TagNode.new(current_parent, @schema.paragraph_tag_name)
-							current_parent << new_paragraph_node
-							current_parent = new_paragraph_node
-						else # line break
-							prev_sibling = current_parent.children.last
-							if prev_sibling.is_a?(TagNode) and @schema.block_level?(prev_sibling.tag_name)
-								# Although the input only contains a single newline, we should
-								# interpret it as the start of a new paragraph, because the last
-								# thing we encountered was a block-level element.
-								new_paragraph_node = TagNode.new(current_parent, @schema.paragraph_tag_name)
-								current_parent << new_paragraph_node
-								current_parent = new_paragraph_node
-							elsif @schema.tag(@schema.line_break_tag_name).valid_in_context?(*ancestor_list(current_parent))
-								current_parent << TagNode.new(current_parent, @schema.line_break_tag_name)
-							end
-						end
-						if char == '['
-							current_token = '['
-							current_token_type = :possible_tag
-						else
-							current_token = char
-							current_token_type = :text
-						end
-					end
-				when :possible_tag
-					case char
-					when '['
-						current_parent << TextNode.new(current_parent, '[')
-						# No need to reset current_token or current_token_type, because now we're in a new possible tag
-					when '/'
-						current_token_type = :closing_tag
-						current_token << '/'
-				  when ':'
-				    current_token_type = :leaf_tag
-				    current_token << ':'
-					else
-						if tag_name_char?(char_code)
-							current_token_type = :opening_tag
-							current_token << char
-						else
-							current_token_type = :text
-							current_token << char
-						end
-					end
-				when :opening_tag
-					if tag_name_char?(char_code) or char == '='
-						current_token << char
-					elsif char == ']'
-						current_token << ']'
-						tag_node = TagNode.from_opening_bb_code(current_parent, current_token)
-						if @schema.block_level?(tag_node.tag_name) and current_parent.tag_name == @schema.paragraph_tag_name
-							# If there is a line break before this, it's superfluous and should be deleted
-							prev_sibling = current_parent.children.last
-							if prev_sibling.is_a?(TagNode) and prev_sibling.tag_name == @schema.line_break_tag_name
-								current_parent.children.pop
-							end
-							# Promote a block-level element
-							current_parent = current_parent.parent
-							tag_node.parent = current_parent
-							current_parent << tag_node
-							current_parent = tag_node
-							# If all of this results in empty paragraph tags, no worries: they will be deleted later.
-						elsif tag_node.tag_name == current_parent.tag_name and @schema.close_twins?(tag_node.tag_name)
-							# The current tag and the tag we're now opening are of the same type, and this kind of tag auto-closes its twins
-							# (E.g. * tags in the default config.)
-							current_parent.parent << tag_node
-							current_parent = tag_node
-						elsif @schema.tag(tag_node.tag_name).valid_in_context?(*ancestor_list(current_parent))
-							current_parent << tag_node
-							current_parent = tag_node
-						end # else, don't do anything--the tag is invalid and will be ignored
-						if @schema.preformatted?(current_parent.tag_name)
-							current_token_type = :preformatted
-							current_parent.preformat!
-						else
-							current_token_type = :unknown
-						end
-						current_token = ''
-					elsif char == "\r" or char == "\n"
-						current_parent << TextNode.new(current_parent, current_token)
-						current_token = char
-						current_token_type = :break
-					elsif current_token.include?('=')
-						current_token << char
-					else
-						current_token_type = :text
-						current_token << char
-					end
-				when :leaf_tag
-				  if tag_name_char?(char_code) or char == '='
-						current_token << char
-					elsif char == ']'
-					  current_token << ']'
-					  tag_node = TagNode.from_opening_bb_code(current_parent, current_token)
-					  if @schema.tag(tag_node.tag_name).valid_in_context?(*ancestor_list(current_parent))
-					    current_parent.children << tag_node
-					    current_token_type = :unknown
-					    current_token = ''
-					  else
-					    current_token_type = :text
-					  end
-					end
-				when :closing_tag
-					if tag_name_char?(char_code)
-						current_token << char
-					elsif char == ']'
-						original_parent = current_parent
-						while current_parent.is_a?(TagNode) and current_parent.tag_name != current_token[2..-1]
-							current_parent = current_parent.parent
-						end
-						if current_parent.is_a?(TagNode)
-							current_parent = current_parent.parent
-						else # current_parent is a RootNode
-							# we made it to the top of the tree, and never found the tag to close
-							# so we'll just ignore the closing tag altogether
-							current_parent = original_parent
-						end
-						current_token_type = :unknown
-						current_token = ''
-					elsif char == "\r" or char == "\n"
-						current_parent << TextNode.new(current_parent, current_token)
-						current_token = char
-						current_token_type = :break
-					else
-						current_token_type = :text
-						current_token << char
-					end
-				when :preformatted
-					if char == '['
-						current_parent << TextNode.new(current_parent, current_token)
-						current_token_type = :possible_preformatted_end
-						current_token = '['
-					else
-						current_token << char
-					end
-				when :possible_preformatted_end
-					current_token << char
-					if current_token == "[/#{current_parent.tag_name}]" # Did we just see the closing tag for this preformatted element?
-						current_parent = current_parent.parent
-						current_token_type = :unknown
-						current_token = ''
-					elsif char == ']' # We're at the end of this opening/closing tag, and it's not the closing tag for the preformatted element
-						current_parent << TextNode.new(current_parent, current_token)
-						current_token_type = :preformatted
-						current_token = ''
-					end
-				else
-					raise "Unknown token type in state machine: #{current_token_type}"
-				end
-			end
-      str.send(split_method, &block)
-			# Handle whatever's left in the current token
-			if current_token_type != :break and !current_token.empty?
-				current_parent << TextNode.new(current_parent, current_token)
-			end
-			tree
-		end
-		def tag_name_char?(char_code)
-			(char_code >= LOWER_A_CODE and char_code <= LOWER_Z_CODE) or (char_code >= UPPER_A_CODE and char_code <= UPPER_Z_CODE) or char_code.chr == '*'
-		end
-	end
-end

data/pkg/rbbcode-0.1.8.gem DELETED Viewed

Binary file

data/rbbcode.gemspec DELETED Viewed

@@ -1,82 +0,0 @@
-# Generated by jeweler
-# DO NOT EDIT THIS FILE DIRECTLY
-# Instead, edit Jeweler::Tasks in Rakefile, and run 'rake gemspec'
-# -*- encoding: utf-8 -*-
-Gem::Specification.new do |s|
-  s.name = %q{rbbcode}
-  s.version = "0.1.11"
-  s.required_rubygems_version = Gem::Requirement.new(">= 0") if s.respond_to? :required_rubygems_version=
-  s.authors = ["Jarrett Colby", "aq1018@gmail.com"]
-  s.date = %q{2011-02-19}
-  s.description = %q{RbbCode is a customizable Ruby library for parsing BB Code. RbbCode validates and cleans input. It supports customizable schemas so you can set rules about what tags are allowed where. The default rules are designed to ensure valid HTML output.}
-  s.email = %q{jarrett@jarrettcolby.com, aq1018@gmail.com}
-  s.extra_rdoc_files = [
-    "LICENSE.txt",
-    "README.markdown"
-  ]
-  s.files = [
-    ".document",
-    "Gemfile",
-    "LICENSE.txt",
-    "README.markdown",
-    "Rakefile",
-    "VERSION",
-    "lib/rbbcode.rb",
-    "lib/rbbcode/html_maker.rb",
-    "lib/rbbcode/parser.rb",
-    "lib/rbbcode/schema.rb",
-    "lib/rbbcode/tree_maker.rb",
-    "pkg/rbbcode-0.1.8.gem",
-    "rbbcode.gemspec",
-    "spec/html_maker_spec.rb",
-    "spec/node_spec_helper.rb",
-    "spec/parser_spec.rb",
-    "spec/schema_spec.rb",
-    "spec/spec_helper.rb",
-    "spec/tree_maker_spec.rb"
-  ]
-  s.homepage = %q{http://github.com/jarrett/rbbcode}
-  s.licenses = ["MIT"]
-  s.require_paths = ["lib"]
-  s.rubygems_version = %q{1.3.7}
-  s.summary = %q{Ruby BB Code parser}
-  s.test_files = [
-    "spec/html_maker_spec.rb",
-    "spec/node_spec_helper.rb",
-    "spec/parser_spec.rb",
-    "spec/schema_spec.rb",
-    "spec/spec_helper.rb",
-    "spec/tree_maker_spec.rb"
-  ]
-  if s.respond_to? :specification_version then
-    current_version = Gem::Specification::CURRENT_SPECIFICATION_VERSION
-    s.specification_version = 3
-    if Gem::Version.new(Gem::VERSION) >= Gem::Version.new('1.2.0') then
-      s.add_runtime_dependency(%q<sanitize-url>, [">= 0.1.3"])
-      s.add_development_dependency(%q<rspec>, ["~> 2.3.0"])
-      s.add_development_dependency(%q<bluecloth>, [">= 0"])
-      s.add_development_dependency(%q<yard>, ["~> 0.6.0"])
-      s.add_development_dependency(%q<bundler>, ["~> 1.0.0"])
-      s.add_development_dependency(%q<jeweler>, ["~> 1.5.2"])
-    else
-      s.add_dependency(%q<sanitize-url>, [">= 0.1.3"])
-      s.add_dependency(%q<rspec>, ["~> 2.3.0"])
-      s.add_dependency(%q<bluecloth>, [">= 0"])
-      s.add_dependency(%q<yard>, ["~> 0.6.0"])
-      s.add_dependency(%q<bundler>, ["~> 1.0.0"])
-      s.add_dependency(%q<jeweler>, ["~> 1.5.2"])
-    end
-  else
-    s.add_dependency(%q<sanitize-url>, [">= 0.1.3"])
-    s.add_dependency(%q<rspec>, ["~> 2.3.0"])
-    s.add_dependency(%q<bluecloth>, [">= 0"])
-    s.add_dependency(%q<yard>, ["~> 0.6.0"])
-    s.add_dependency(%q<bundler>, ["~> 1.0.0"])
-    s.add_dependency(%q<jeweler>, ["~> 1.5.2"])
-  end
-end

data/spec/html_maker_spec.rb DELETED Viewed

@@ -1,92 +0,0 @@
-# encoding: UTF-8
-require File.expand_path(File.dirname(__FILE__) + '/spec_helper')
-require File.expand_path(File.dirname(__FILE__) + '/node_spec_helper')
-describe RbbCode::HtmlMaker do
-	context '#make_html' do
-		def expect_html(expected_html, &block)
-			@html_maker.make_html(NodeBuilder.build(&block)).should == expected_html
-		end
-		before :each do
-			@html_maker = RbbCode::HtmlMaker.new
-		end
-		it 'should replace simple BB code tags with HTML tags' do
-			expect_html('<p>This is <strong>bold</strong> text</p>') do
-				tag('p') do
-					text 'This is '
-					tag('b') { text 'bold' }
-					text ' text'
-				end
-			end
-		end
-		it 'should work for nested tags' do
-			expect_html('<p>This is <strong>bold and <u>underlined</u></strong> text</p>') do
-				tag('p') do
-					text 'This is '
-					tag('b') do
-						text 'bold and '
-						tag('u') { text 'underlined' }
-					end
-					text ' text'
-				end
-			end
-		end
-		it 'should not allow JavaScript in URLs' do
-			urls = [
-				'javascript:alert("1");',
-				'j a v a script:alert("2");',
-				' javascript:alert("3");',
-				'JavaScript:alert("4");',
-				"java\nscript:alert(\"5\");",
-				"java\rscript:alert(\"6\");"
-			]
-			# url tag
-			urls.each do |evil_url|
-				expect_html('<p><a href="">foo</a></p>') do
-					tag('p') do
-						tag('url', evil_url) do
-							text 'foo'
-						end
-					end
-				end
-			end
-			# img tag
-			urls.each do |evil_url, clean_url|
-				expect_html("<p><img src=\"#{clean_url}\" alt=\"\"/></p>") do
-					tag('p') do
-						tag('img') do
-							text evil_url
-						end
-					end
-				end
-			end
-		end
-		it 'should hex-encode double-quotes in the URL' do
-			expect_html('<p><a href="http://example.com/foo%22bar">Foo</a></p>') do
-				tag('p') do
-					tag('url', 'http://example.com/foo"bar') do
-						text 'Foo'
-					end
-				end
-			end
-		end
-		it 'wraps preformatted tags in <pre>' do
-			expect_html('<p><pre><code>Some code</code></pre></p>') do
-				tag('p') do
-					tag('code', nil, true) do
-						text 'Some code'
-					end
-				end
-			end
-		end
-	end
-end