RubyGems - coderay - Versions diffs - 1.0.0 → 1.0.0.598.pre - Mend

coderay 1.0.0 → 1.0.0.598.pre

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (79) hide show

data/FOLDERS +49 -0
data/Rakefile +6 -5
data/bin/coderay +74 -190
data/bin/coderay_stylesheet +4 -0
data/{README_INDEX.rdoc → lib/README} +20 -10
data/lib/coderay.rb +60 -62
data/lib/coderay/duo.rb +55 -2
data/lib/coderay/encoder.rb +39 -52
data/lib/coderay/encoders/_map.rb +7 -11
data/lib/coderay/encoders/comment_filter.rb +61 -0
data/lib/coderay/encoders/count.rb +26 -11
data/lib/coderay/encoders/debug.rb +60 -11
data/lib/coderay/encoders/div.rb +8 -9
data/lib/coderay/encoders/filter.rb +52 -12
data/lib/coderay/encoders/html.rb +113 -106
data/lib/coderay/encoders/html/css.rb +7 -2
data/lib/coderay/encoders/html/numbering.rb +27 -24
data/lib/coderay/encoders/html/output.rb +58 -15
data/lib/coderay/encoders/json.rb +44 -37
data/lib/coderay/encoders/lines_of_code.rb +56 -9
data/lib/coderay/encoders/null.rb +13 -6
data/lib/coderay/encoders/page.rb +8 -8
data/lib/coderay/encoders/span.rb +9 -10
data/lib/coderay/encoders/statistic.rb +114 -51
data/lib/coderay/encoders/terminal.rb +10 -7
data/lib/coderay/encoders/text.rb +36 -17
data/lib/coderay/encoders/token_kind_filter.rb +58 -1
data/lib/coderay/encoders/xml.rb +11 -13
data/lib/coderay/encoders/yaml.rb +14 -16
data/lib/coderay/for_redcloth.rb +1 -1
data/lib/coderay/helpers/file_type.rb +240 -125
data/lib/coderay/helpers/gzip_simple.rb +123 -0
data/lib/coderay/helpers/plugin.rb +307 -241
data/lib/coderay/helpers/word_list.rb +126 -65
data/lib/coderay/scanner.rb +103 -153
data/lib/coderay/scanners/_map.rb +16 -18
data/lib/coderay/scanners/c.rb +13 -13
data/lib/coderay/scanners/cpp.rb +6 -6
data/lib/coderay/scanners/css.rb +48 -47
data/lib/coderay/scanners/debug.rb +55 -9
data/lib/coderay/scanners/delphi.rb +4 -4
data/lib/coderay/scanners/diff.rb +25 -43
data/lib/coderay/scanners/groovy.rb +2 -2
data/lib/coderay/scanners/html.rb +30 -107
data/lib/coderay/scanners/java.rb +5 -6
data/lib/coderay/scanners/java/builtin_types.rb +0 -2
data/lib/coderay/scanners/java_script.rb +6 -6
data/lib/coderay/scanners/json.rb +6 -7
data/lib/coderay/scanners/nitro_xhtml.rb +136 -0
data/lib/coderay/scanners/php.rb +12 -13
data/lib/coderay/scanners/plaintext.rb +26 -0
data/lib/coderay/scanners/python.rb +4 -4
data/lib/coderay/scanners/{erb.rb → rhtml.rb} +11 -19
data/lib/coderay/scanners/ruby.rb +208 -219
data/lib/coderay/scanners/ruby/patterns.rb +85 -18
data/lib/coderay/scanners/scheme.rb +136 -0
data/lib/coderay/scanners/sql.rb +22 -29
data/lib/coderay/scanners/yaml.rb +10 -11
data/lib/coderay/styles/_map.rb +2 -2
data/lib/coderay/styles/alpha.rb +104 -102
data/lib/coderay/styles/cycnus.rb +143 -0
data/lib/coderay/styles/murphy.rb +123 -0
data/lib/coderay/token_kinds.rb +86 -87
data/lib/coderay/tokens.rb +169 -26
data/test/functional/basic.rb +14 -200
data/test/functional/examples.rb +14 -20
data/test/functional/for_redcloth.rb +8 -15
data/test/functional/load_plugin_scanner.rb +11 -0
data/test/functional/suite.rb +6 -9
data/test/functional/vhdl.rb +126 -0
data/test/functional/word_list.rb +79 -0
metadata +129 -107
data/lib/coderay/helpers/gzip.rb +0 -41
data/lib/coderay/scanners/clojure.rb +0 -217
data/lib/coderay/scanners/haml.rb +0 -168
data/lib/coderay/scanners/ruby/string_state.rb +0 -71
data/lib/coderay/scanners/text.rb +0 -26
data/lib/coderay/tokens_proxy.rb +0 -55
data/lib/coderay/version.rb +0 -3

data/lib/coderay/token_kinds.rb CHANGED Viewed

@@ -1,90 +1,89 @@
 module CodeRay
-  # A Hash of all known token kinds and their associated CSS classes.
-  TokenKinds = Hash.new do |h, k|
-    warn 'Undefined Token kind: %p' % [k] if $CODERAY_DEBUG
-    false
+  class Tokens
+    AbbreviationForKind = Hash.new do |h, k|  # :nodoc:
+      if $CODERAY_DEBUG
+        raise 'Undefined Token kind: %p' % [k]  # :nodoc:
+      else
+        :NO_HIGHLIGHT
+      end
+    end
+    AbbreviationForKind.update with = {  # :nodoc:
+      :annotation => 'at',
+      :attribute_name => 'an',
+      :attribute_value => 'av',
+      :bin => 'bi',
+      :char => 'ch',
+      :class => 'cl',
+      :class_variable => 'cv',
+      :color => 'cr',
+      :comment => 'c',
+      :complex => 'cm',
+      :constant => 'co',
+      :content => 'k',
+      :decorator => 'de',
+      :definition => 'df',
+      :delimiter => 'dl',
+      :directive => 'di',
+      :doc => 'do',
+      :doctype => 'dt',
+      :doc_string => 'ds',
+      :entity => 'en',
+      :error => 'er',
+      :escape => 'e',
+      :exception => 'ex',
+      :filename => 'filename',
+      :float => 'fl',
+      :function => 'fu',
+      :global_variable => 'gv',
+      :hex => 'hx',
+      :imaginary => 'cm',
+      :important => 'im',
+      :include => 'ic',
+      :inline => 'il',
+      :inline_delimiter => 'idl',
+      :instance_variable => 'iv',
+      :integer => 'i',
+      :interpreted => 'in',
+      :key => 'ke',
+      :keyword => 'kw',
+      :label => 'la',
+      :local_variable => 'lv',
+      :modifier => 'mod',
+      :namespace => 'ns',
+      :oct => 'oc',
+      :predefined => 'pd',
+      :preprocessor => 'pp',
+      :pre_constant => 'pc',
+      :pre_type => 'pt',
+      :pseudo_class => 'ps',
+      :regexp => 'rx',
+      :reserved => 'r',
+      :shell => 'sh',
+      :string => 's',
+      :symbol => 'sy',
+      :tag => 'ta',
+      :tag_special => 'ts',
+      :type => 'ty',
+      :value => 'vl',
+      :variable => 'v',
+      :insert => 'ins',
+      :delete => 'del',
+      :change => 'chg',
+      :head => 'head',
+      :eyecatcher => 'eye',
+      :ident => :NO_HIGHLIGHT, # 'id'
+      #:operator => 'op',
+      :operator => :NO_HIGHLIGHT,  # 'op'
+      :space => :NO_HIGHLIGHT,  # 'sp'
+      :plain => :NO_HIGHLIGHT,
+    }
+    AbbreviationForKind[:method] = AbbreviationForKind[:function]
+    AbbreviationForKind[:nesting_delimiter] = AbbreviationForKind[:delimiter]
+    AbbreviationForKind[:escape] = AbbreviationForKind[:delimiter]
+    AbbreviationForKind[:docstring] = AbbreviationForKind[:comment]
+    #AbbreviationForKind.default = AbbreviationForKind[:error] or raise 'no class found for :error!'
   end
-  # speedup
-  TokenKinds.compare_by_identity if TokenKinds.respond_to? :compare_by_identity
-  TokenKinds.update(  # :nodoc:
-    :annotation          => 'annotation',
-    :attribute_name      => 'attribute-name',
-    :attribute_value     => 'attribute-value',
-    :binary              => 'bin',
-    :char                => 'char',
-    :class               => 'class',
-    :class_variable      => 'class-variable',
-    :color               => 'color',
-    :comment             => 'comment',
-    :complex             => 'complex',
-    :constant            => 'constant',
-    :content             => 'content',
-    :debug               => 'debug',
-    :decorator           => 'decorator',
-    :definition          => 'definition',
-    :delimiter           => 'delimiter',
-    :directive           => 'directive',
-    :doc                 => 'doc',
-    :doctype             => 'doctype',
-    :doc_string          => 'doc-string',
-    :entity              => 'entity',
-    :error               => 'error',
-    :escape              => 'escape',
-    :exception           => 'exception',
-    :filename            => 'filename',
-    :float               => 'float',
-    :function            => 'function',
-    :global_variable     => 'global-variable',
-    :hex                 => 'hex',
-    :imaginary           => 'imaginary',
-    :important           => 'important',
-    :include             => 'include',
-    :inline              => 'inline',
-    :inline_delimiter    => 'inline-delimiter',
-    :instance_variable   => 'instance-variable',
-    :integer             => 'integer',
-    :key                 => 'key',
-    :keyword             => 'keyword',
-    :label               => 'label',
-    :local_variable      => 'local-variable',
-    :modifier            => 'modifier',
-    :namespace           => 'namespace',
-    :octal               => 'octal',
-    :predefined          => 'predefined',
-    :predefined_constant => 'predefined-constant',
-    :predefined_type     => 'predefined-type',
-    :preprocessor        => 'preprocessor',
-    :pseudo_class        => 'pseudo-class',
-    :regexp              => 'regexp',
-    :reserved            => 'reserved',
-    :shell               => 'shell',
-    :string              => 'string',
-    :symbol              => 'symbol',
-    :tag                 => 'tag',
-    :type                => 'type',
-    :value               => 'value',
-    :variable            => 'variable',
-    :change              => 'change',
-    :delete              => 'delete',
-    :head                => 'head',
-    :insert              => 'insert',
-    :eyecatcher          => 'eyecatcher',
-    :ident               => false,
-    :operator            => false,
-    :space               => false,
-    :plain               => false
-  )
-  TokenKinds[:method]    = TokenKinds[:function]
-  TokenKinds[:escape]    = TokenKinds[:delimiter]
-  TokenKinds[:docstring] = TokenKinds[:comment]
-  TokenKinds.freeze
 end

data/lib/coderay/tokens.rb CHANGED Viewed

@@ -1,8 +1,5 @@
 module CodeRay
-  # GZip library for writing and reading token dumps.
-  autoload :GZip, 'coderay/helpers/gzip'
   # = Tokens  TODO: Rewrite!
   #
   # The Tokens class represents a list of tokens returned from
@@ -64,25 +61,127 @@ module CodeRay
     #
     # options are passed to the encoder.
     def encode encoder, options = {}
-      encoder = Encoders[encoder].new options if encoder.respond_to? :to_sym
+      unless encoder.is_a? Encoders::Encoder
+        unless encoder.is_a? Class
+          encoder_class = Encoders[encoder]
+        end
+        encoder = encoder_class.new options
+      end
       encoder.encode_tokens self, options
     end
-    # Turn tokens into a string by concatenating them.
-    def to_s
-      encode CodeRay::Encoders::Encoder.new
+    # Turn into a string using Encoders::Text.
+    #
+    # +options+ are passed to the encoder if given.
+    def to_s options = {}
+      encode :text, options
     end
     # Redirects unknown methods to encoder calls.
     #
     # For example, if you call +tokens.html+, the HTML encoder
     # is used to highlight the tokens.
     def method_missing meth, options = {}
-      encode meth, options
+      encode_with meth, options
     rescue PluginHost::PluginNotFound
       super
     end
+    def encode_with encoder, options = {}
+      Encoders[encoder].new(options).encode_tokens self
+    end
+    # Returns the tokens compressed by joining consecutive
+    # tokens of the same kind.
+    #
+    # This can not be undone, but should yield the same output
+    # in most Encoders.  It basically makes the output smaller.
+    #
+    # Combined with dump, it saves space at the cost of time.
+    #
+    # If the scanner is written carefully, this is not required -
+    # for example, consecutive //-comment lines could already be
+    # joined in one comment token by the Scanner.
+    def optimize
+      raise NotImplementedError, 'Tokens#optimize needs to be rewritten.'
+      last_kind = last_text = nil
+      new = self.class.new
+      for text, kind in self
+        if text.is_a? String
+          if kind == last_kind
+            last_text << text
+          else
+            new << [last_text, last_kind] if last_kind
+            last_text = text
+            last_kind = kind
+          end
+        else
+          new << [last_text, last_kind] if last_kind
+          last_kind = last_text = nil
+          new << [text, kind]
+        end
+      end
+      new << [last_text, last_kind] if last_kind
+      new
+    end
+    # Compact the object itself; see optimize.
+    def optimize!
+      replace optimize
+    end
+    # Ensure that all begin_group tokens have a corresponding end_group.
+    #
+    # TODO: Test this!
+    def fix
+      raise NotImplementedError, 'Tokens#fix needs to be rewritten.'
+      tokens = self.class.new
+      # Check token nesting using a stack of kinds.
+      opened = []
+      for type, kind in self
+        case type
+        when :begin_group
+          opened.push [:begin_group, kind]
+        when :begin_line
+          opened.push [:end_line, kind]
+        when :end_group, :end_line
+          expected = opened.pop
+          if [type, kind] != expected
+            # Unexpected end; decide what to do based on the kind:
+            # - token was never opened: delete the end (just skip it)
+            next unless opened.rindex expected
+            # - token was opened earlier: also close tokens in between
+            tokens << token until (token = opened.pop) == expected
+          end
+        end
+        tokens << [type, kind]
+      end
+      # Close remaining opened tokens
+      tokens << token while token = opened.pop
+      tokens
+    end
+    def fix!
+      replace fix
+    end
+    # TODO: Scanner#split_into_lines
+    #
+    # Makes sure that:
+    # - newlines are single tokens
+    #   (which means all other tokens are single-line)
+    # - there are no open tokens at the end of the line
+    #
+    # This makes it simple for encoders that work line-oriented,
+    # like HTML with list-style numeration.
+    def split_into_lines
+      raise NotImplementedError
+    end
+    def split_into_lines!
+      replace split_into_lines
+    end
     # Split the tokens into parts of the given +sizes+.
     #
     # The result will be an Array of Tokens objects. The parts have
@@ -121,15 +220,12 @@ module CodeRay
                 content_or_kind
               end
             end
-            part.concat closing
-            begin
-              parts << part
-              part = Tokens.new
-              size = sizes[i += 1]
-            end until size.nil? || size > 0
+            parts << part.concat(closing)
+            part = Tokens.new
             # ...and open them again.
             part.concat opened.flatten
             part_size = 0
+            size = sizes[i += 1]
             redo unless content.empty?
           else
             part << content << item
@@ -143,19 +239,19 @@ module CodeRay
           when :end_group, :end_line
             opened.pop
           else
-            raise ArgumentError, 'Unknown token action: %p, kind = %p' % [content, item]
+            raise 'Unknown token action: %p, kind = %p' % [content, item]
           end
           part << content << item
           content = nil
         else
-          raise ArgumentError, 'Token input junk: %p, kind = %p' % [content, item]
+          raise 'else case reached'
         end
       end
       parts << part
       parts << Tokens.new while parts.size < sizes.size
       parts
     end
     # Dumps the object into a String that can be saved
     # in files or databases.
     #
@@ -172,8 +268,9 @@ module CodeRay
     #
     # See GZip module.
     def dump gzip_level = 7
+      require 'coderay/helpers/gzip_simple'
       dump = Marshal.dump self
-      dump = GZip.gzip dump, gzip_level
+      dump = dump.gzip gzip_level
       dump.extend Undumping
     end
@@ -181,7 +278,7 @@ module CodeRay
     def count
       size / 2
     end
     # Include this module to give an object an #undump
     # method.
     #
@@ -192,17 +289,18 @@ module CodeRay
         Tokens.load self
       end
     end
     # Undump the object: unzip it using gunzip, then
     # restore it using Marshal.load.
     #
     # The result is commonly a Tokens object, but
     # this is not guaranteed.
     def Tokens.load dump
-      dump = GZip.gunzip dump
+      require 'coderay/helpers/gzip_simple'
+      dump = dump.gunzip
       @dump = Marshal.load dump
     end
     alias text_token push
     def begin_group kind; push :begin_group, kind end
     def end_group kind; push :end_group, kind end
@@ -211,5 +309,50 @@ module CodeRay
     alias tokens concat
   end
 end
+if $0 == __FILE__
+  $VERBOSE = true
+  $: << File.join(File.dirname(__FILE__), '..')
+  eval DATA.read, nil, $0, __LINE__ + 4
+end
+__END__
+require 'test/unit'
+class TokensTest < Test::Unit::TestCase
+  def test_creation
+    assert CodeRay::Tokens < Array
+    tokens = nil
+    assert_nothing_raised do
+      tokens = CodeRay::Tokens.new
+    end
+    assert_kind_of Array, tokens
+  end
+  def test_adding_tokens
+    tokens = CodeRay::Tokens.new
+    assert_nothing_raised do
+      tokens.text_token 'string', :type
+      tokens.text_token '()', :operator
+    end
+    assert_equal tokens.size, 4
+    assert_equal tokens.count, 2
+  end
+  def test_dump_undump
+    tokens = CodeRay::Tokens.new
+    assert_nothing_raised do
+      tokens.text_token 'string', :type
+      tokens.text_token '()', :operator
+    end
+    tokens2 = nil
+    assert_nothing_raised do
+      tokens2 = tokens.dump.undump
+    end
+    assert_equal tokens, tokens2
+  end
+end