RubyGems - gammo - Versions diffs - 0.2.0 → 0.3.0 - Mend

gammo 0.2.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (52) hide show

checksums.yaml +4 -4
data/.github/workflows/test.yml +32 -0
data/Gemfile.lock +6 -6
data/README.md +334 -10
data/Rakefile +5 -1
data/lib/gammo/attributes.rb +5 -0
data/lib/gammo/css_selector/ast/combinator.rb +92 -0
data/lib/gammo/css_selector/ast/selector/attrib_selector.rb +86 -0
data/lib/gammo/css_selector/ast/selector/class_selector.rb +19 -0
data/lib/gammo/css_selector/ast/selector/id_selector.rb +18 -0
data/lib/gammo/css_selector/ast/selector/negation.rb +21 -0
data/lib/gammo/css_selector/ast/selector/pseudo_class.rb +92 -0
data/lib/gammo/css_selector/ast/selector.rb +100 -0
data/lib/gammo/css_selector/context.rb +17 -0
data/lib/gammo/css_selector/errors.rb +6 -0
data/lib/gammo/css_selector/node_set.rb +44 -0
data/lib/gammo/css_selector/parser.rb +790 -0
data/lib/gammo/css_selector/parser.y +321 -0
data/lib/gammo/css_selector.rb +33 -0
data/lib/gammo/modules/subclassify.rb +31 -0
data/lib/gammo/node.rb +2 -0
data/lib/gammo/parser/foreign.rb +3 -3
data/lib/gammo/parser/insertion_mode/after_after_body.rb +1 -1
data/lib/gammo/parser/insertion_mode/after_after_frameset.rb +1 -1
data/lib/gammo/parser/insertion_mode/after_body.rb +1 -1
data/lib/gammo/parser/insertion_mode/after_frameset.rb +1 -1
data/lib/gammo/parser/insertion_mode/after_head.rb +1 -1
data/lib/gammo/parser/insertion_mode/before_head.rb +1 -1
data/lib/gammo/parser/insertion_mode/before_html.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_body.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_column_group.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_frameset.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_head.rb +3 -2
data/lib/gammo/parser/insertion_mode/in_head_noscript.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_select.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_table.rb +1 -1
data/lib/gammo/parser/insertion_mode/in_template.rb +1 -1
data/lib/gammo/parser/insertion_mode/initial.rb +1 -1
data/lib/gammo/parser/insertion_mode/text.rb +1 -1
data/lib/gammo/parser/insertion_mode.rb +1 -1
data/lib/gammo/tokenizer/tokens.rb +10 -1
data/lib/gammo/tokenizer.rb +10 -10
data/lib/gammo/version.rb +1 -1
data/lib/gammo/xpath/ast/axis.rb +1 -1
data/lib/gammo/xpath/ast/expression.rb +2 -0
data/lib/gammo/xpath/ast/function.rb +1 -1
data/lib/gammo/xpath/ast/node_test.rb +1 -1
data/lib/gammo/xpath/ast/path.rb +1 -0
data/lib/gammo/xpath.rb +4 -5
metadata +17 -4
data/.travis.yml +0 -6
data/lib/gammo/xpath/ast/subclassify.rb +0 -35

data/lib/gammo/css_selector/parser.y ADDED Viewed

@@ -0,0 +1,321 @@
+class Gammo::CSSSelector::Parser
+# Terminal symbols accepted by the grammar; each one is declared exactly once.
+token T_COMMA
+      T_PLUS
+      T_MINUS
+      T_HYPHEN
+      T_DIMENSION
+      T_NUMBER
+      T_STRING
+      T_IDENT
+      T_NOT
+      T_RBRACK
+      T_HASH
+      T_S
+      T_GREATER
+      T_TILDE
+      T_DOT
+      T_PIPE
+      T_ASTERISK
+      T_LBRACK
+      T_PREFIXMATCH
+      T_SUFFIXMATCH
+      T_SUBSTRINGMATCH
+      T_EQUAL
+      T_INCLUDES
+      T_DASHMATCH
+      T_COLON
+      T_FUNCTION
+      T_RPAREN
+start selectors_group
+rule
+  optional_whitespaces:
+    | repeatable_whitespaces
+  repeatable_whitespaces:
+    T_S
+    | repeatable_whitespaces T_S
+  # selectors_group: selector [ COMMA S* selector ]*
+  selectors_group:
+    repeatable_selectors { result = val[0] }
+  repeatable_selectors:
+    selector {
+      result = AST::SelectorsGroup.new
+      result << val[0]
+    }
+    | repeatable_selectors optional_whitespaces T_COMMA optional_whitespaces selector {
+      result = val[0]
+      result << val[4]
+    }
+  # selector: simple_selector_sequence [ combinator simple_selector_sequence ]*
+  selector:
+    repeatable_simple_selector_sequence
+  # combinators can be surrounded by whitespace
+  # combinator: PLUS S* | GREATER S* | TILDE S* | S+
+  combinator:
+    optional_whitespaces T_PLUS optional_whitespaces { result = :next_sibling }
+    | optional_whitespaces T_GREATER optional_whitespaces { result = :child }
+    | optional_whitespaces T_TILDE optional_whitespaces { result = :subsequent_sibling }
+    | repeatable_whitespaces { result = :descendant }
+  repeatable_simple_selector_sequence:
+    simple_selector_sequence {
+      result = val[0]
+    }
+    | repeatable_simple_selector_sequence combinator simple_selector_sequence {
+      result = val[0]
+      result.combine(AST::Combinator.fetch(val[1]).new(val[2]))
+    }
+  # simple_selector_sequence:
+  # [ type_selector | universal ]
+  #   [ HASH | class | attrib | pseudo | negation ]*
+  # | [ HASH | class | attrib | pseudo | negation ]+
+  simple_selector_sequence:
+    type_selector
+    | universal
+    | type_selector repeatable_selector_operators {
+      val[0].selectors.concat(val[1])
+      result = val[0]
+    }
+    | universal repeatable_selector_operators {
+      val[0].selectors.concat(val[1])
+      result = val[0]
+    }
+    | repeatable_selector_operators {
+      any = AST::Selector::Universal.new
+      any.selectors.concat(val[0])
+      result = any
+    }
+  repeatable_selector_operators:
+    selector_operators { result = [val[0]] }
+    | repeatable_selector_operators selector_operators { result = val[0] << val[1] }
+  selector_operators:
+    hash
+    | class
+    | attrib
+    | pseudo
+    | negation
+  # type_selector: [ namespace_prefix ]? element_name
+  type_selector:
+    element_name { result = AST::Selector::Type.new(element_name: val[0]) }
+    | namespace_prefix element_name  { result = AST::Selector::Type.new(element_name: val[1], namespace_prefix: val[0]) }
+  # namespace_prefix: [ IDENT | '*' ]? '|'
+  namespace_prefix:
+    T_PIPE { result = val[0] }
+    | T_IDENT T_PIPE { result = val[0] }
+    | T_ASTERISK T_PIPE { result = val[1] }
+  # element_name: IDENT
+  element_name: T_IDENT { result = val[0] }
+  # universal: [ namespace_prefix ]? '*'
+  universal:
+    namespace_prefix T_ASTERISK { result = AST::Selector::Universal.new(namespace_prefix: val[0]) }
+    | T_ASTERISK { result = AST::Selector::Universal.new }
+  # class: '.' IDENT
+  class: T_DOT T_IDENT { result = AST::Selector::Class.new(val[1]) }
+  # attrib: '[' S* [ namespace_prefix ]? IDENT S*
+  #  [ [ PREFIXMATCH |
+  #      SUFFIXMATCH |
+  #      SUBSTRINGMATCH |
+  #      '=' |
+  #      INCLUDES |
+  #      DASHMATCH ] S* [ IDENT | STRING ] S*
+  #  ]? ']'
+  attrib:
+    T_LBRACK optional_whitespaces namespace_prefix T_IDENT optional_whitespaces optional_attrib_clause T_RBRACK {
+      op, value = val[4]
+      result = AST::Selector::Attrib.fetch(op).new(key: val[2], value: value, namespace_prefix: val[2])
+    }
+    | T_LBRACK optional_whitespaces T_IDENT optional_whitespaces optional_attrib_clause T_RBRACK {
+      op, value = val[4]
+      result = AST::Selector::Attrib.fetch(op).new(key: val[2], value: value)
+    }
+  optional_attrib_clause:
+    | attrib_operators optional_whitespaces T_IDENT optional_whitespaces { result = [val[0], val[2]] }
+    | attrib_operators optional_whitespaces T_STRING optional_whitespaces { result = [val[0], val[2]] }
+  attrib_operators:
+    T_PREFIXMATCH      { result = :prefix_match }
+    | T_SUFFIXMATCH    { result = :suffix_match }
+    | T_SUBSTRINGMATCH { result = :substring_match }
+    | T_EQUAL          { result = :equal }
+    | T_INCLUDES       { result = :includes }
+    | T_DASHMATCH      { result = :dash_match }
+  # pseudo: ':' ':'? [ IDENT | functional_pseudo ]
+  pseudo:
+    T_COLON optional_colon T_IDENT { result = AST::Selector::Pseudo.fetch(val[2]).new }
+    | T_COLON optional_colon functional_pseudo { result = val[2] }
+  optional_colon: | T_COLON
+  # functional_pseudo: FUNCTION S* expression ')'
+  functional_pseudo:
+    T_FUNCTION optional_whitespaces repeatable_expressions T_RPAREN { result = AST::Selector::Pseudo.fetch(val[0].slice(0..-2)).new(val[2]) }
+  # expression: [ [ PLUS | '-' | DIMENSION | NUMBER | STRING | IDENT ] S* ]+
+  expression:
+    T_PLUS | T_MINUS | T_HYPHEN | T_DIMENSION | T_NUMBER | T_STRING | T_IDENT { result = val[0] }
+  repeatable_expressions:
+    expression optional_whitespaces { result = [val[0]] }
+    | repeatable_expressions expression optional_whitespaces {
+      val[0] << val[1]
+      result = val[0]
+    }
+  # negation: NOT S* negation_arg S* ')'
+  negation:
+    T_NOT optional_whitespaces negation_arg optional_whitespaces T_RPAREN { result = AST::Selector::Negation.new(val[2]) }
+  # negation_arg: type_selector | universal | HASH | class | attrib | pseudo
+  negation_arg:
+    type_selector | universal | hash | class | attrib | pseudo
+  hash:
+    T_HASH { result = AST::Selector::ID.new(val[0]) }
+end
+---- inner
+  NONASCII = /[^\0-\177]/
+  UNICODE  = /\\[0-9a-f]{1,6}(\r\n|[ \n\r\t\f])?/
+  ESCAPE   = /#{UNICODE}|\\[^\n\r\f0-9a-f]/
+  NMCHAR   = /[_a-z0-9-]|#{NONASCII}|#{ESCAPE}/
+  NMSTART  = /[_a-z]|#{NONASCII}|#{ESCAPE}/
+  NUM      = /[0-9]+|[0-9]*\.[0-9]+/
+  NAME     = /#{NMCHAR}+/
+  IDENT    = /[-]?#{NMSTART}#{NMCHAR}*/
+  NL       = /\n|\r\n|\r|\f/
+  STRING1  = /\"([^\n\r\f\\"]|\\#{NL}|#{NONASCII}|#{ESCAPE})*\"/
+  STRING2  = /\'([^\n\r\f\\']|\\#{NL}|#{NONASCII}|#{ESCAPE})*\'/
+  STRING   = /#{STRING1}|#{STRING2}/
+  INVALID1 = /\"([^\n\r\f\\"]|\\#{NL}|#{NONASCII}|#{ESCAPE})*/
+  INVALID2 = /\'([^\n\r\f\\']|\\#{NL}|#{NONASCII}|#{ESCAPE})*/
+  INVALID  = /#{INVALID1}|#{INVALID2}/
+  W        = /[ \t\r\n\f]*/
+  D        = /d|\\0{0,4}(44|64)(\r\n|[ \t\r\n\f])?/
+  E        = /e|\\0{0,4}(45|65)(\r\n|[ \t\r\n\f])?/
+  N        = /n|\\0{0,4}(4e|6e)(\r\n|[ \t\r\n\f])?|\\n/
+  O        = /o|\\0{0,4}(4f|6f)(\r\n|[ \t\r\n\f])?|\\o/
+  T        = /t|\\0{0,4}(54|74)(\r\n|[ \t\r\n\f])?|\\t/
+  # 'V' is U+0056 and 'v' is U+0076 (58/78 would be 'X'/'x').
+  V        = /v|\\0{0,4}(56|76)(\r\n|[ \t\r\n\f])?|\\v/
+  S        = /[ \t\r\n\f]+/
+  require 'strscan'
+  require 'forwardable'
+  require 'gammo/css_selector/errors'
+  require 'gammo/css_selector/ast/selector'
+  require 'gammo/css_selector/ast/combinator'
+  extend Forwardable
+  def_delegators :@scanner, :scan, :eos?
+  def initialize(input)
+    super()
+    @yydebug = true
+    @input = input
+    @scanner = StringScanner.new(input)
+  end
+  def parse
+    @query = []
+    advance { |symbol, val| @query << [symbol, val] }
+    do_parse
+  end
+  def token(symbol, val, &block)
+    @prev_token = symbol
+    block.call(symbol, val)
+  end
+  def next_token
+    @query.shift
+  end
+  EXPR_TOKENS = {
+    '='  => :T_EQUAL,
+    '['  => :T_LBRACK,
+    ']'  => :T_RBRACK,
+    ')'  => :T_RPAREN,
+    '.'  => :T_DOT,
+    ','  => :T_COMMA,
+    ':'  => :T_COLON
+  }.freeze
+  # Declaring the regexp consisting of EXPR_TOKENS keys to keep the token order.
+  EXPRS = /=|\[|\]|@|,|\.|\)|\:/
+  def fetch(key, constraints)
+    unless symbol = constraints[key]
+      fail ParseError, "unexpected token: #{symbol}, want = #{constraints.keys}"
+    end
+    yield symbol
+  end
+  LEXER_TOKENS = []
+  Pattern = Struct.new(:pattern, :token, :range)
+  def self.map(pattern, token, range: nil)
+    LEXER_TOKENS << Pattern.new(pattern, token, range)
+  end
+  map(S,                 :T_S)
+  map(/\~=/,             :T_INCLUDES)
+  map(/\|=/,             :T_DASHMATCH)
+  map(/\^=/,             :T_PREFIXMATCH)
+  map(/\$=/,             :T_SUFFIXMATCH)
+  map(/\*=/,             :T_SUBSTRINGMATCH)
+  map(/<!--/,            :T_CDO)
+  map(/-->/,             :T_CDC)
+  map(/#{IDENT}\(/,      :T_FUNCTION)
+  map(/#{NUM}%/,         :T_PERCENTAGE)
+  map(/#{NUM}#{IDENT}/,  :T_DIMENSION)
+  map(IDENT,             :T_IDENT)
+  map(STRING,            :T_STRING, range: 1..-2) # Remove quotes
+  map(NUM,               :T_NUMBER)
+  map(/##{NAME}/,        :T_HASH,   range: 1..-1) # Remove hash ('#')
+  map(/#{W}\+/,          :T_PLUS)
+  map(/#{W}\-/,          :T_MINUS)
+  map(/#{W}>/,           :T_GREATER)
+  map(/#{W},/,           :T_COMMA)
+  map(/#{W}~/,           :T_TILDE)
+  map(/:#{N}#{O}#{T}\(/, :T_NOT)
+  map(/@#{IDENT}/,       :T_ATKEYWORD)
+  map(/#{INVALID}/,      :T_INVALID)
+  map(/\|/,              :T_PIPE)
+  map(/\*/,              :T_ASTERISK)
+  # TODO: ignore comment token
+  def advance(&block)
+    @prev_token = nil
+    until eos?
+      next if LEXER_TOKENS.find do |pattern|
+        next false unless matched = scan(pattern.pattern)
+        matched = matched[pattern.range] if pattern.range
+        token pattern.token, matched, &block
+        break true
+      end
+      if expr = scan(EXPRS)
+        fetch(expr, EXPR_TOKENS) { |symbol| token symbol, expr, &block }
+        next
+      end
+      fail ParseError, "unexpected token: '#{@scanner.string[@scanner.pos..-1]}'"
+    end
+  end

data/lib/gammo/css_selector.rb ADDED Viewed

@@ -0,0 +1,33 @@
+require 'gammo/css_selector/context'
+require 'gammo/css_selector/parser'
+module Gammo
+  module CSSSelector
+    # Class for traversing DOM tree built by Gammo::Parser by a given expresison.
+    # @!visibility private
+    class Traverser
+      # Constructs an instance of Gammo::CSSSelector::Traverser.
+      # @param [String] expr
+      # @!visibility private
+      def initialize(expr)
+        @expr = expr
+      end
+      # Evaluates a given expression and returns a node set.
+      # @param [Gammo::CSSSelector::Context] context
+      # @return [Gammo::CSSSelector::NodeSet]
+      # @!visibility private
+      def evaluate(context)
+        Parser.new(@expr).parse.evaluate(context)
+      end
+    end
+    # Traverses DOM tree by a given expression, and returns a node set.
+    # @param [String] expr
+    # @return [Gammo::CSSSelector::NodeSet]
+    def query_selector_all(expr)
+      Traverser.new(expr).evaluate(Context.new(node: self))
+    end
+    alias_method :css, :query_selector_all
+  end
+end

data/lib/gammo/modules/subclassify.rb ADDED Viewed

@@ -0,0 +1,31 @@
+module Gammo
+  # Class for making subclass declarable/fetchable
+  # @!visibility private
+  module Subclassify
+    NotFoundError = Class.new(ArgumentError)
+    # @!visibility private
+    def map
+      @map ||= {}
+    end
+    # @!visibility private
+    def declare(key)
+      look_for_superclass.map[key] = self
+    end
+    # @!visibility private
+    def fetch(key)
+      fail NotFoundError, "%s not found" % key unless klass = map[key.to_sym]
+      klass
+    end
+    private
+    # @!visibility private
+    def look_for_superclass
+      klass = superclass
+      ancestors.find { |ancestor| ancestor == klass }
+    end
+  end
+end

data/lib/gammo/node.rb CHANGED Viewed

@@ -1,3 +1,4 @@
+require 'gammo/css_selector'
 require 'gammo/xpath'
 require 'gammo/attributes'
@@ -58,6 +59,7 @@ module Gammo
     # Represents the root document token.
     class Document < Node
       include XPath
+      include CSSSelector
     end
     # Represents the element token including start, end and self-closing token.

data/lib/gammo/parser/foreign.rb CHANGED Viewed

@@ -177,7 +177,7 @@ module Gammo
       def parse_foreign_content
         case token
-        when Tokenizer::TextToken
+        when Tokenizer::CharacterToken
           self.frameset_ok = token.data.lstrip.sub(/\A\x00*/, '').lstrip.empty? if frameset_ok
           token.data = token.data.gsub(/\x00/, "\ufffd")
           add_text token.data
@@ -249,11 +249,11 @@ module Gammo
         if math_ml_text_integration_point?(node)
           return false if token.instance_of?(Tokenizer::StartTagToken) && token.tag != Tags::Mglyph &&
             token.tag != Tags::Malignmark
-          return false if token.instance_of?(Tokenizer::TextToken)
+          return false if token.instance_of?(Tokenizer::CharacterToken)
         end
         return false if node.namespace == 'math' && node.tag == Tags::AnnotationXml && \
           token.instance_of?(Tokenizer::StartTagToken) && token.tag == Tags::Svg
-        return false if html_integration_point?(node) && (token.instance_of?(Tokenizer::StartTagToken) || token.instance_of?(Tokenizer::TextToken))
+        return false if html_integration_point?(node) && (token.instance_of?(Tokenizer::StartTagToken) || token.instance_of?(Tokenizer::CharacterToken))
         return false if token.instance_of? Tokenizer::ErrorToken
         true
       end

data/lib/gammo/parser/insertion_mode/after_after_body.rb CHANGED Viewed

@@ -7,7 +7,7 @@ module Gammo
         halt true
       end
-      def text_token(token)
+      def character_token(token)
         halt InBody.new(parser).process if token.data.lstrip.length.zero?
       end

data/lib/gammo/parser/insertion_mode/after_after_frameset.rb CHANGED Viewed

@@ -6,7 +6,7 @@ module Gammo
         parser.document.append_child Node::Comment.new(data: token.data)
       end
-      def text_token(token)
+      def character_token(token)
         halt InBody.new(parser).process unless token.data.gsub(/[^\s]/, '').empty?
       end

data/lib/gammo/parser/insertion_mode/after_body.rb CHANGED Viewed

@@ -8,7 +8,7 @@ module Gammo
         true
       end
-      def text_token(token)
+      def character_token(token)
         s = token.data.lstrip
         halt InBody.new(parser).process if s.length.zero?
       end

data/lib/gammo/parser/insertion_mode/after_frameset.rb CHANGED Viewed

@@ -8,7 +8,7 @@ module Gammo
         parser.add_child Node::Comment.new(data: token.data)
       end
-      def text_token(token)
+      def character_token(token)
         s = token.data.gsub(/[^\s]/, '')
         parser.add_text(s) unless s.empty?
       end

data/lib/gammo/parser/insertion_mode/after_head.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.5.
     class AfterHead < InsertionMode
-      def text_token(token)
+      def character_token(token)
         s = token.data.lstrip
         if s.length < token.data.length
           # add the initial whitespace to the current node.

data/lib/gammo/parser/insertion_mode/before_head.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.3
     class BeforeHead < InsertionMode
-      def text_token(token)
+      def character_token(token)
         token.data = token.data.lstrip
         halt true if token.data.length.zero?
       end

data/lib/gammo/parser/insertion_mode/before_html.rb CHANGED Viewed

@@ -7,7 +7,7 @@ module Gammo
         halt true
       end
-      def text_token(token)
+      def character_token(token)
         token.data = token.data.lstrip
         # it's all whitespace so ignore it.
         halt true if token.data.length.zero?

data/lib/gammo/parser/insertion_mode/in_body.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.6.
     class InBody < InsertionMode
-      def text_token(token)
+      def character_token(token)
         data = token.data
         node = parser.open_elements.last
         case node.tag

data/lib/gammo/parser/insertion_mode/in_column_group.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.12.
     class InColumnGroup < InsertionMode
-      def text_token(token)
+      def character_token(token)
         s = token.data.lstrip
         if s.length < token.data.length
           # add the initial whitespace to the current node.

data/lib/gammo/parser/insertion_mode/in_frameset.rb CHANGED Viewed

@@ -6,7 +6,7 @@ module Gammo
         parser.add_child Node::Comment.new(data: token.data)
       end
-      def text_token(token)
+      def character_token(token)
         text = token.data.each_char.with_object(String.new) { |c, s| s << c if c == ?\s }
         parser.add_text(text) if text != ''
       end

data/lib/gammo/parser/insertion_mode/in_head.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.4.
     class InHead < InsertionMode
-      def text_token(token)
+      def character_token(token)
         s = token.data.lstrip
         if s.length < token.data.length
           # add the initial whitespace to the current node.
@@ -90,7 +90,8 @@ module Gammo
       end
       def default(_)
-        parser.parse_implied_token(Tokenizer::EndTagToken, Tags::Head, Tags::Head.to_s)
+        parser.open_elements.pop
+        parser.insertion_mode = AfterHead
         halt false
       end
     end

data/lib/gammo/parser/insertion_mode/in_head_noscript.rb CHANGED Viewed

@@ -36,7 +36,7 @@ module Gammo
         end
       end
-      def text_token(token)
+      def character_token(token)
         halt InHead.new(parser).process if token.data.lstrip == ''
       end

data/lib/gammo/parser/insertion_mode/in_select.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.16.
     class InSelect < InsertionMode
-      def text_token(token)
+      def character_token(token)
         parser.add_text token.data.gsub("\x00",'')
       end

data/lib/gammo/parser/insertion_mode/in_table.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.9.
     class InTable < InsertionMode
-      def text_token(token)
+      def character_token(token)
         token.data = token.data.gsub("\x00", "")
         case parser.open_elements.last.tag
         when Tags::Table, Tags::Tbody, Tags::Tfoot, Tags::Thead, Tags::Tr

data/lib/gammo/parser/insertion_mode/in_template.rb CHANGED Viewed

@@ -2,7 +2,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.18.
     class InTemplate < InsertionMode
-      def text_token(token)
+      def character_token(token)
         halt InBody.new(parser).process
       end

data/lib/gammo/parser/insertion_mode/initial.rb CHANGED Viewed

@@ -4,7 +4,7 @@ module Gammo
   class Parser
     # Section 12.2.6.4.1
     class Initial < InsertionMode
-      def text_token(token)
+      def character_token(token)
         token.data = token.data.lstrip
         # it's all whitespace so ignore it.
         halt true if token.data.length.zero?

data/lib/gammo/parser/insertion_mode/text.rb CHANGED Viewed

@@ -6,7 +6,7 @@ module Gammo
         parser.open_elements.pop
       end
-      def text_token(token)
+      def character_token(token)
         d = token.data
         n = parser.open_elements.last
         if n.tag == Tags::Textarea && n.first_child.nil?

data/lib/gammo/parser/insertion_mode.rb CHANGED Viewed

@@ -12,7 +12,7 @@ module Gammo
       def process
         case token = parser.token
         when Tokenizer::ErrorToken          then consume(:error_token)
-        when Tokenizer::TextToken           then consume(:text_token)
+        when Tokenizer::CharacterToken      then consume(:character_token)
         when Tokenizer::StartTagToken       then consume(:start_tag_token)
         when Tokenizer::EndTagToken         then consume(:end_tag_token)
         when Tokenizer::SelfClosingTagToken then consume(:self_closing_tag_token)

data/lib/gammo/tokenizer/tokens.rb CHANGED Viewed

@@ -14,6 +14,15 @@ module Gammo
       def concat(s)
         data << s
       end
+      def to_s
+        s = "<#{self.class}"
+        members = []
+        members << "tag=\"#{tag}\"" if tag
+        members << "data=\"#{data}\"" if data
+        members << "attributes=\"#{attributes}\"" if attributes && !attributes.empty?
+        "<#{self.class} #{members.join(' ')}>"
+      end
     end
     class EscapedToken < BaseToken
@@ -56,7 +65,7 @@ module Gammo
     end
     ErrorToken          = Class.new(BaseToken)
-    TextToken           = Class.new(EscapedToken)
+    CharacterToken      = Class.new(EscapedToken)
     StartTagToken       = Class.new(BaseToken)
     EndTagToken         = Class.new(BaseToken)
     SelfClosingTagToken = Class.new(BaseToken)