RubyGems - asciidoctor - Versions diffs - 0.0.7 → 0.0.9 - Mend

asciidoctor 0.0.7 → 0.0.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of asciidoctor might be problematic. Click here for more details.

Files changed (47) hide show

data/Gemfile +2 -0
data/README.asciidoc +35 -26
data/Rakefile +9 -6
data/asciidoctor.gemspec +27 -8
data/bin/asciidoctor +1 -1
data/lib/asciidoctor.rb +351 -63
data/lib/asciidoctor/abstract_block.rb +218 -0
data/lib/asciidoctor/abstract_node.rb +249 -0
data/lib/asciidoctor/attribute_list.rb +211 -0
data/lib/asciidoctor/backends/base_template.rb +99 -0
data/lib/asciidoctor/backends/docbook45.rb +510 -0
data/lib/asciidoctor/backends/html5.rb +585 -0
data/lib/asciidoctor/block.rb +27 -254
data/lib/asciidoctor/callouts.rb +117 -0
data/lib/asciidoctor/debug.rb +7 -4
data/lib/asciidoctor/document.rb +229 -77
data/lib/asciidoctor/inline.rb +29 -0
data/lib/asciidoctor/lexer.rb +1330 -502
data/lib/asciidoctor/list_item.rb +33 -34
data/lib/asciidoctor/reader.rb +305 -142
data/lib/asciidoctor/renderer.rb +115 -19
data/lib/asciidoctor/section.rb +100 -189
data/lib/asciidoctor/substituters.rb +468 -0
data/lib/asciidoctor/table.rb +499 -0
data/lib/asciidoctor/version.rb +1 -1
data/test/attributes_test.rb +301 -87
data/test/blocks_test.rb +568 -0
data/test/document_test.rb +221 -24
data/test/fixtures/dot.gif +0 -0
data/test/fixtures/encoding.asciidoc +1 -0
data/test/fixtures/include-file.asciidoc +1 -0
data/test/fixtures/tip.gif +0 -0
data/test/headers_test.rb +411 -43
data/test/lexer_test.rb +265 -45
data/test/links_test.rb +144 -3
data/test/lists_test.rb +2252 -74
data/test/paragraphs_test.rb +21 -30
data/test/preamble_test.rb +24 -0
data/test/reader_test.rb +248 -12
data/test/renderer_test.rb +22 -0
data/test/substitutions_test.rb +414 -0
data/test/tables_test.rb +484 -0
data/test/test_helper.rb +70 -6
data/test/text_test.rb +30 -6
metadata +64 -10
data/lib/asciidoctor/render_templates.rb +0 -317
data/lib/asciidoctor/string.rb +0 -12

data/lib/asciidoctor/debug.rb CHANGED

@@ -1,6 +1,8 @@
 module Asciidoctor
-  def self.debug(*args)
-    puts *args if self.show_debug_output?
+  @show_debug = nil
+  def self.debug
+    puts yield if self.show_debug_output?
   end
   def self.set_debug(value)
@@ -12,9 +14,10 @@ module Asciidoctor
   end
   def self.puts_indented(level, *args)
-    thing = " "*level*2
+    indentation = " " * level * 2
     args.each do |arg|
-      self.debug "#{thing}#{arg}"
+      self.debug { "#{indentation}#{arg}" }
     end
   end
 end

data/lib/asciidoctor/document.rb CHANGED

@@ -1,73 +1,194 @@
 # Public: Methods for parsing Asciidoc documents and rendering them
 # using erb templates.
-class Asciidoctor::Document
+#
+# There are several strategies for getting the title of the document:
+#
+# doctitle - value of title attribute, if assigned and non-empty,
+#            otherwise title of first section in document, if present
+#            otherwise nil
+# name - an alias of doctitle
+# title - value of the title attribute, or nil if not present
+# first_section.title - title of first section in document, if present
+# header.title - title of section level 0
+#
+# Keep in mind that you'll want to honor these document settings:
+#
+# notitle  - The h1 heading should not be shown
+# noheader - The header block (h1 heading, author, revision info) should not be shown
+class Asciidoctor::Document < Asciidoctor::AbstractBlock
   include Asciidoctor
-  # Public: Get the Hash of attributes
-  attr_reader :attributes
+  # Public: A read-only integer value indicating the level of security that
+  # should be enforced while processing this document. The value must be
+  # set in the Document constructor using the :safe option.
+  #
+  # A value of 0 (UNSAFE) disables any of the security features enforced
+  # by Asciidoctor (Ruby is still subject to its own restrictions).
+  #
+  # A value of 1 (SAFE) closely parallels safe mode in AsciiDoc. In particular,
+  # it prevents access to files which reside outside of the parent directory
+  # of the source file and disables any macro other than the include macro.
+  #
+  # A value of 10 (SECURE) disallows the document from attempting to read
+  # files from the file system and including the contents of them into the
+  # document. In particular, it disallows use of the include::[] macro and the
+  # embedding of binary content (data uri), stylesheets and JavaScripts
+  # referenced by the document. (Asciidoctor and trusted extensions may still
+  # be allowed to embed trusted content into the document). Since Asciidoctor
+  # is aiming for wide adoption, this value is the default and is recommended
+  # for server-side deployments.
+  #
+  # A value of 100 (PARANOID) is planned to disallow the use of passthrough
+  # macros and prevents the document from setting any known attributes in
+  # addition to all the security features of SafeMode::SECURE. Please note that
+  # this level is not currently implemented (and therefore not enforced)!
+  attr_reader :safe
   # Public: Get the Hash of document references
   attr_reader :references
-  # The section level 0 element
+  # Public: Get the Hash of callouts
+  attr_reader :callouts
+  # Public: The section level 0 block
   attr_reader :header
-  # Public: Get the Array of elements (really Blocks or Sections) for the document
-  attr_reader :elements
+  # Public: Base directory for rendering this document
+  attr_reader :base_dir
+  # Public: A reference to the parent document of this nested document.
+  attr_reader :parent_document
   # Public: Initialize an Asciidoc object.
   #
-  # data  - The Array of Strings holding the Asciidoc source document.
-  # block - A block that can be used to retrieve external Asciidoc
-  #         data to include in this document.
+  # data    - The Array of Strings holding the Asciidoc source document. (default: [])
+  # options - A Hash of options to control processing, such as setting the safe mode (:safe),
+  #           suppressing the header/footer (:header_footer) and attribute overrides (:attributes)
+  #           (default: {})
+  # block   - A block that can be used to retrieve external Asciidoc
+  #           data to include in this document.
   #
   # Examples
   #
   #   data = File.readlines(filename)
   #   doc  = Asciidoctor::Document.new(data)
-  def initialize(data, options = {}, &block)
-    @elements = []
+  #   puts doc.render
+  def initialize(data = [], options = {}, &block)
+    super(self, :document)
+    @renderer = nil
+    if options[:parent]
+      @parent_document = options.delete(:parent)
+      # should we dup here?
+      options[:attributes] = @parent_document.attributes
+      @renderer = @parent_document.renderer
+    else
+      @parent_document = nil
+    end
+    @header = nil
+    @references = {
+      :ids => {},
+      :links => [],
+      :images => []
+    }
+    @callouts = Callouts.new
     @options = options
+    @safe = @options.fetch(:safe, SafeMode::SECURE).to_i
     @options[:header_footer] = @options.fetch(:header_footer, true)
-    @attributes = {}
-    @attributes['sectids'] = nil
+    @attributes['asciidoctor'] = true
+    @attributes['asciidoctor-version'] = VERSION
+    @attributes['sectids'] = true
+    @attributes['encoding'] = 'UTF-8'
-    @reader = Reader.new(data, @attributes, &block)
+    attribute_overrides = options[:attributes] || {}
-    # pseudo-delegation :)
-    #@attributes = @reader.attributes
-    @references = @reader.references
+    # the only way to set the include-depth attribute is via the document options
+    # 10 is the AsciiDoc default, though currently Asciidoctor only supports 1 level
+    attribute_overrides['include-depth'] ||= 10
+    # TODO we should go with one or the other, this is confusing
+    # for now, base_dir takes precedence if set
+    if options.has_key? :base_dir
+      @base_dir = attribute_overrides['docdir'] = options[:base_dir]
+    else
+      attribute_overrides['docdir'] ||= Dir.pwd
+      @base_dir = attribute_overrides['docdir']
+    end
+    # restrict document from setting source-highlighter in SECURE safe mode
+    # it can only be set via the constructor
+    if @safe >= SafeMode::SECURE
+      attribute_overrides['source-highlighter'] ||= nil
+    end
+    attribute_overrides.each {|key, val|
+      # a nil or negative key undefines the attribute
+      if (val.nil? || key[-1..-1] == '!')
+        @attributes.delete(key.chomp '!')
+      # otherwise it's an attribute assignment
+      else
+        @attributes[key] = val
+      end
+    }
+    @attributes['backend'] ||= DEFAULT_BACKEND
+    update_backend_attributes
+    if nested?
+      # don't need to do the extra processing within our own document
+      @reader = Reader.new(data)
+    else
+      @reader = Reader.new(data, self, attribute_overrides, &block)
+    end
     # dynamic intrinsic attribute values
     @attributes['doctype'] ||= DEFAULT_DOCTYPE
     now = Time.new
     @attributes['localdate'] ||= now.strftime('%Y-%m-%d')
     @attributes['localtime'] ||= now.strftime('%H:%m:%S %Z')
     @attributes['localdatetime'] ||= [@attributes['localdate'], @attributes['localtime']].join(' ')
-    @attributes['asciidoctor-version'] = VERSION
+    # docdate and doctime should default to localdate and localtime if not otherwise set
+    @attributes['docdate'] ||= @attributes['localdate']
+    @attributes['doctime'] ||= @attributes['localtime']
+    @attributes['iconsdir'] ||= File.join(@attributes.fetch('imagesdir', 'images'), 'icons')
-    # Now parse @lines into elements
-    while @reader.has_lines?
-      @reader.skip_blank
+    # Now parse the lines in the reader into blocks
+    Lexer.parse(@reader, self)
+    # or we could make it...
+    #self << *Lexer.parse(@reader, self)
-      @elements << Lexer.next_block(@reader, self) if @reader.has_lines?
-    end
+    @callouts.rewind
-    Asciidoctor.debug "Found #{@elements.size} elements in this document:"
-    @elements.each do |el|
-      Asciidoctor.debug el
-    end
+    Asciidoctor.debug {
+      msg = []
+      msg << "Found #{@blocks.size} blocks in this document:"
+      @blocks.each {|b|
+        msg << b
+      }
+      msg * "\n"
+    }
+  end
-    # split off the level 0 section, if present
-    root = @elements.first
-    if root.is_a?(Section) && root.level == 0
-      @header = @elements.shift
-      @elements = @header.blocks
-      @header.clear_blocks
+  def register(type, value)
+    if type == :ids
+      if value.is_a?(Array)
+        @references[:ids][value[0]] = (value[1] || '[' + value[0] + ']')
+      else
+        @references[:ids][value] = '[' + value + ']'
+      end
+    elsif @options[:catalog_assets]
+      @references[type] << value
     end
+  end
+  def nested?
+    !@parent_document.nil?
   end
   # Make the raw source for the Document available.
@@ -75,18 +196,8 @@ class Asciidoctor::Document
     @reader.source if @reader
   end
-  def attr(name, default = nil)
-    default.nil? ? @attributes[name.to_s] : @attributes.fetch(name.to_s, default)
-    #default.nil? ? @attributes[name.to_s.tr('_', '-')] : @attributes.fetch(name.to_s.tr('_', '-'), default)
-  end
-  def attr?(name)
-    @attributes.has_key? name.to_s
-    #@attributes.has_key? name.to_s.tr('_', '-')
-  end
-  def level
-    0
+  def doctype
+    @attributes['doctype']
   end
   # The title explicitly defined in the document attributes
@@ -94,18 +205,20 @@ class Asciidoctor::Document
     @attributes['title']
   end
+  def title=(title)
+    @header = Section.new self
+    @header.title = title
+  end
   # We need to be able to return some semblance of a title
   def doctitle
-    # cached value
-    return @doctitle if @doctitle
-    if @header
-      @doctitle = @header.title
-    elsif @elements.first
-      @doctitle = @elements.first.title
+    if !(title = @attributes.fetch('title', '')).empty?
+      title
+    elsif !(sect = first_section).nil? && sect.title?
+      sect.title
+    else
+      nil
     end
-    @doctitle
   end
   alias :name :doctitle
@@ -113,33 +226,71 @@ class Asciidoctor::Document
     @attributes.has_key? 'notitle'
   end
-  def splain
-    if @header
-      Asciidoctor.debug "Header is #{@header}"
+  def noheader
+    @attributes.has_key? 'noheader'
+  end
+  # QUESTION move to AbstractBlock?
+  def first_section
+    has_header? ? @header : (@blocks || []).detect{|e| e.is_a? Section}
+  end
+  def has_header?
+    !@header.nil?
+  end
+  # Public: Update the backend attributes to reflect a change in the selected backend
+  def update_backend_attributes()
+    backend = @attributes['backend']
+    basebackend = backend.sub(/[[:digit:]]+$/, '')
+    page_width = DEFAULT_PAGE_WIDTHS[basebackend]
+    if page_width
+      @attributes['pagewidth'] = page_width
     else
-      Asciidoctor.debug "No header"
+      @attributes.delete('pagewidth')
     end
+    @attributes['backend-' + backend] = 1
+    @attributes['basebackend'] = basebackend
+    @attributes['basebackend-' + basebackend] = 1
+  end
-    Asciidoctor.debug "I have #{@elements.count} elements"
-    @elements.each_with_index do |block, i|
-      Asciidoctor.debug "v" * 60
-      Asciidoctor.debug "Block ##{i} is a #{block.class}"
-      Asciidoctor.debug "Name is #{block.name rescue 'n/a'}"
-      block.splain(0) if block.respond_to? :splain
-      Asciidoctor.debug "^" * 60
-    end
+  def splain
+    Asciidoctor.debug {
+      msg = ''
+      if @header
+        msg = "Header is #{@header}"
+      else
+        msg = "No header"
+      end
+      msg += "I have #{@blocks.count} blocks"
+      @blocks.each_with_index do |block, i|
+        msg += "v" * 60
+        msg += "Block ##{i} is a #{block.class}"
+        msg += "Name is #{block.title rescue 'n/a'}"
+        block.splain(0) if block.respond_to? :splain
+        msg += "^" * 60
+      end
+    }
     nil
   end
-  def renderer(options = {})
+  def renderer(opts = {})
     return @renderer if @renderer
     render_options = {}
     # Load up relevant Document @options
     if @options[:template_dir]
       render_options[:template_dir] = @options[:template_dir]
     end
+    render_options[:backend] = @attributes.fetch('backend', 'html5')
+    render_options[:eruby] = @options.fetch(:eruby, 'erb')
+    render_options[:compact] = @options.fetch(:compact, false)
     # Override Document @option settings with options passed in
-    render_options.merge! options
+    render_options.merge! opts
     @renderer = Renderer.new(render_options)
   end
@@ -148,18 +299,19 @@ class Asciidoctor::Document
   # loaded by Renderer. If a :template_dir is not specified,
   # or a template is missing, the renderer will fall back to
   # using the appropriate built-in template.
-  def render(options = {})
-    r = renderer(options)
-    @options.merge(options)[:header_footer] ? r.render('document', self) : content
+  def render(opts = {})
+    r = renderer(opts)
+    @options.merge(opts)[:header_footer] ? r.render('document', self) : r.render('embedded', self)
   end
   def content
-    html_pieces = []
-    @elements.each do |element|
-      Asciidoctor::debug "Rendering element: #{element}"
-      html_pieces << element.render
-    end
-    html_pieces.join
+    # per AsciiDoc-spec, remove the title after rendering the header
+    @attributes.delete('title')
+    @blocks.map {|b| b.render }.join
+  end
+  def to_s
+    %[#{super.to_s} - #{doctitle}]
   end
 end

data/lib/asciidoctor/inline.rb ADDED

@@ -0,0 +1,29 @@
+# Public: Methods for managing inline elements in AsciiDoc block
+class Asciidoctor::Inline < Asciidoctor::AbstractNode
+  # Public: Get the text of this inline element
+  attr_reader :text
+  # Public: Get the type (qualifier) of this inline element
+  attr_reader :type
+  # Public: Get/Set the target (e.g., uri) of this inline element
+  attr_accessor :target
+  def initialize(parent, context, text = nil, opts = {})
+    super(parent, context)
+    @text = text
+    @id = opts[:id] if opts.has_key?(:id)
+    @type = opts[:type] if opts.has_key?(:type)
+    @target = opts[:target] if opts.has_key?(:target)
+    if opts.has_key?(:attributes) && (attributes = opts[:attributes]).is_a?(Hash)
+      update_attributes(opts[:attributes]) unless attributes.empty?
+    end
+  end
+  def render
+    renderer.render("inline_#{@context}", self).chomp
+  end
+end

data/lib/asciidoctor/lexer.rb CHANGED

@@ -1,199 +1,380 @@
-# Public: Methods to parse and build objects from Asciidoc lines
+# Public: Methods to parse lines of AsciiDoc into an object hierarchy
+# representing the structure of the document. All methods are class methods and
+# should be invoked from the Lexer class. The main entry point is ::next_block.
+# No Lexer instances shall be discovered running around. (Any attempt to
+# instantiate a Lexer will be futile).
+#
+# The object hierarchy created by the Lexer consists of zero or more Section
+# and Block objects. Section objects may be nested and a Section object
+# contains zero or more Block objects. Block objects may be nested, but may
+# only contain other Block objects. Block objects which represent lists may
+# contain zero or more ListItem objects.
+#
+# Examples
+#
+#   # Create a Reader for the AsciiDoc lines and retrieve the next block from it.
+#   # Lexer::next_block requires a parent, so we begin by instantiating an empty Document.
+#
+#   doc = Document.new
+#   reader = Reader.new lines
+#   block = Lexer.next_block(reader, doc)
+#   block.class
+#   # => Asciidoctor::Block
 class Asciidoctor::Lexer
   include Asciidoctor
   # Public: Make sure the Lexer object doesn't get initialized.
+  #
+  # Raises RuntimeError if this constructor is invoked.
   def initialize
     raise 'Au contraire, mon frere. No lexer instances will be running around.'
   end
-  def self.document_from_parent(parent)
-    if parent.is_a? Document
-      parent
+  # Public: Parses AsciiDoc source read from the Reader into the Document
+  #
+  # This method is the main entry-point into the Lexer when parsing a full document.
+  # It first looks for and, if found, processes the document title. It then
+  # proceeds to iterate through the lines in the Reader, parsing the document
+  # into nested Sections and Blocks.
+  #
+  # reader   - the Reader holding the source lines of the document
+  # document - the empty Document into which the lines will be parsed
+  #
+  # returns the Document object
+  def self.parse(reader, document)
+    # process and plow away any attribute lines that precede the first block so
+    # we can get at the document title, if present, then begin parsing blocks
+    attributes = parse_block_metadata_lines(reader, document)
+    # by processing the header here, we enforce its position at head of the document
+    next_level = is_next_line_section? reader
+    if next_level == 0
+      title_info = parse_section_title(reader)
+      document.title = title_info[1]
+      parse_header_metadata(reader, document)
+    end
+    while reader.has_lines?
+      new_section, attributes = next_section(reader, document, attributes)
+      document << new_section unless new_section.nil?
+    end
+    document
+  end
+  # Public: Return the next section from the Reader.
+  #
+  # This method processes block metadata, content and subsections for this
+  # section and returns the Section object and any orphaned attributes.
+  #
+  # If the parent is a Document and has a header (document title), then
+  # this method will put any non-section blocks at the start of document
+  # into a preamble Block. If there are no such blocks, the preamble is
+  # dropped.
+  #
+  # Since we are reading line-by-line, there's a chance that metadata
+  # that should be associated with the following block gets consumed.
+  # To deal with this case, the method returns a running Hash of
+  # "orphaned" attributes that get passed to the next Section or Block.
+  #
+  # reader     - the source Reader
+  # parent     - the parent Section or Document of this new section
+  # attributes - a Hash of metadata that was left orphaned from the
+  #              previous Section.
+  #
+  # Examples
+  #
+  #   source
+  #   # => "Greetings\n---------\nThis is my doc.\n\nSalutations\n-----------\nIt is awesome."
+  #
+  #   reader = Reader.new source.lines.entries
+  #   # create empty document to parent the section
+  #   # and hold attributes extracted from header
+  #   doc = Document.new
+  #
+  #   Lexer.next_section(reader, doc).first.title
+  #   # => "Greetings"
+  #
+  #   Lexer.next_section(reader, doc).first.title
+  #   # => "Salutations"
+  #
+  # returns a two-element Array containing the Section and Hash of orphaned attributes
+  def self.next_section(reader, parent, attributes = {})
+    preamble = false
+    # check if we are at the start of processing the document
+    # NOTE we could drop a hint in the attributes to indicate
+    # that we are at a section title (so we don't have to check)
+    if parent.is_a?(Document) && parent.blocks.empty? &&
+        (parent.has_header? || !is_next_line_section?(reader))
+      if parent.has_header?
+        preamble = Block.new(parent, :preamble)
+        parent << preamble
+      end
+      section = parent
+      current_level = 0
+      if parent.attributes.has_key? 'fragment'
+        expected_next_levels = nil
+      # small tweak to allow subsequent level-0 sections for book doctype
+      elsif parent.doctype == 'book'
+        expected_next_levels = [0, 1]
+      else
+        expected_next_levels = [1]
+      end
     else
-      parent.document
+      section = initialize_section(reader, parent, attributes)
+      # clear attributes, except for title which carries over
+      # section title to next block of content
+      attributes = attributes.delete_if {|k, v| k != 'title'}
+      current_level = section.level
+      expected_next_levels = [current_level + 1]
     end
+    reader.skip_blank_lines
+    # Parse lines belonging to this section and its subsections until we
+    # reach the end of this section level
+    #
+    # 1. first look for metadata thingies (anchor, attribute list, block title line, etc)
+    # 2. then look for a section, recurse if found
+    # 3. then process blocks
+    #
+    # We have to parse all the metadata lines before continuing with the loop,
+    # otherwise subsequent metadata lines get interpreted as block content
+    while reader.has_lines?
+      parse_block_metadata_lines(reader, section, attributes)
+      next_level = is_next_line_section?(reader)
+      if next_level
+        doctype = parent.document.doctype
+        if next_level == 0 && doctype != 'book'
+          puts "asciidoctor: ERROR: only book doctypes can contain level 0 sections"
+        end
+        if next_level > current_level || (section.is_a?(Document) && next_level == 0)
+          unless expected_next_levels.nil? || expected_next_levels.include?(next_level)
+            puts "asciidoctor: WARNING: section title out of sequence: " +
+                "expected #{expected_next_levels.size > 1 ? 'levels' : 'level'} #{expected_next_levels * ' or '}, " +
+                "got level #{next_level}"
+          end
+          # the attributes returned are those that are orphaned
+          new_section, attributes = next_section(reader, section, attributes)
+          section << new_section
+        else
+          # close this section (and break out of the nesting) to begin a new one
+          break
+        end
+      else
+        # just take one block or else we run the risk of overrunning section boundaries
+        new_block = next_block(reader, section, attributes, :parse_metadata => false)
+        if !new_block.nil?
+          (preamble || section) << new_block
+          attributes = {}
+        else
+          # don't clear attributes if we don't find a block because they may
+          # be trailing attributes that didn't get associated with a block
+        end
+      end
+      reader.skip_blank_lines
+    end
+    # prune the preamble if it has no content
+    if preamble && preamble.blocks.empty?
+      section.delete_at(0)
+    end
+    # The attributes returned here are orphaned attributes that fall at the end
+    # of a section that need to get transferred to the next section
+    # see "trailing block attributes transfer to the following section" in
+    # test/attributes_test.rb for an example
+    [section != parent ? section : nil, attributes.dup]
   end
-  # Return the next block from the Reader.
+  # Public: Return the next Section or Block object from the Reader.
+  #
+  # Begins by skipping over blank lines to find the start of the next Section
+  # or Block. Processes each line of the reader in sequence until a Section or
+  # Block is found or the reader has no more lines.
   #
-  # * Skip over blank lines to find the start of the next content block.
-  # * Use defined regular expressions to determine the type of content block.
-  # * Based on the type of content block, grab lines to the end of the block.
-  # * Return a new Asciidoctor::Block or Asciidoctor::Section instance with the
-  #   content set to the grabbed lines.
-  def self.next_block(reader, parent = self)
+  # Uses regular expressions from the Asciidoctor module to match Section
+  # and Block delimiters. The ensuing lines are then processed according
+  # to the type of content.
+  #
+  # reader - The Reader from which to retrieve the next block
+  # parent - The Document, Section or Block to which the next block belongs
+  #
+  # Returns a Section or Block object holding the parsed content of the processed lines
+  def self.next_block(reader, parent, attributes = {}, options = {})
     # Skip ahead to the block content
-    reader.skip_blank
+    skipped = reader.skip_blank
+    # bail if we've reached the end of the section content
     return nil unless reader.has_lines?
-    context = parent.is_a?(Block) ? parent.context : nil
-    # NOTE: An anchor looks like this:
-    #   [[foo]]
-    # with the inside [foo] (including brackets) as match[1]
-    if match = reader.peek_line.match(REGEXP[:anchor])
-      Asciidoctor.debug "Found an anchor in line:\n\t#{reader.peek_line}"
-      # NOTE: This expression conditionally strips off the brackets from
-      # [foo], though REGEXP[:anchor] won't actually match without
-      # match[1] being bracketed, so the condition isn't necessary.
-      anchor = match[1].match(/^\[(.*)\]/) ? $1 : match[1]
-      # NOTE: Set @references['foo'] = '[foo]'
-      document_from_parent(parent).references[anchor] = match[1]
-      reader.get_line
-    else
-      anchor = nil
-    end
-    # skip a list continuation character if we're processing a list
-    if LIST_CONTEXTS.include?(context)
-      reader.skip_list_continuation
+    if options[:text] && skipped > 0
+      options.delete(:text)
     end
-    Asciidoctor.debug "/"*64
-    Asciidoctor.debug "#{File.basename(__FILE__)}:#{__LINE__} -> #{__method__} - First two lines are:"
-    Asciidoctor.debug reader.peek_line
-    tmp_line = reader.get_line
-    Asciidoctor.debug reader.peek_line
-    reader.unshift tmp_line
-    Asciidoctor.debug "/"*64
+    Asciidoctor.debug {
+      msg = []
+      msg << '/' * 64
+      msg << 'next_block() - First two lines are:'
+      msg << reader.peek_line
+      tmp_line = reader.get_line
+      msg << reader.peek_line
+      reader.unshift tmp_line
+      msg << '/' * 64
+      msg * "\n"
+    }
+    parse_metadata = options[:parse_metadata] || true
+    parse_sections = options[:parse_sections] || false
+    document = parent.document
+    context = parent.is_a?(Block) ? parent.context : nil
     block = nil
     title = nil
     caption = nil
-    buffer = []
-    attributes = {}
-    context = parent.is_a?(Block) ? parent.context : nil
-    while reader.has_lines? && block.nil?
-      buffer.clear
-      this_line = reader.get_line
-      next_line = reader.peek_line || ''
-      if this_line.match(REGEXP[:comment_blk])
-        Reader.new(reader.grab_lines_until {|line| line.match( REGEXP[:comment_blk] ) })
-      elsif this_line.match(REGEXP[:comment])
-        reader.skip_blank
-      elsif match = this_line.match(REGEXP[:attr_list_blk])
-        collect_attributes(match[1], attributes)
-        reader.skip_blank
+    while reader.has_lines? && block.nil?
+      if parse_metadata && parse_block_metadata_line(reader, document, attributes, options)
+        reader.next_line
+        next
+      elsif parse_sections && context.nil? && is_next_line_section?(reader)
+        block, attributes = next_section(reader, parent, attributes)
+        break
+      end
-      elsif is_section_heading?(this_line, next_line)
-        # If we've come to a new section, then we've found the end of this
-        # current block.  Likewise if we'd found an unassigned anchor, push
-        #
-        # FIXME when slurping up next section, give back trailing anchor to following section
-        reader.unshift(this_line)
-        Asciidoctor.debug "#{__method__}: SENDING to next_section with lines[0] = #{reader.peek_line}"
-        block = next_section(reader, parent)
+      this_line = reader.get_line
-      elsif match = this_line.match(REGEXP[:title])
-        title = match[1]
+      delimited_blk = delimited_block? this_line
+      # NOTE I haven't decided whether I want this check here or in
+      # parse_block_metadata (where it is currently)
+      #if this_line.match(REGEXP[:comment_blk])
+      #  reader.grab_lines_until {|line| line.match( REGEXP[:comment_blk] ) }
+      #  reader.skip_blank
+      #  # NOTE we should break here because we have found a block, it
+      #  # just happens to be nil...if we keep going we potentially overrun
+      #  # a section heading which is not processed in this anymore
+      #  break
+      # NOTE we're letting ruler have attributes
+      if !options[:text] && this_line.match(REGEXP[:ruler])
+        block = Block.new(parent, :ruler)
         reader.skip_blank
-      elsif match = this_line.match(REGEXP[:image_blk])
-        collect_attributes(match[2], attributes, ['alt', 'width', 'height'])
+      elsif !options[:text] && (match = this_line.match(REGEXP[:image_blk]))
         block = Block.new(parent, :image)
-        # FIXME this seems kind of one-off here
+        AttributeList.new(document.sub_attributes(match[2])).parse_into(attributes, ['alt', 'width', 'height'])
         target = block.sub_attributes(match[1])
-        attributes['target'] = target
-        attributes['alt'] ||= File.basename(target, File.extname(target))
+        if !target.to_s.empty?
+          attributes['target'] = target
+          document.register(:images, target)
+          attributes['alt'] ||= File.basename(target, File.extname(target))
+        else
+          # drop the line if target resolves to nothing
+          block = nil
+        end
         reader.skip_blank
-      elsif this_line.match(REGEXP[:oblock])
-        # oblock is surrounded by '--' lines and has zero or more blocks inside
-        buffer = Reader.new(reader.grab_lines_until { |line| line.match(REGEXP[:oblock]) })
+      elsif delimited_blk && (match = this_line.match(REGEXP[:open_blk]))
+        # an open block is surrounded by '--' lines and has zero or more blocks inside
+        terminator = match[0]
+        buffer = Reader.new reader.grab_lines_until(:terminator => terminator)
         # Strip lines off end of block - not implemented yet
         # while buffer.has_lines? && buffer.last.strip.empty?
         #   buffer.pop
         # end
-        block = Block.new(parent, :oblock, [])
+        block = Block.new(parent, :open)
         while buffer.has_lines?
           new_block = next_block(buffer, block)
           block.blocks << new_block unless new_block.nil?
         end
       # needs to come before list detection
-      elsif this_line.match(REGEXP[:sidebar_blk])
+      elsif delimited_blk && (match = this_line.match(REGEXP[:sidebar_blk]))
         # sidebar is surrounded by '****' (4 or more '*' chars) lines
+        terminator = match[0]
         # FIXME violates DRY because it's a duplication of quote parsing
         block = Block.new(parent, :sidebar)
-        buffer = Reader.new(reader.grab_lines_until {|line| line.match( REGEXP[:sidebar_blk] ) })
+        buffer = Reader.new reader.grab_lines_until(:terminator => terminator)
         while buffer.has_lines?
           new_block = next_block(buffer, block)
           block.blocks << new_block unless new_block.nil?
         end
-      elsif list_type = [:olist, :colist].detect{|l| this_line.match( REGEXP[l] )}
+      elsif match = this_line.match(REGEXP[:colist])
+        block = Block.new(parent, :colist)
+        attributes['style'] = 'arabic'
         items = []
-        Asciidoctor.debug "Creating block of type: #{list_type}"
-        block = Block.new(parent, list_type)
-        attributes['style'] ||= 'arabic'
-        while !this_line.nil? && match = this_line.match(REGEXP[list_type])
-          item = ListItem.new(block)
-          reader.unshift match[2].lstrip.sub(/^\./, '\.')
-          item_segment = Reader.new(list_item_segment(reader, :alt_ending => REGEXP[list_type]))
-          while item_segment.has_lines?
-            new_block = next_block(item_segment, block)
-            item.blocks << new_block unless new_block.nil?
+        block.buffer = items
+        reader.unshift this_line
+        expected_index = 1
+        begin
+          # might want to move this check to a validate method
+          if match[1].to_i != expected_index
+            puts "asciidoctor: WARNING: callout list item index: expected #{expected_index} got #{match[1]}"
           end
+          list_item = next_list_item(reader, block, match)
+          expected_index += 1
+          if !list_item.nil?
+            items << list_item
+            coids = document.callouts.callout_ids(items.size)
+            if !coids.empty?
+              list_item.attributes['coids'] = coids
+            else
+              puts 'asciidoctor: WARNING: no callouts refer to list item ' + items.size.to_s
+            end
+          end
+        end while reader.has_lines? && match = reader.peek_line.match(REGEXP[:colist])
-          item.fold_first
-          items << item
-          reader.skip_blank
-          this_line = reader.get_line
-        end
-        reader.unshift(this_line) unless this_line.nil?
-        block.buffer = items
+        document.callouts.next_list
       elsif match = this_line.match(REGEXP[:ulist])
+        AttributeList.rekey(attributes, ['style'])
         reader.unshift(this_line)
-        block = build_ulist(reader, parent)
-      elsif match = this_line.match(REGEXP[:dlist])
-        # TODO build_dlist method?
-        pairs = []
-        block = Block.new(parent, :dlist)
-        # allows us to capture until we find a labeled item using the same delimiter (::, :::, :::: or ;;)
-        sibling_matcher = REGEXP[:dlist_siblings][match[3]]
+        block = next_outline_list(reader, :ulist, parent)
-        begin
-          dt = ListItem.new(block, match[2])
-          dt.anchor = match[1] unless match[1].nil?
-          dd = ListItem.new(block, match[5])
-          dd_segment = Reader.new(list_item_segment(reader, :alt_ending => sibling_matcher))
-          while dd_segment.has_lines?
-            new_block = next_block(dd_segment, block)
-            dd.blocks << new_block unless new_block.nil?
+      elsif match = this_line.match(REGEXP[:olist])
+        AttributeList.rekey(attributes, ['style'])
+        reader.unshift(this_line)
+        block = next_outline_list(reader, :olist, parent)
+        # QUESTION move this logic to next_outline_list?
+        if !(attributes.has_key? 'style') && !(block.attributes.has_key? 'style')
+          marker = block.buffer.first.marker
+          if marker.start_with? '.'
+            # first one makes more sense, but second one is AsciiDoc-compliant
+            #attributes['style'] = (ORDERED_LIST_STYLES[block.level - 1] || ORDERED_LIST_STYLES.first).to_s
+            attributes['style'] = (ORDERED_LIST_STYLES[marker.length - 1] || ORDERED_LIST_STYLES.first).to_s
+          else
+            style = ORDERED_LIST_STYLES.detect{|s| marker.match(ORDERED_LIST_MARKER_PATTERNS[s]) }
+            attributes['style'] = (style || ORDERED_LIST_STYLES.first).to_s
           end
+        end
-          dd.fold_first
-          pairs << [dt, dd]
-          # this skip_blank might be redundant
-          reader.skip_blank
-          this_line = reader.get_line
-        end while !this_line.nil? && match = this_line.match(sibling_matcher)
-        reader.unshift(this_line) unless this_line.nil?
-        block.buffer = pairs
+      elsif match = this_line.match(REGEXP[:dlist])
+        reader.unshift this_line
+        block = next_labeled_list(reader, match, parent)
+      elsif delimited_blk && (match = this_line.match(document.nested? ? REGEXP[:table_nested] : REGEXP[:table]))
+        # table is surrounded by lines starting with a | followed by 3 or more '=' chars
+        terminator = match[0]
+        AttributeList.rekey(attributes, ['style'])
+        table_reader = Reader.new reader.grab_lines_until(:terminator => terminator, :skip_line_comments => true)
+        block = next_table(table_reader, parent, attributes)
       # FIXME violates DRY because it's a duplication of other block parsing
-      elsif this_line.match(REGEXP[:example])
+      elsif delimited_blk && (match = this_line.match(REGEXP[:example]))
         # example is surrounded by lines with 4 or more '=' chars
-        rekey_positional_attributes(attributes, ['style'])
+        terminator = match[0]
+        AttributeList.rekey(attributes, ['style'])
         if admonition_style = ADMONITION_STYLES.detect {|s| attributes['style'] == s}
           block = Block.new(parent, :admonition)
           attributes['name'] = admonition_style.downcase
@@ -201,7 +382,7 @@ class Asciidoctor::Lexer
         else
           block = Block.new(parent, :example)
         end
-        buffer = Reader.new(reader.grab_lines_until {|line| line.match( REGEXP[:example] ) })
+        buffer = Reader.new reader.grab_lines_until(:terminator => terminator)
         while buffer.has_lines?
           new_block = next_block(buffer, block)
@@ -209,36 +390,45 @@ class Asciidoctor::Lexer
         end
       # FIXME violates DRY w/ non-delimited block listing
-      elsif this_line.match(REGEXP[:listing])
-        rekey_positional_attributes(attributes, ['style', 'language', 'linenums'])
-        buffer = reader.grab_lines_until {|line| line.match( REGEXP[:listing] )}
+      elsif delimited_blk && (match = this_line.match(REGEXP[:listing]))
+        terminator = match[0]
+        AttributeList.rekey(attributes, ['style', 'language', 'linenums'])
+        buffer = reader.grab_lines_until(:terminator => terminator)
         buffer.last.chomp! unless buffer.empty?
         block = Block.new(parent, :listing, buffer)
-      elsif this_line.match(REGEXP[:quote])
+      elsif delimited_blk && (match = this_line.match(REGEXP[:quote]))
         # multi-line verse or quote is surrounded by a block delimiter
-        rekey_positional_attributes(attributes, ['style', 'attribution', 'citetitle'])
+        terminator = match[0]
+        AttributeList.rekey(attributes, ['style', 'attribution', 'citetitle'])
         quote_context = (attributes['style'] == 'verse' ? :verse : :quote)
-        buffer = Reader.new(reader.grab_lines_until {|line| line.match( REGEXP[:quote] ) })
+        block_reader = Reader.new reader.grab_lines_until(:terminator => terminator)
         # only quote can have other section elements (as a section block)
         section_body = (quote_context == :quote)
         if section_body
           block = Block.new(parent, quote_context)
-          while buffer.has_lines?
-            new_block = next_block(buffer, block)
+          while block_reader.has_lines?
+            new_block = next_block(block_reader, block)
             block.blocks << new_block unless new_block.nil?
           end
         else
-          block = Block.new(parent, quote_context, buffer.lines)
+          block_reader.chomp_last!
+          block = Block.new(parent, quote_context, block_reader.lines)
         end
-      elsif this_line.match(REGEXP[:lit_blk])
-        # example is surrounded by '....' (4 or more '.' chars) lines
-        buffer = reader.grab_lines_until {|line| line.match( REGEXP[:lit_blk] ) }
+      elsif delimited_blk && (blk_ctx = [:literal, :pass].detect{|t| this_line.match(REGEXP[t])})
+        # literal is surrounded by '....' (4 or more '.' chars) lines
+        # pass is surrounded by '++++' (4 or more '+' chars) lines
+        terminator = $~[0]
+        buffer = reader.grab_lines_until(:terminator => terminator)
         buffer.last.chomp! unless buffer.empty?
-        block = Block.new(parent, :literal, buffer)
+        # a literal can masquerade as a listing
+        if attributes[1] == 'listing'
+          blk_ctx = :listing
+        end
+        block = Block.new(parent, blk_ctx, buffer)
       elsif this_line.match(REGEXP[:lit_par])
         # literal paragraph is contiguous lines starting with
@@ -246,343 +436,529 @@ class Asciidoctor::Lexer
         # So we need to actually include this one in the grab_lines group
         reader.unshift this_line
-        buffer = reader.grab_lines_until(:preserve_last_line => true) {|line|
-          (context == :dlist && line.match(REGEXP[:dlist])) || !line.match(REGEXP[:lit_par])
+        buffer = reader.grab_lines_until(:preserve_last_line => true, :break_on_blank_lines => true) {|line|
+          # labeled list terms can be indented, but a preceding blank indicates
+          # we are in a list continuation and therefore literals should be strictly literal
+          (context == :dlist && skipped == 0 && line.match(REGEXP[:dlist])) ||
+          delimited_block?(line)
         }
-        # trim off the indentation that put us in this literal paragraph
-        if !buffer.empty? && match = buffer.first.match(/^([[:blank:]]+)/)
-          offset = match[1].length
-          buffer = buffer.map {|l| l.slice(offset..-1)}
+        # trim off the indentation equivalent to the size of the least indented line
+        if !buffer.empty?
+          offset = buffer.map {|line| line.match(REGEXP[:leading_blanks])[1].length }.min
+          if offset > 0
+            buffer = buffer.map {|l| l.sub(/^\s{1,#{offset}}/, '') }
+          end
           buffer.last.chomp!
         end
         block = Block.new(parent, :literal, buffer)
+        # a literal gets special meaning inside of a definition list
+        if LIST_CONTEXTS.include?(context)
+          attributes['options'] ||= []
+          # TODO this feels hacky, better way to distinguish from explicit literal block?
+          attributes['options'] << 'listparagraph'
+        end
       ## these switches based on style need to come immediately before the else ##
-      elsif attributes[0] == 'source'
-        rekey_positional_attributes(attributes, ['style', 'language', 'linenums'])
+      elsif attributes[1] == 'source'
+        AttributeList.rekey(attributes, ['style', 'language', 'linenums'])
         reader.unshift(this_line)
         buffer = reader.grab_lines_until(:break_on_blank_lines => true)
         buffer.last.chomp! unless buffer.empty?
         block = Block.new(parent, :listing, buffer)
-      elsif admonition_style = ADMONITION_STYLES.detect{|s| attributes[0] == s}
-        # an admonition preceded by [*TYPE*] and lasts until a blank line
+      elsif admonition_style = ADMONITION_STYLES.detect{|s| attributes[1] == s}
+        # an admonition preceded by [<TYPE>] and lasts until a blank line
         reader.unshift(this_line)
         buffer = reader.grab_lines_until(:break_on_blank_lines => true)
+        buffer.last.chomp! unless buffer.empty?
         block = Block.new(parent, :admonition, buffer)
         attributes['style'] = admonition_style
         attributes['name'] = admonition_style.downcase
         attributes['caption'] ||= admonition_style.capitalize
-      elsif quote_context = [:quote, :verse].detect{|s| attributes[0] == s.to_s}
+      elsif quote_context = [:quote, :verse].detect{|s| attributes[1] == s.to_s}
         # single-paragraph verse or quote is preceded by [verse] or [quote], respectively, and lasts until a blank line
-        rekey_positional_attributes(attributes, ['style', 'attribution', 'citetitle'])
+        AttributeList.rekey(attributes, ['style', 'attribution', 'citetitle'])
         reader.unshift(this_line)
         buffer = reader.grab_lines_until(:break_on_blank_lines => true)
+        buffer.last.chomp! unless buffer.empty?
         block = Block.new(parent, quote_context, buffer)
-      else
-        # paragraph is contiguous nonblank/noncontinuation lines
+      else # paragraph, contiguous nonblank/noncontinuation lines
         reader.unshift this_line
-        buffer = reader.grab_lines_until(:break_on_blank_lines => true, :preserve_last_line => true) {|line|
-          (context == :dlist && line.match(REGEXP[:dlist])) ||
-          ([:ulist, :olist, :dlist].include?(context) && line.chomp == LIST_CONTINUATION) ||
-          line.match(REGEXP[:oblock])
+        buffer = reader.grab_lines_until(:break_on_blank_lines => true, :preserve_last_line => true, :skip_line_comments => true) {|line|
+          delimited_block?(line) || line.match(REGEXP[:attr_line]) ||
+          # next list item can be directly adjacent to paragraph of previous list item
+          context == :dlist && line.match(REGEXP[:dlist])
+          # not sure if there are any cases when we need this check for other list types
+          #LIST_CONTEXTS.include?(context) && line.match(REGEXP[context])
         }
-        if LIST_CONTEXTS.include?(context)
-          reader.skip_list_continuation
+        # NOTE we need this logic because the reader is processing line
+        # comments and that might leave us w/ an empty buffer
+        if buffer.empty?
+          reader.get_line
+          break
         end
-        if !buffer.empty? && admonition = buffer.first.match(Regexp.new('^(' + ADMONITION_STYLES.join('|') + '):\s+'))
+        catalog_inline_anchors(buffer.join, document)
+        if !options[:text] && (admonition = buffer.first.match(Regexp.new('^(' + ADMONITION_STYLES.join('|') + '):\s+')))
           buffer[0] = admonition.post_match
           block = Block.new(parent, :admonition, buffer)
           attributes['style'] = admonition[1]
           attributes['name'] = admonition[1].downcase
           attributes['caption'] ||= admonition[1].capitalize
         else
-          buffer.last.chomp! unless buffer.empty?
-          Asciidoctor.debug "Proud parent #{parent} getting a new paragraph with buffer: #{buffer}"
+          buffer.last.chomp!
           block = Block.new(parent, :paragraph, buffer)
         end
       end
     end
-    # when looking for nested content, a series of
-    # line comments or a comment block could leave us
-    # without a block
+    # when looking for nested content, one or more line comments, comment
+    # blocks or trailing attribute lists could leave us without a block,
+    # so handle accordingly
     if !block.nil?
-      block.anchor   ||= (anchor || attributes['id'])
-      block.title    ||= title
-      block.caption  ||= caption
+      block.id        = attributes['id'] if attributes.has_key?('id')
+      block.title   ||= (attributes['title'] || title)
+      block.caption ||= caption unless block.is_a?(Section)
+      # AsciiDoc always uses [id] as the reftext in HTML output,
+      # but I'd like to do better in Asciidoctor
+      if block.id && block.title? && !attributes.has_key?('reftext')
+        document.register(:ids, [block.id, block.title])
+      end
       block.update_attributes(attributes)
+      if block.context == :listing || block.context == :literal
+        catalog_callouts(block.buffer.join, document)
+      end
     end
     block
   end
-  # Private: Return the Array of lines constituting the next list item
-  #          segment, removing them from the 'lines' Array passed in.
-  #
-  # reader  - the Reader instance from which to get input.
-  # options - an optional Hash of processing options:
-  #           * :alt_ending may be used to specify a regular expression match
-  #             other than a blank line to signify the end of the segment.
-  #           * :list_types may be used to specify list item patterns to
-  #             include. May be either a single Symbol or an Array of Symbols.
-  #           * :list_level may be used to specify a mimimum list item level
-  #             to include. If this is specified, then break if we find a list
-  #             item of a lower level.
+  # Public: Determines whether this line is the start of any of the delimited blocks
   #
-  # Returns the Array of lines forming the next segment.
-  #
-  # Examples
-  #
-  #   reader = Asciidoctor::Reader.new(
-  #      ["First paragraph\n", "+\n", "Second paragraph\n", "--\n",
-  #       "Open block\n", "\n", "Can have blank lines\n", "--\n", "\n",
-  #       "In a different segment\n"])
+  # returns the match data if this line is the first line of a delimited block or nil if not
+  #--
+  # TODO could use the match value as a lookup for the block type so we don't have
+  # to do any subsequent regexp
+  def self.delimited_block?(line)
+    # naive match
+    #line.match(REGEXP[:any_blk])
+    # attempt at better performance
+    if line.length > 0
+      # NOTE accessing the first element before calling ord is for Ruby 1.8.7 compat
+      REGEXP[:any_blk_ord].include?(line[0..0][0].ord) ? line.match(REGEXP[:any_blk]) : nil
+    else
+      nil
+    end
+  end
+  # Internal: Parse and construct an outline list Block from the current position of the Reader
   #
-  #   list_item_segment(reader)
-  #   => ["First paragraph\n", "+\n", "Second paragraph\n", "--\n",
-  #       "Open block\n", "\n", "Can have blank lines\n", "--\n"]
+  # reader    - The Reader from which to retrieve the outline list
+  # list_type - A Symbol representing the list type (:olist for ordered, :ulist for unordered)
+  # parent    - The parent Block to which this outline list belongs
   #
-  #   reader.peek_line
-  #   => "In a different segment\n"
-  def self.list_item_segment(reader, options={})
-    alternate_ending = options[:alt_ending]
-    list_types = Array(options[:list_types]) || [:ulist, :olist, :colist, :dlist]
-    list_level = options[:list_level].to_i
-    # We know we want to include :lit_par types, even if we have specified,
-    # say, only :ulist type list entries.
-    list_types << :lit_par unless list_types.include? :lit_par
-    segment = []
-    reader.skip_blank
-    # Grab lines until the first blank line not inside an open block
-    # or listing
-    in_oblock = false
-    in_listing = false
-    while reader.has_lines?
-      this_line = reader.get_line
-      Asciidoctor.debug "----->  Processing: #{this_line}"
-      in_oblock = !in_oblock if this_line.match(REGEXP[:oblock])
-      in_listing = !in_listing if this_line.match(REGEXP[:listing])
-      if !in_oblock && !in_listing
-        if this_line.strip.empty?
-          # TODO  - FIX THIS BEFORE ANY MORE KITTENS DIE AUGGGHHH!!!
-          next_nonblank = reader.instance_variable_get(:@lines).detect{|l| !l.strip.empty?}
-          # If there are blank lines ahead, but there's at least one
-          # more non-blank line that doesn't trigger an alternate_ending
-          # for the block of lines, then vacuum up all the blank lines
-          # into this segment and continue with the next non-blank line.
-          if next_nonblank &&
-             ( alternate_ending.nil? ||
-               !next_nonblank.match(alternate_ending)
-             ) && list_types.find { |list_type| next_nonblank.match(REGEXP[list_type]) }
-             while reader.has_lines? and reader.peek_line.strip.empty?
-               segment << this_line
-               this_line = reader.get_line
-             end
-          else
+  # Returns the Block encapsulating the parsed outline (unordered or ordered) list
+  def self.next_outline_list(reader, list_type, parent)
+    list_block = Block.new(parent, list_type)
+    items = []
+    list_block.buffer = items
+    if parent.context == list_type
+      list_block.level = parent.level + 1
+    else
+      list_block.level = 1
+    end
+    Asciidoctor.debug { "Created #{list_type} block: #{list_block}" }
+    while reader.has_lines? && (match = reader.peek_line.match(REGEXP[list_type]))
+      marker = resolve_list_marker(list_type, match[1])
+      # if we are moving to the next item, and the marker is different
+      # determine if we are moving up or down in nesting
+      if items.size > 0 && marker != items.first.marker
+        # assume list is nested by default, but then check to see if we are
+        # popping out of a nested list by matching an ancestor's list marker
+        this_item_level = list_block.level + 1
+        p = parent
+        while p.context == list_type
+          if marker == p.buffer.first.marker
+            this_item_level = p.level
             break
           end
-        # Have we come to a line matching an alternate_ending regexp?
-        elsif alternate_ending && this_line.match(alternate_ending)
-          reader.unshift this_line
-          break
-        # Do we have a minimum list_level, and have come to a list item
-        # line with a lower level?
-        elsif list_level &&
-              list_types.find { |list_type| this_line.match(REGEXP[list_type]) } &&
-              ($1.length < list_level)
-          reader.unshift this_line
-          break
+          p = p.parent
         end
+      else
+        this_item_level = list_block.level
+      end
-        # From the Asciidoc user's guide:
-        #   Another list or a literal paragraph immediately following
-        #   a list item will be implicitly included in the list item
-        # Thus, the list_level stuff may be wrong here.
+      if items.size == 0 || this_item_level == list_block.level
+        list_item = next_list_item(reader, list_block, match)
+      elsif this_item_level < list_block.level
+        # leave this block
+        break
+      elsif this_item_level > list_block.level
+        # If this next list level is down one from the
+        # current Block's, append it to content of the current list item
+        items.last.blocks << next_block(reader, list_block)
       end
-      segment << this_line
+      items << list_item unless list_item.nil?
+      list_item = nil
+      reader.skip_blank
     end
-    Asciidoctor.debug "*"*40
-    Asciidoctor.debug "#{File.basename(__FILE__)}:#{__LINE__} -> #{__method__}: Returning this:"
-    #Asciidoctor.debug segment.inspect
-    Asciidoctor.debug "*"*10
-    Asciidoctor.debug "Leaving #{__method__}: Top of reader queue is:"
-    Asciidoctor.debug reader.peek_line
-    Asciidoctor.debug "*"*40
-    segment
+    list_block
   end
-  # Private: Get the Integer ulist level based on the characters
-  # in front of the list item text.
+  # Internal: Catalog any callouts found in the text, but don't process them
   #
-  # line - the String line containing the list item
-  def self.ulist_level(line)
-    if m = line.strip.match(/^(- | \*{1,5})\s+/x)
-      return m[1].length
-    end
+  # text     - The String of text in which to look for callouts
+  # document - The current document on which the callouts are stored
+  #
+  # Returns nothing
+  def self.catalog_callouts(text, document)
+    text.scan(REGEXP[:callout_scan]) {
+      # alias match for Ruby 1.8.7 compat
+      m = $~
+      next if m[0].start_with? '\\'
+      document.callouts.register(m[1])
+    }
   end
-  def self.build_ulist_item(reader, block, match = nil)
-    list_type = :ulist
-    this_line = reader.get_line
-    return nil unless this_line
-    match ||= this_line.match(REGEXP[list_type])
-    if match.nil?
-      reader.unshift(this_line)
-      return nil
-    end
+  # Internal: Catalog any inline anchors found in the text, but don't process them
+  #
+  # text     - The String text in which to look for inline anchors
+  # document - The current document on which the references are stored
+  #
+  # Returns nothing
+  def self.catalog_inline_anchors(text, document)
+    text.scan(REGEXP[:anchor_macro]) {
+      # alias match for Ruby 1.8.7 compat
+      m = $~
+      next if m[0].start_with? '\\'
+      id, reftext = m[1].split(',')
+      id.sub!(/^("|)(.*)\1$/, '\2')
+      if !reftext.nil?
+        reftext.sub!(/^("|)(.*)\1$/m, '\2')
+      end
+      document.register(:ids, [id, reftext])
+    }
+    nil
+  end
-    level = match[1].length
+  # Internal: Parse and construct a labeled (e.g., definition) list Block from the current position of the Reader
+  #
+  # reader    - The Reader from which to retrieve the labeled list
+  # match     - The Regexp match for the head of the list
+  # parent    - The parent Block to which this labeled list belongs
+  #
+  # Returns the Block encapsulating the parsed labeled list
+  def self.next_labeled_list(reader, match, parent)
+    pairs = []
+    block = Block.new(parent, :dlist)
+    block.buffer = pairs
+    # allows us to capture until we find a labeled item
+    # that uses the same delimiter (::, :::, :::: or ;;)
+    sibling_pattern = REGEXP[:dlist_siblings][match[2]]
+    begin
+      pairs << next_list_item(reader, block, match, sibling_pattern)
+    end while reader.has_lines? && match = reader.peek_line.match(sibling_pattern)
-    list_item = ListItem.new(block)
-    list_item.level = level
-    Asciidoctor.debug "#{__FILE__}:#{__LINE__}: Created ListItem #{list_item} with match[2]: #{match[2]} and level: #{list_item.level}"
+    block
+  end
-    # Restore first line of list item
-    # Also prevent bullet list text starting with . from being treated as a paragraph
-    # title or some other unseemly thing in list_item_segment. I think. (NOTE)
-    reader.unshift match[2].lstrip.sub(/^\./, '\.')
+  # Internal: Parse and construct the next ListItem for the current bulleted
+  # (unordered or ordered) list Block, callout lists included, or the next
+  # term ListItem and definition ListItem pair for the labeled list Block.
+  #
+  # First collect and process all the lines that constitute the next list
+  # item for the parent list (according to its type). Next, parse those lines
+  # into blocks and associate them with the ListItem (in the case of a
+  # labeled list, the definition ListItem). Finally, fold the first block
+  # into the item's text attribute according to rules described in ListItem.
+  #
+  # reader        - The Reader from which to retrieve the next list item
+  # list_block    - The parent list Block of this ListItem. Also provides access to the list type.
+  # match         - The match Array which contains the marker and text (first-line) of the ListItem
+  # sibling_trait - The list marker or the Regexp to match a sibling item
+  #
+  # Returns the next ListItem or ListItem pair (depending on the list type)
+  # for the parent list Block.
+  def self.next_list_item(reader, list_block, match, sibling_trait = nil)
+    list_type = list_block.context
+    if list_type == :dlist
+      list_term = ListItem.new(list_block, match[1])
+      list_item = ListItem.new(list_block, match[3])
+      has_text = !match[3].to_s.empty?
+    else
+      # Create list item using first line as the text of the list item
+      list_item = ListItem.new(list_block, match[2])
-    item_segment = Reader.new(list_item_segment(reader, :alt_ending => REGEXP[list_type]))
-#    item_segment = list_item_segment(reader)
-    while item_segment.has_lines?
-      new_block = next_block(item_segment, block)
-      list_item.blocks << new_block unless new_block.nil?
+      if !sibling_trait
+        sibling_trait = resolve_list_marker(list_type, match[1], list_block.buffer.size, true)
+      end
+      list_item.marker = sibling_trait
+      has_text = true
     end
-    Asciidoctor.debug "\n\nlist_item has #{list_item.blocks.count} blocks, and first is a #{list_item.blocks.first.class} with context #{list_item.blocks.first.context rescue 'n/a'}\n\n"
+    # first skip the line with the marker / term
+    reader.get_line
+    list_item_reader = Reader.new grab_lines_for_list_item(reader, list_type, sibling_trait, has_text)
+    if list_item_reader.has_lines?
+      comment_lines = list_item_reader.consume_line_comments
+      subsequent_line = list_item_reader.peek_line
+      list_item_reader.unshift(*comment_lines) unless comment_lines.empty?
+      if !subsequent_line.nil?
+        continuation_connects_first_block = (subsequent_line == "\n")
+        content_adjacent = !subsequent_line.strip.empty?
+      else
+        continuation_connects_first_block = false
+        content_adjacent = false
+      end
+      # only relevant for :dlist
+      options = {:text => !has_text}
-    list_item.fold_first
+      while list_item_reader.has_lines?
+        new_block = next_block(list_item_reader, list_block, {}, options)
+        list_item.blocks << new_block unless new_block.nil?
+      end
-    list_item
+      list_item.fold_first(continuation_connects_first_block, content_adjacent)
+    end
+    if list_type == :dlist
+      unless list_item.text? || list_item.blocks?
+        list_item = nil
+      end
+      [list_term, list_item]
+    else
+      list_item
+    end
   end
-  def self.build_ulist(reader, parent = nil)
-    items = []
-    list_type = :ulist
-    block = Block.new(parent, list_type)
-    Asciidoctor.debug "Created :ulist block: #{block}"
-    first_item_level = nil
+  # Internal: Collect the lines belonging to the current list item, navigating
+  # through all the rules that determine what comprises a list item.
+  #
+  # Grab lines until a sibling list item is found, or the block is broken by a
+  # terminator (such as a line comment). Definition lists are more greedy if
+  # they don't have optional inline item text...they want that text
+  #
+  # reader          - The Reader from which to retrieve the lines.
+  # list_type       - The Symbol context of the list (:ulist, :olist, :colist or :dlist)
+  # sibling_trait   - A Regexp that matches a sibling of this list item or String list marker
+  #                   of the items in this list (default: nil)
+  # has_text        - Whether the list item has text defined inline (always true except for labeled lists)
+  #
+  # Returns an Array of lines belonging to the current list item.
+  def self.grab_lines_for_list_item(reader, list_type, sibling_trait = nil, has_text = true)
+    buffer = []
-    while reader.has_lines? && match = reader.peek_line.match(REGEXP[list_type])
+    # three states for continuation: :inactive, :active & :frozen
+    # :frozen signifies we've detected sequential continuation lines &
+    # continuation is not permitted until reset
+    continuation = :inactive
-      this_item_level = match[1].length
+    # if we are within a nested list, we don't throw away the list
+    # continuation marks because they will be processed when grabbing
+    # the lines for those nested lists
+    within_nested_list = false
-      if first_item_level && first_item_level < this_item_level
-        # If this next :uline level is down one from the
-        # current Block's, append it to content of the current list item
-        items.last.blocks << next_block(reader, block)
-      elsif first_item_level && first_item_level > this_item_level
-        break
-      else
-        list_item = build_ulist_item(reader, block, match)
-        # Set the base item level for this Block
-        first_item_level ||= list_item.level
-      end
+    # a detached continuation is a list continuation that follows a blank line
+    # it gets associated with the outermost block
+    detached_continuation = nil
-      items << list_item unless list_item.nil?
-      list_item = nil
+    while reader.has_lines?
+      this_line = reader.get_line
-      reader.skip_blank
-    end
+      # if we've arrived at a sibling item in this list, we've captured
+      # the complete list item and can begin processing it
+      # the remainder of the method determines whether we've reached
+      # the termination of the list
+      break if is_sibling_list_item?(this_line, list_type, sibling_trait)
-    block.buffer = items
-    block
-  end
+      prev_line = buffer.empty? ? nil : buffer.last.chomp
-  def self.build_ulist_ref(lines, parent = nil)
-    items = []
-    list_type = :ulist
-    block = Block.new(parent, list_type)
-    Asciidoctor.debug "Created :ulist block: #{block}"
-    last_item_level = nil
-    this_line = lines.shift
-    while this_line && match = this_line.match(REGEXP[list_type])
-      level = match[1].length
-      list_item = ListItem.new(block)
-      list_item.level = level
-      Asciidoctor.debug "Created ListItem #{list_item} with match[2]: #{match[2]} and level: #{list_item.level}"
-      lines.unshift match[2].lstrip.sub(/^\./, '\.')
-      item_segment = list_item_segment(lines, :alt_ending => REGEXP[list_type], :list_level => level)
-      while item_segment.any?
-        new_block = next_block(item_segment, block)
-        list_item.blocks << new_block unless new_block.nil?
-      end
+      if prev_line == LIST_CONTINUATION
+        if continuation == :inactive
+          continuation = :active
+          has_text = true
+          buffer[buffer.size - 1] = "\n" unless within_nested_list
+        end
-      list_item.fold_first
+        # dealing with adjacent list continuations (which is really a syntax error)
+        if this_line.chomp == LIST_CONTINUATION
+          if continuation != :frozen
+            continuation = :frozen
+            buffer << this_line
+          end
+          this_line = nil
+          next
+        end
+      end
-      if items.any? && (level > items.last.level)
-        Asciidoctor.debug "--> Putting this new level #{level} ListItem under my pops, #{items.last} (level: #{items.last.level})"
-        items.last.blocks << list_item
+      # a delimited block immediately breaks the list unless preceded
+      # by a list continuation (they are harsh like that ;0)
+      if (match = delimited_block?(this_line)) ||
+        # technically attr_line only breaks if ensuing line is not a list item
+        # which really means attr_line only breaks if it's acting as a block delimiter
+        (list_type == :dlist && match = this_line.match(REGEXP[:attr_line]))
+        terminator = match[0]
+        if continuation == :active
+          buffer << this_line
+          # grab all the lines in the block, leaving the delimiters in place
+          # we're being more strict here about the terminator, but I think that's a good thing
+          buffer.concat reader.grab_lines_until(:terminator => terminator, :grab_last_line => true)
+          continuation = :inactive
+        else
+          break
+        end
       else
-        Asciidoctor.debug "Stacking new list item in parent block's blocks"
-        items << list_item
-      end
+        if continuation == :active && !this_line.strip.empty?
+          # literal paragraphs have special considerations (and this is one of
+          # two entry points into one)
+          # if we don't process it as a whole, then a line in it that looks like a
+          # list item will throw off the exit from it
+          if this_line.match(REGEXP[:lit_par])
+            reader.unshift this_line
+            buffer.concat reader.grab_lines_until(
+              :preserve_last_line => true,
+              :break_on_blank_lines => true,
+              :break_on_list_continuation => true)
+          else
+            if nested_list_type = (within_nested_list ? [:dlist] : NESTABLE_LIST_CONTEXTS).detect {|ctx| this_line.match(REGEXP[ctx]) }
+              within_nested_list = true
+              if nested_list_type == :dlist && $~[3].to_s.empty?
+                # get greedy again
+                has_text = false
+              end
+            end
+            buffer << this_line
+          end
+          continuation = :inactive
+        elsif !prev_line.nil? && prev_line.strip.empty?
+          # advance to the next line of content
+          if this_line.strip.empty?
+            reader.skip_blank
+            this_line = reader.get_line
+            # if we hit eof or a sibling, stop reading
+            break if this_line.nil? || is_sibling_list_item?(this_line, list_type, sibling_trait)
+          end
-      last_item_level = list_item.level
+          if this_line.chomp == LIST_CONTINUATION
+            detached_continuation = buffer.size
+            buffer << this_line
+          else
+            # has_text is only relevant for dlist, which is more greedy until it has text for an item
+            # for all other lists, has_text is always true
+            # in this block, we have to see whether we stay in the list
+            if has_text
+              # slurp up any literal paragraph offset by blank lines
+              if this_line.match(REGEXP[:lit_par])
+                reader.unshift this_line
+                buffer.concat reader.grab_lines_until(
+                  :preserve_last_line => true,
+                  :break_on_blank_lines => true,
+                  :break_on_list_continuation => true)
+              # TODO any way to combine this with the check after skipping blank lines?
+              elsif is_sibling_list_item?(this_line, list_type, sibling_trait)
+                #buffer.pop unless within_nested_list
+                break
+              elsif nested_list_type = NESTABLE_LIST_CONTEXTS.detect {|ctx| this_line.match(REGEXP[ctx]) }
+                #buffer.pop unless within_nested_list
+                buffer << this_line
+                within_nested_list = true
+                if nested_list_type == :dlist && $~[3].to_s.empty?
+                  # get greedy again
+                  has_text = false
+                end
+              else
+                break
+              end
+            else # only dlist in need of item text, so slurp it up!
+              # pop the blank line so it's not interpretted as a list continuation
+              buffer.pop unless within_nested_list
+              buffer << this_line
+              has_text = true
+            end
+          end
+        else
+          has_text = true if !this_line.strip.empty?
+          if nested_list_type = (within_nested_list ? [:dlist] : NESTABLE_LIST_CONTEXTS).detect {|ctx| this_line.match(REGEXP[ctx]) }
+            within_nested_list = true
+            if nested_list_type == :dlist && $~[3].to_s.empty?
+              # get greedy again
+              has_text = false
+            end
+          end
+          buffer << this_line
+        end
+      end
+      this_line = nil
+    end
-      # TODO: This has to come from a Reader object
-      skip_blank(lines)
+    reader.unshift this_line if !this_line.nil?
-      this_line = lines.shift
+    if detached_continuation
+      buffer.delete_at detached_continuation
     end
-    lines.unshift(this_line) unless this_line.nil?
-    block.buffer = items
-    block
-  end
+    # QUESTION should we strip these trailing endlines?
+    #buffer.pop while buffer.last == "\n"
-  def self.collect_attributes(attrs, attributes, posattrs = [])
-    # TODO walk be properly rather than using split
-    attrs.split(/\s*,\s*/).each_with_index do |entry, i|
-      key, val = entry.split(/\s*=\s*/)
-      if !val.nil?
-        val.gsub!(/^(['"])(.*)\1$/, '\2') unless val.nil?
-        attributes[key] = val
-      else
-        attributes[i] = key
-        # positional attribute has a known key
-        if posattrs.size >= (i + 1)
-          attributes[posattrs[i]] = key
-        end
-      end
+    # We do need to replace the optional trailing continuation
+    # a blank line would have served the same purpose in the document
+    if !buffer.empty? && buffer.last.chomp == LIST_CONTINUATION
+      buffer.pop
     end
+    #puts "BUFFER>#{buffer.join}<BUFFER"
+    #puts "BUFFER>#{buffer}<BUFFER"
+    buffer
   end
-  def self.rekey_positional_attributes(attributes, posattrs)
-    posattrs.each_with_index do |key, i|
-      val = attributes[i]
-      if !val.nil?
-        attributes[key] = val
-      end
+  # Internal: Initialize a new Section object and assign any attributes provided
+  #
+  # The information for this section is retrieved by parsing the lines at the
+  # current position of the reader.
+  #
+  # reader     - the source reader
+  # parent     - the parent Section or Document of this Section
+  # attributes - a Hash of attributes to assign to this section (default: {})
+  def self.initialize_section(reader, parent, attributes = {})
+    section = Section.new parent
+    section.id, section.title, section.level, _ = parse_section_title(reader)
+    if section.id.nil? && attributes.has_key?('id')
+      section.id = attributes['id']
+    else
+      # generate an id if one was not *embedded* in the heading line
+      # or as an anchor above the section
+      section.id ||= section.generate_id
     end
+    section.update_attributes(attributes)
+    reader.skip_blank
+    section
   end
   # Private: Get the Integer section level based on the characters
-  # used in the ASCII line under the section name.
+  # used in the ASCII line under the section title.
   #
-  # line - the String line from under the section name.
+  # line - the String line from under the section title.
   def self.section_level(line)
     char = line.strip.chars.to_a.uniq
     case char
@@ -594,179 +970,631 @@ class Asciidoctor::Lexer
     end
   end
-  # == is level 0, === is level 1, etc.
+  #--
+  # = is level 0, == is level 1, etc.
   def self.single_line_section_level(line)
     [line.length - 1, 0].max
   end
-  def self.is_single_line_section_heading?(line)
-    !line.nil? && line.match(REGEXP[:level_title])
+  # Internal: Checks if the next line on the Reader is a section title
+  #
+  # This is a more efficient version of #is_section_title? and should
+  # eventually replace its usage.
+  #
+  # reader - the source Reader
+  #
+  # returns the section level if the Reader is positioned at a section title,
+  # false otherwise
+  def self.is_next_line_section?(reader)
+    if reader.has_lines?
+      line1 = reader.get_line
+      line2 = reader.peek_line
+      reader.unshift line1
+    else
+      return false
+    end
+    is_section_title?(line1, line2)
   end
-  def self.is_two_line_section_heading?(line1, line2)
-    !line1.nil? && !line2.nil? &&
-    line1.match(REGEXP[:name]) && line2.match(REGEXP[:line]) &&
-    # chomp so that a (non-visible) endline does not impact calculation
-    (line1.chomp.size - line2.chomp.size).abs <= 1
+  # Public: Checks if these lines are a section title
+  #
+  # line1 - the first line as a String
+  # line2 - the second line as a String (default: nil)
+  #
+  # returns the section level if these lines are a section title,
+  # false otherwise
+  def self.is_section_title?(line1, line2 = nil)
+    if (level = is_single_line_section_title?(line1))
+      level
+    elsif (level = is_two_line_section_title?(line1, line2))
+      level
+    else
+      false
+    end
   end
-  def self.is_section_heading?(line1, line2 = nil)
-    is_single_line_section_heading?(line1) ||
-    is_two_line_section_heading?(line1, line2)
+  def self.is_single_line_section_title?(line1)
+    if !line1.nil? && (match = line1.match(REGEXP[:section_title]))
+      single_line_section_level match[1]
+    else
+      false
+    end
   end
-  # Private: Extracts the name, level and (optional) embedded anchor from a
-  #          1- or 2-line section heading.
+  def self.is_two_line_section_title?(line1, line2)
+    if !line1.nil? && !line2.nil? && line1.match(REGEXP[:section_name]) &&
+        line2.match(REGEXP[:section_underline]) &&
+        # chomp so that a (non-visible) endline does not impact calculation
+        (line1.chomp.size - line2.chomp.size).abs <= 1
+      section_level line2
+    else
+      false
+    end
+  end
+  # Internal: Parse the section title from the current position of the reader
+  #
+  # Parse a single or double-line section title. After this method is called,
+  # the Reader will be positioned at the line after the section title.
   #
-  # Returns an array of a String, Integer, and String or nil.
+  # reader  - the source reader, positioned at a section title
   #
   # Examples
   #
-  #   line1
-  #   => "Foo\n"
-  #   line2
-  #   => "~~~\n"
+  #   reader.lines
+  #   # => ["Foo\n", "~~~\n"]
   #
-  #   name, level, anchor = extract_section_heading(line1, line2)
+  #   title, level, id, single = parse_section_title(reader)
   #
-  #   name
-  #   => "Foo"
+  #   title
+  #   # => "Foo"
   #   level
-  #   => 2
-  #   anchor
-  #   => nil
+  #   # => 2
+  #   id
+  #   # => nil
+  #   single
+  #   # => false
   #
   #   line1
-  #   => "==== Foo\n"
+  #   # => "==== Foo\n"
   #
-  #   name, level, anchor = extract_section_heading(line1)
+  #   title, level, id, single = parse_section_title(reader)
   #
-  #   name
-  #   => "Foo"
+  #   title
+  #   # => "Foo"
   #   level
-  #   => 3
-  #   anchor
-  #   => nil
+  #   # => 3
+  #   id
+  #   # => nil
+  #   single
+  #   # => true
+  #
+  # returns an Array of [String, Integer, String, Boolean], representing the
+  # id, title, level and line count of the Section, or nil.
   #
-  def self.extract_section_heading(line1, line2 = nil)
-    Asciidoctor.debug "#{__method__} -> line1: #{line1.chomp rescue 'nil'}, line2: #{line2.chomp rescue 'nil'}"
-    sect_name = sect_anchor = nil
+  #--
+  # NOTE for efficiency, we don't reuse methods that check for a section title
+  def self.parse_section_title(reader)
+    line1 = reader.get_line
+    sect_id = nil
+    sect_title = nil
     sect_level = 0
+    single_line = true
-    if is_single_line_section_heading?(line1)
-      header_match = line1.match(REGEXP[:level_title])
-      sect_name = header_match[2]
-      sect_level = single_line_section_level(header_match[1])
-    elsif is_two_line_section_heading?(line1, line2)
-      header_match = line1.match(REGEXP[:name])
-      if anchor_match = header_match[1].match(REGEXP[:anchor_embedded])
-        sect_name   = anchor_match[1]
-        sect_anchor = anchor_match[2]
-      else
-        sect_name = header_match[1]
+    if match = line1.match(REGEXP[:section_title])
+      sect_id = match[3]
+      sect_title = match[2]
+      sect_level = single_line_section_level match[1]
+    else
+      line2 = reader.peek_line
+      if !line2.nil? && (name_match = line1.match(REGEXP[:section_name])) &&
+        line2.match(REGEXP[:section_underline]) &&
+        # chomp so that a (non-visible) endline does not impact calculation
+        (line1.chomp.size - line2.chomp.size).abs <= 1
+        if anchor_match = name_match[1].match(REGEXP[:anchor_embedded])
+          sect_id = anchor_match[2]
+          sect_title = anchor_match[1]
+        else
+          sect_title = name_match[1]
+        end
+        sect_level = section_level line2
+        single_line = false
+        reader.get_line
       end
-      sect_level = section_level(line2)
     end
-    Asciidoctor.debug "#{__method__} -> Returning #{sect_name}, #{sect_level} (anchor: '#{sect_anchor || '<none>'}')"
-    return [sect_name, sect_level, sect_anchor]
+    return [sect_id, sect_title, sect_level, single_line]
   end
-  # Private: Return the next section from the Reader.
+  # Public: Consume and parse the two header lines (line 1 = author info, line 2 = revision info).
+  #
+  # Returns the Hash of header metadata. If a Document object is supplied, the metadata
+  # is applied directly to the attributes of the Document.
+  #
+  # reader   - the Reader holding the source lines of the document
+  # document - the Document we are building (default: nil)
   #
   # Examples
   #
-  #   source
-  #   => "GREETINGS\n---------\nThis is my doc.\n\nSALUTATIONS\n-----------\nIt is awesome."
+  #  parse_header_metadata(Reader.new ["Author Name <author@example.org>\n", "v1.0, 2012-12-21: Coincide w/ end of world.\n"])
+  #  # => {'author' => 'Author Name', 'firstname' => 'Author', 'lastname' => 'Name', 'email' => 'author@example.org',
+  #  #       'revnumber' => '1.0', 'revdate' => '2012-12-21', 'revremark' => 'Coincide w/ end of world.'}
+  def self.parse_header_metadata(reader, document = nil)
+    # capture consecutive comment lines so we can reinsert them after the header
+    comment_lines = reader.consume_comments
+    metadata = !document.nil? ? document.attributes : {}
+    author_initials = metadata['authorinitials']
+    if reader.has_lines? && !reader.peek_line.strip.empty?
+      author_line = reader.get_line
+      match = author_line.match(REGEXP[:author_info])
+      if match
+        metadata['firstname'] = fname = match[1].tr('_', ' ')
+        metadata['author'] = fname
+        metadata['authorinitials'] = fname[0, 1]
+        if !match[2].nil? && !match[3].nil?
+          metadata['middlename'] = mname = match[2].tr('_', ' ')
+          metadata['lastname'] = lname = match[3].tr('_', ' ')
+          metadata['author'] = [fname, mname, lname].join ' '
+          metadata['authorinitials'] = [fname[0, 1], mname[0, 1], lname[0, 1]].join
+        elsif !match[2].nil?
+          metadata['lastname'] = lname = match[2].tr('_', ' ')
+          metadata['author'] = [fname, lname].join ' '
+          metadata['authorinitials'] = [fname[0, 1], lname[0, 1]].join
+        end
+        metadata['email'] = match[4] unless match[4].nil?
+      else
+        metadata['author'] = metadata['firstname'] = author_line.strip.squeeze(' ')
+        metadata['authorinitials'] = metadata['firstname'][0, 1]
+      end
+      # hack because of incorrect order of attribute processing
+      metadata['authorinitials'] = author_initials unless author_initials.nil?
+      # capture consecutive comment lines so we can reinsert them after the header
+      comment_lines += reader.consume_comments
+      if reader.has_lines? && !reader.peek_line.strip.empty?
+        rev_line = reader.get_line
+        match = rev_line.match(REGEXP[:revision_info])
+        if match
+          metadata['revdate'] = match[2]
+          metadata['revnumber'] = match[1] unless match[1].nil?
+          metadata['revremark'] = match[3] unless match[3].nil?
+        else
+          metadata['revdate'] = rev_line.strip
+        end
+      end
+      reader.skip_blank
+    end
+    reader.unshift(*comment_lines)
+    metadata
+  end
+  # Internal: Parse lines of metadata until a line of metadata is not found.
+  #
+  # This method processes sequential lines containing block metadata, ignoring
+  # blank lines and comments.
+  #
+  # reader     - the source reader
+  # parent     - the parent to which the lines belong
+  # attributes - a Hash of attributes in which any metadata found will be stored (default: {})
+  # options    - a Hash of options to control processing: (default: {})
+  #              *  :text indicates that lexer is only looking for text content
+  #                   and thus the block title should not be captured
   #
-  #   TODO: doc = Asciidoctor::Document.new(source)
+  # returns the Hash of attributes including any metadata found
+  def self.parse_block_metadata_lines(reader, parent, attributes = {}, options = {})
+    while parse_block_metadata_line(reader, parent, attributes, options)
+      reader.next_line
+      reader.skip_blank_lines
+    end
+    attributes
+  end
+  # Internal: Parse the next line if it contains metadata for the following block
   #
-  #   doc.next_section
-  #   ["GREETINGS", [:paragraph, "This is my doc."]]
+  # This method handles lines with the following content:
   #
-  #   doc.next_section
-  #   ["SALUTATIONS", [:paragraph, "It is awesome."]]
-  def self.next_section(reader, parent = self)
-    section = Section.new(parent)
+  # * line or block comment
+  # * anchor
+  # * attribute list
+  # * block title
+  #
+  # Any attributes found will be inserted into the attributes argument.
+  # If the line contains block metadata, the method returns true, otherwise false.
+  #
+  # reader     - the source reader
+  # parent     - the parent of the current line
+  # attributes - a Hash of attributes in which any metadata found will be stored
+  # options    - a Hash of options to control processing: (default: {})
+  #              *  :text indicates that lexer is only looking for text content
+  #                   and thus the block title should not be captured
+  #
+  # returns true if the line contains metadata, otherwise false
+  def self.parse_block_metadata_line(reader, parent, attributes, options = {})
+    return false if !reader.has_lines?
+    next_line = reader.peek_line
+    if next_line.match(REGEXP[:comment])
+      # do nothing, we'll skip it
+    # QUESTION should we parse block comments here instead of next_block?
+    # disable until we can agree what the current line is coming in
+    elsif match = next_line.match(REGEXP[:comment_blk])
+      terminator = match[0]
+      reader.grab_lines_until(:skip_first_line => true, :preserve_last_line => true, :terminator => terminator)
+    elsif match = next_line.match(REGEXP[:anchor])
+      id, reftext = match[1].split(',')
+      attributes['id'] = id
+      # AsciiDoc always use [id] as the reftext in HTML output,
+      # but I'd like to do better in Asciidoctor
+      #parent.document.register(:ids, id)
+      if reftext
+        attributes['reftext'] = reftext
+        parent.document.register(:ids, [id, reftext])
+      end
+    elsif match = next_line.match(REGEXP[:blk_attr_list])
+      AttributeList.new(parent.document.sub_attributes(match[1]), parent.document).parse_into(attributes)
+    # NOTE title doesn't apply to section, but we need to stash it for the first block
+    # TODO need test for this getting passed on to first block after section if found above section
+    # TODO should issue an error if this is found above the document title
+    elsif !options[:text] && (match = next_line.match(REGEXP[:blk_title]))
+      attributes['title'] = match[1]
+    else
+      return false
+    end
-    Asciidoctor.debug "%"*64
-    Asciidoctor.debug "#{File.basename(__FILE__)}:#{__LINE__} -> #{__method__} - First two lines are:"
-    Asciidoctor.debug reader.peek_line
-    tmp_line = reader.get_line
-    Asciidoctor.debug reader.peek_line
-    reader.unshift tmp_line
-    Asciidoctor.debug "%"*64
+    true
+  end
-    # Skip ahead to the next section definition
-    while reader.has_lines? && section.name.nil?
-      this_line = reader.get_line
-      next_line = reader.peek_line || ''
-      if match = this_line.match(REGEXP[:anchor])
-        section.anchor = match[1]
-      elsif is_section_heading?(this_line, next_line)
-        section.name, section.level, section.anchor = extract_section_heading(this_line, next_line)
-        reader.get_line unless is_single_line_section_heading?(this_line)
+  # Internal: Resolve the 0-index marker for this list item
+  #
+  # For ordered lists, match the marker used for this list item against the
+  # known list markers and determine which marker is the first (0-index) marker
+  # in its number series.
+  #
+  # For callout lists, return <1>.
+  #
+  # For bulleted lists, return the marker as passed to this method.
+  #
+  # list_type  - The Symbol context of the list
+  # marker     - The String marker for this list item
+  # ordinal    - The position of this list item in the list
+  # validate   - Whether to validate the value of the marker
+  #
+  # Returns the String 0-index marker for this list item
+  def self.resolve_list_marker(list_type, marker, ordinal = 0, validate = false)
+    if list_type == :olist && !marker.start_with?('.')
+      resolve_ordered_list_marker(marker, ordinal, validate)
+    elsif list_type == :colist
+      '<1>'
+    else
+      marker
+    end
+  end
+  # Internal: Resolve the 0-index marker for this ordered list item
+  #
+  # Match the marker used for this ordered list item against the
+  # known ordered list markers and determine which marker is
+  # the first (0-index) marker in its number series.
+  #
+  # The purpose of this method is to normalize the implicit numbered markers
+  # so that they can be compared against other list items.
+  #
+  # marker   - The marker used for this list item
+  # ordinal  - The 0-based index of the list item (default: 0)
+  # validate - Perform validation that the marker provided is the proper
+  #            marker in the sequence (default: false)
+  #
+  # Examples
+  #
+  #  marker = 'B.'
+  #  Lexer::resolve_ordered_list_marker(marker, 1, true)
+  #  # => 'A.'
+  #
+  # Returns the String of the first marker in this number series
+  def self.resolve_ordered_list_marker(marker, ordinal = 0, validate = false)
+    number_style = ORDERED_LIST_STYLES.detect {|s| marker.match(ORDERED_LIST_MARKER_PATTERNS[s]) }
+    expected = actual = nil
+    case number_style
+      when :arabic
+        if validate
+          expected = ordinal + 1
+          actual = marker.to_i
+        end
+        marker = '1.'
+      when :loweralpha
+        if validate
+          expected = ('a'[0].ord + ordinal).chr
+          actual = marker.chomp('.')
+        end
+        marker = 'a.'
+      when :upperalpha
+        if validate
+          expected = ('A'[0].ord + ordinal).chr
+          actual = marker.chomp('.')
+        end
+        marker = 'A.'
+      when :lowerroman
+        if validate
+          # TODO report this in roman numerals; see https://github.com/jamesshipton/roman-numeral/blob/master/lib/roman_numeral.rb
+          expected = ordinal + 1
+          actual = roman_numeral_to_int(marker.chomp(')'))
+        end
+        marker = 'i)'
+      when :upperroman
+        if validate
+          # TODO report this in roman numerals; see https://github.com/jamesshipton/roman-numeral/blob/master/lib/roman_numeral.rb
+          expected = ordinal + 1
+          actual = roman_numeral_to_int(marker.chomp(')'))
+        end
+        marker = 'I)'
+    end
+    if validate && expected != actual
+      puts "asciidoctor: WARNING: list item index: expected #{expected}, got #{actual}"
+    end
+    marker
+  end
+  # Internal: Determine whether the this line is a sibling list item
+  # according to the list type and trait (marker) provided.
+  #
+  # line          - The String line to check
+  # list_type     - The context of the list (:olist, :ulist, :colist, :dlist)
+  # sibling_trait - The String marker for the list or the Regexp to match a sibling
+  #
+  # Returns a Boolean indicating whether this line is a sibling list item given
+  # the criteria provided
+  def self.is_sibling_list_item?(line, list_type, sibling_trait)
+    if sibling_trait.is_a?(Regexp)
+      matcher = sibling_trait
+      expected_marker = false
+    else
+      matcher = REGEXP[list_type]
+      expected_marker = sibling_trait
+    end
+    if m = line.match(matcher)
+      if expected_marker
+        expected_marker == resolve_list_marker(list_type, m[1])
+      else
+        true
       end
+    else
+      false
     end
+  end
+  # Internal: Parse the table contained in the provided Reader
+  #
+  # table_reader - a Reader containing the source lines of an AsciiDoc table
+  # parent       - the parent Block of this Asciidoctor::Table
+  # attributes   - attributes captured from above this Block
+  #
+  # returns an instance of Asciidoctor::Table parsed from the provided reader
+  def self.next_table(table_reader, parent, attributes)
+    table = Table.new(parent, attributes)
-    if !section.anchor.nil?
-      anchor_id = section.anchor.match(/^\[(.*)\]/) ? $1 : section.anchor
-      document_from_parent(parent).references[anchor_id] = section.anchor
-      section.anchor = anchor_id
+    if attributes.has_key? 'cols'
+      table.create_columns(parse_col_specs(attributes['cols']))
+      explicit_col_specs = true
+    else
+      explicit_col_specs = false
     end
-    # Grab all the lines that belong to this section
-    section_lines = []
-    while reader.has_lines?
-      this_line = reader.get_line
-      next_line = reader.peek_line
-      if is_section_heading?(this_line, next_line)
-        _, this_level, _ = extract_section_heading(this_line, next_line)
-        if this_level <= section.level
-          # A section can't contain a section level lower than itself,
-          # so this signifies the end of the section.
-          reader.unshift this_line
-          if section_lines.any? && section_lines.last.match(REGEXP[:anchor])
-            # Put back the anchor that came before this new-section line
-            # on which we're bailing.
-            reader.unshift section_lines.pop
+    table_reader.skip_blank_lines
+    parser_ctx = Asciidoctor::Table::ParserContext.new(table, attributes)
+    while table_reader.has_lines?
+      line = table_reader.get_line
+      if parser_ctx.format == 'psv'
+        if parser_ctx.starts_with_delimiter? line
+          line = line[1..-1]
+          # push an empty cell spec if boundary at start of line
+          parser_ctx.close_open_cell
+        else
+          next_cell_spec, line = parse_cell_spec(line, :start)
+          # if the cell spec is not null, then we're at a cell boundary
+          if !next_cell_spec.nil?
+            parser_ctx.close_open_cell next_cell_spec
+          else
+            # QUESTION do we not advance to next line? if so, when
+            # will we if we came into this block?
           end
-          break
+        end
+      end
+      while !line.empty?
+        if m = parser_ctx.match_delimiter(line)
+          if parser_ctx.format == 'csv'
+            if parser_ctx.buffer_has_unclosed_quotes?(m.pre_match)
+              # throw it back, it's too small
+              line = parser_ctx.skip_matched_delimiter(m)
+              next
+            end
+          else
+            if m.pre_match.end_with? '\\'
+              line = parser_ctx.skip_matched_delimiter(m, true)
+              next
+            end
+          end
+          if parser_ctx.format == 'psv'
+            next_cell_spec, cell_text = parse_cell_spec(m.pre_match, :end)
+            parser_ctx.push_cell_spec next_cell_spec
+            parser_ctx.buffer << cell_text
+          else
+            parser_ctx.buffer << m.pre_match
+          end
+          line = m.post_match
+          parser_ctx.close_cell
         else
-          section_lines << this_line
-          section_lines << reader.get_line unless is_single_line_section_heading?(this_line)
+          # no other delimiters to see here
+          # suck up this line into the buffer and move on
+          parser_ctx.buffer << line
+          # QUESTION make this an option? (unwrap-option?)
+          if parser_ctx.format == 'csv'
+            parser_ctx.buffer.rstrip!.concat(' ')
+          end
+          line = ''
+          if parser_ctx.format == 'psv' || (parser_ctx.format == 'csv' &&
+              parser_ctx.buffer_has_unclosed_quotes?)
+            parser_ctx.keep_cell_open
+          else
+            parser_ctx.close_cell true
+          end
         end
-      else
-        section_lines << this_line
       end
-    end
-    section_reader = Reader.new(section_lines)
-    # Now parse section_lines into Blocks belonging to the current Section
-    while section_reader.has_lines?
-      section_reader.skip_blank
+      table_reader.skip_blank_lines unless parser_ctx.cell_open?
-      if section_reader.has_lines?
-        new_block = next_block(section_reader, section)
-        section << new_block unless new_block.nil?
+      if !table_reader.has_lines?
+        parser_ctx.close_cell true
       end
     end
-    # detect preamble and push it into a block
-    # QUESTION make this an operation on Section?
-    if section.level == 0
-      blocks = section.blocks.take_while {|b| !b.is_a? Section}
-      if !blocks.empty?
-        # QUESTION Should we propagate the buffer?
-        #preamble = Block.new(section, :preamble, blocks.reduce {|a, b| a.buffer + b.buffer})
-        preamble = Block.new(section, :preamble)
-        blocks.each { preamble << section.delete_at(0) }
-        section.insert(0, preamble)
-      end
+    table.attributes['colcount'] ||= parser_ctx.col_count
+    if !explicit_col_specs
+      # TODO further encapsulate this logic (into table perhaps?)
+      even_width = (100.0 / parser_ctx.col_count).floor
+      table.columns.each {|c| c.assign_width(0, even_width) }
     end
-    section
+    table.partition_header_footer attributes
+    table
   end
+  # Internal: Parse the column specs for this table.
+  #
+  # The column specs dictate the number of columns, relative
+  # width of columns, default alignments for cells in each
+  # column, and/or default styles or filters applied to the cells in
+  # the column.
+  #
+  # Every column spec is guaranteed to have a width
+  #
+  # returns a Hash of attributes that specify how to format
+  # and layout the cells in the table.
+  def self.parse_col_specs(records)
+    specs = []
+    # check for deprecated syntax
+    if m = records.match(REGEXP[:digits])
+      1.upto(m[0].to_i) {
+        specs << {'width' => 1}
+      }
+      return specs
+    end
+    records.split(',').each {|record|
+      # TODO might want to use scan rather than this mega-regexp
+      if m = record.match(REGEXP[:table_colspec])
+        spec = {}
+        if m[2]
+          # make this an operation
+          colspec, rowspec = m[2].split '.'
+          if !colspec.to_s.empty? && Table::ALIGNMENTS[:h].has_key?(colspec)
+            spec['halign'] = Table::ALIGNMENTS[:h][colspec]
+          end
+          if !rowspec.to_s.empty? && Table::ALIGNMENTS[:v].has_key?(rowspec)
+            spec['valign'] = Table::ALIGNMENTS[:v][rowspec]
+          end
+        end
+        # TODO support percentage width
+        spec['width'] = !m[3].nil? ? m[3].to_i : 1
+        # make this an operation
+        if m[4] && Table::TEXT_STYLES.has_key?(m[4])
+          spec['style'] = Table::TEXT_STYLES[m[4]]
+        end
+        repeat = !m[1].nil? ? m[1].to_i : 1
+        1.upto(repeat) {
+          specs << spec.dup
+        }
+      end
+    }
+    specs
+  end
+  # Internal: Parse the cell specs for the current cell.
+  #
+  # The cell specs dictate the cell's alignments, styles or filters,
+  # colspan, rowspan and/or repeating content.
+  #
+  # returns the Hash of attributes that indicate how to layout
+  # and style this cell in the table.
+  def self.parse_cell_spec(line, pos = :start)
+    # the default for the end pos it {} since we
+    # know we're at a delimiter; when the pos
+    # is start, we *may* be at a delimiter and
+    # nil indicates we're not
+    spec = (pos == :end ? {} : nil)
+    rest = line
+    if m = line.match(REGEXP[:table_cellspec][pos])
+      spec = {}
+      return [spec, line] if m[0].strip.empty?
+      rest = (pos == :start ? m.post_match : m.pre_match)
+      if m[1]
+        colspec, rowspec = m[1].split '.'
+        colspec = colspec.to_s.empty? ? 1 : colspec.to_i
+        rowspec = rowspec.to_s.empty? ? 1 : rowspec.to_i
+        if m[2] == '+'
+          spec['colspan'] = colspec unless colspec == 1
+          spec['rowspan'] = rowspec unless rowspec == 1
+        elsif m[2] == '*'
+          spec['repeatcol'] = colspec unless colspec == 1
+        end
+      end
+      if m[3]
+        colspec, rowspec = m[3].split '.'
+        if !colspec.to_s.empty? && Table::ALIGNMENTS[:h].has_key?(colspec)
+          spec['halign'] = Table::ALIGNMENTS[:h][colspec]
+        end
+        if !rowspec.to_s.empty? && Table::ALIGNMENTS[:v].has_key?(rowspec)
+          spec['valign'] = Table::ALIGNMENTS[:v][rowspec]
+        end
+      end
+      if m[4] && Table::TEXT_STYLES.has_key?(m[4])
+        spec['style'] = Table::TEXT_STYLES[m[4]]
+      end
+    end
+    [spec, rest]
+  end
+  # Internal: Converts a Roman numeral to an integer value.
+  #
+  # value - The String Roman numeral to convert
+  #
+  # Returns the Integer for this Roman numeral
+  def self.roman_numeral_to_int(value)
+    value = value.downcase
+    digits = { 'i' => 1, 'v' => 5, 'x' => 10 }
+    result = 0
+    (0..value.length - 1).each {|i|
+      digit = digits[value[i..i]]
+      if i + 1 < value.length && digits[value[i+1..i+1]] > digit
+        result -= digit
+      else
+        result += digit
+      end
+    }
+    result
+  end
 end