RubyGems - epub-parser - Versions diffs - 0.2.7 → 0.2.8 - Mend

epub-parser 0.2.7 → 0.2.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24)

checksums.yaml +4 -4
data/.gitlab-ci.yml +19 -0
data/.travis.yml +1 -1
data/CHANGELOG.markdown +6 -0
data/Gemfile +4 -0
data/README.markdown +8 -7
data/docs/Home.markdown +1 -1
data/docs/Searcher.markdown +44 -29
data/examples/find-elements-and-cfis.rb +0 -4
data/lib/epub/content_document/navigation.rb +2 -0
data/lib/epub/ocf/physical_container.rb +9 -1
data/lib/epub/ocf/physical_container/unpacked_directory.rb +1 -3
data/lib/epub/ocf/physical_container/unpacked_uri.rb +1 -3
data/lib/epub/ocf/physical_container/zipruby.rb +2 -6
data/lib/epub/parser/version.rb +1 -1
data/lib/epub/publication/package/manifest.rb +1 -0
data/lib/epub/searcher.rb +6 -2
data/lib/epub/searcher/publication.rb +57 -7
data/lib/epub/searcher/result.rb +9 -20
data/lib/epub/searcher/xhtml.rb +5 -5
data/test/helper.rb +1 -0
data/test/test_parser_cfi.rb +16 -1
data/test/test_searcher.rb +58 -22
metadata +4 -3

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: e92165c76652996a441e9996bb9bdee8bb0e7b04
-  data.tar.gz: c7a62b70d282f9b8343c0b850db21d7f078961d9
+  metadata.gz: 84aac696d82b7eb55bf80b1448685ac4c210abdd
+  data.tar.gz: a32f0e557b928502e0825cbb6b2d808f0fc9dd1d
 SHA512:
-  metadata.gz: f56160b8148faf112e6ff8941a380223f1ce4d0ad114b2375f8e9793fe4eb0d7d9e18dda540f36c1ce702c90c7791006f5fa65c270498d5d6e5b341862e6aa37
-  data.tar.gz: f139ae34069e6bcfe85d23ae5b4db32cecd99ae90cfc1fbe12ba1b2541f31d93329a6215cf099074b0fc0a3b03996ea6fca2508ad9b3165f27522be5fb8c759e
+  metadata.gz: 5a28c163db08c10c57f733d6ffc9a68a768b30a5fe84439bff1fbb03941448c822eb916f3338016b1cd8f2a96954f69a775be0f65bb629231767dfb995318934
+  data.tar.gz: f5535095748701b940555ca424f3488b4e7b007c39d6e2688cf16d00394a9e03c2c6f12290c820ca15aee2a11ce0ed43e5745225507c6baab9c2a7e33bf513ab

data/.gitlab-ci.yml ADDED

@@ -0,0 +1,19 @@
+before_script:
+  - apt-get update -qq && apt-get install -y zip
+  - ruby -v
+  - which ruby
+  - gem install bundler --no-document
+  - bundle install --jobs=$(nproc) "${FLAGS[@]}"
+test:2.2:
+  image: ruby:2.2
+  script:
+    - bundle exec rake test
+test:2.3:
+  image: ruby:2.3
+  script: bundle exec rake test
+test:2.4:
+  image: ruby:2.4
+  script: bundle exec rake test

data/.travis.yml CHANGED

@@ -1,4 +1,4 @@
 rvm:
-  - "2.1.10"
   - "2.2.5"
   - "2.3.1"
+  - "2.4.0"

data/CHANGELOG.markdown CHANGED

@@ -1,6 +1,12 @@
 CHANGELOG
 =========
+0.2.8
+-----
+* Change Searcher API: #search -> #search_text
+* Add Searcher.search_element
 0.2.7
 -----

data/Gemfile CHANGED

@@ -1,2 +1,6 @@
 source 'https://rubygems.org'
 gemspec
+if RUBY_PLATFORM.match /darwin/
+  gem 'terminal-notifier'
+end

data/README.markdown CHANGED

@@ -1,6 +1,7 @@
 EPUB Parser
 ===========
 [![Build Status](https://secure.travis-ci.org/KitaitiMakoto/epub-parser.png?branch=master)](http://travis-ci.org/KitaitiMakoto/epub-parser)
+[![build status](https://gitlab.com/KitaitiMakoto/epub-parser/badges/master/build.svg)](https://gitlab.com/KitaitiMakoto/epub-parser/commits/master)
 [![Dependency Status](https://gemnasium.com/KitaitiMakoto/epub-parser.png)](https://gemnasium.com/KitaitiMakoto/epub-parser)
 [![Gem Version](https://badge.fury.io/rb/epub-parser.svg)](http://badge.fury.io/rb/epub-parser)
@@ -31,7 +32,7 @@ USAGE
 See document's {file:docs/Home.markdown} or [API Documentation][rubydoc] for more info.
-[rubydoc]: http://rubydoc.info/gems/epub-parser
+[rubydoc]: http://www.rubydoc.info/gems/epub-parser
 ### `epubinfo` command-line tool
@@ -114,7 +115,7 @@ It will show you path to generated documentation(`/path/to/gempath/ruby/2.2.0/do
 Or, generating by yardoc command is possible, too:
-    $ git clone https://github.com/KitaitiMakoto/epub-parser.git
+    $ git clone https://gitlab.com/KitaitiMakoto/epub-parser.git
     $ cd epub-parser
     $ bundle install --path=deps
     $ bundle exec rake doc:yard
@@ -151,6 +152,11 @@ If you find other gems, please tell me or request a pull request.
 RECENT CHANGES
 --------------
+### 0.2.8
+* Change Searcher API: #search -> #search_text
+* Add Searcher.search_element
 ### 0.2.7
 * Add `EPUB::Metadata#children`
@@ -169,11 +175,6 @@ RECENT CHANGES
 [multi-rendition]: http://www.idpf.org/epub/renditions/multiple/
-### 0.2.5
-* [BUG FIX]Don't load Zip/Ruby if unneccessary
-* Add `EPUB::CFI::PhysicalContainer.find_adapter`
 See {file:CHANGELOG.markdown} for older changelogs and details.
 TODOS

data/docs/Home.markdown CHANGED

@@ -122,7 +122,7 @@ It will show you path to generated documentation(`/path/to/gempath/ruby/2.2.0/do
 Or, generating yardoc command is possible, too:
-    $ git clone https://github.com/KitaitiMakoto/epub-parser.git
+    $ git clone https://gitlab.com/KitaitiMakoto/epub-parser.git
     $ cd epub-parser
     $ bundle install --path=deps
     $ bundle exec rake doc:yard

data/docs/Searcher.markdown CHANGED

@@ -8,37 +8,37 @@ Searcher
 Example
 -------
-    epub = EPUB::Parser.parse('childrens-literature-20130206.epub')
+    epub = EPUB::Parser.parse('childrens-literature.epub')
     search_word = 'INTRODUCTORY'
-    results = EPUB::Searcher.search(epub, search_word)
-    # => [#<EPUB::Searcher::Result:0x007f938ed517a8
-    #   @end_steps=[#<EPUB::Searcher::Result::Step:0x007f938ed51a50 @index=12, @info={}, @type=:character>],
+    results = EPUB::Searcher.search_text(epub, search_word)
+    # => [#<EPUB::Searcher::Result:0x007f80ccde9528
+    #   @end_steps=[#<EPUB::Searcher::Result::Step:0x007f80ccde9730 @index=12, @info={}, @type=:character>],
     #   @parent_steps=
-    #    [#<EPUB::Searcher::Result::Step:0x007f938f1c1e78 @index=2, @info={:name=>"spine", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938f1caa78 @index=1, @info={:id=>nil}, @type=:itemref>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed521d0 @index=1, @info={:name=>"body", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed52158 @index=0, @info={:name=>"nav", :id=>"toc"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed52108 @index=1, @info={:name=>"ol", :id=>"tocList"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed52090 @index=0, @info={:name=>"li", :id=>"np-313"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed52040 @index=1, @info={:name=>"ol", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed51ff0 @index=1, @info={:name=>"li", :id=>"np-317"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed51f78 @index=0, @info={:name=>"a", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed51f28 @index=0, @info={}, @type=:text>],
-    #   @start_steps=[#<EPUB::Searcher::Result::Step:0x007f938ed51e88 @index=0, @info={}, @type=:character>]>,
-    #  #<EPUB::Searcher::Result:0x007f938ef8f5d8
-    #   @end_steps=[#<EPUB::Searcher::Result::Step:0x007f938ef8f808 @index=12, @info={}, @type=:character>],
+    #    [#<EPUB::Searcher::Result::Step:0x007f80ccf571d0 @index=2, @info={:name=>"spine", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccf3d3e8 @index=1, @info={:id=>nil}, @type=:itemref>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9e88 @index=1, @info={:name=>"body", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9e38 @index=0, @info={:name=>"nav", :id=>"toc"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9de8 @index=1, @info={:name=>"ol", :id=>"tocList"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9d98 @index=0, @info={:name=>"li", :id=>"np-313"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9d48 @index=1, @info={:name=>"ol", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9ca8 @index=1, @info={:name=>"li", :id=>"np-317"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9c08 @index=0, @info={:name=>"a", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde9bb8 @index=0, @info={}, @type=:text>],
+    #   @start_steps=[#<EPUB::Searcher::Result::Step:0x007f80ccde9af0 @index=0, @info={}, @type=:character>]>,
+    #  #<EPUB::Searcher::Result:0x007f80ccebcb30
+    #   @end_steps=[#<EPUB::Searcher::Result::Step:0x007f80ccebcdb0 @index=12, @info={}, @type=:character>],
     #   @parent_steps=
-    #    [#<EPUB::Searcher::Result::Step:0x007f938f1c1e78 @index=2, @info={:name=>"spine", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ed51730 @index=2, @info={:id=>nil}, @type=:itemref>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ef8fce0 @index=1, @info={:name=>"body", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ef8fc90 @index=0, @info={:name=>"section", :id=>"pgepubid00492"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ef8fc40 @index=3, @info={:name=>"section", :id=>"pgepubid00498"}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ef8fbf0 @index=1, @info={:name=>"h3", :id=>nil}, @type=:element>,
-    #     #<EPUB::Searcher::Result::Step:0x007f938ef8fb28 @index=0, @info={}, @type=:text>],
-    #   @start_steps=[#<EPUB::Searcher::Result::Step:0x007f938ef8fa88 @index=0, @info={}, @type=:character>]>]
-    puts results.collect(&:to_cfi_s)
-    # /6/4!/4/2[toc]/4[tocList]/2[np-313]/4/4[np-317]/2/1,:0,:12
-    # /6/6!/4/2[pgepubid00492]/8[pgepubid00498]/4/1,:0,:12
+    #    [#<EPUB::Searcher::Result::Step:0x007f80ccf571d0 @index=2, @info={:name=>"spine", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccde94b0 @index=2, @info={:id=>nil}, @type=:itemref>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccebd328 @index=1, @info={:name=>"body", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccebd2d8 @index=0, @info={:name=>"section", :id=>"pgepubid00492"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccebd260 @index=3, @info={:name=>"section", :id=>"pgepubid00498"}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccebd210 @index=1, @info={:name=>"h3", :id=>nil}, @type=:element>,
+    #     ##<EPUB::Searcher::Result::Step:0x007f80ccebd198 @index=0, @info={}, @type=:text>],
+    #   @start_steps=[#<EPUB::Searcher::Result::Step:0x007f80ccebd0d0 @index=0, @info={}, @type=:character>]>]
+    puts results.collect(&:to_cfi).collect(&:to_fragment)
+    # epubcfi(/6/4!/4/2[toc]/4[tocList]/2[np-313]/4/4[np-317]/2/1,:0,:12)
+    # epubcfi(/6/6!/4/2[pgepubid00492]/8[pgepubid00498]/4/1,:0,:12)
     # => nil
 Search result
@@ -91,4 +91,19 @@ because the words 'search' and 'word' are not in the same element.
 To use restricted searcher, specify `algorithm` option for `search` method:
-    results = EPUB::Searcher.search(epub, search_word, algorithm: :restricted)
+    results = EPUB::Searcher.search_text(epub, search_word, algorithm: :restricted)
+Element Searcher
+----------------
+You can search XHTML elements by CSS selector or XPath.
+    EPUB::Searcher::Publication.search_element(@package, css: 'ol > li').collect {|result| result[:location]}.map(&:to_fragment)
+    # => ["epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313])",
+    #  "epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313]/4/2[np-315])",
+    #  "epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313]/4/4[np-317])",
+    #  "epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313]/4/6)",
+    #  "epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313]/4/6/4/2[np-319])",
+    #  "epubcfi(/4/4!/4/2[toc]/4[tocList]/2[np-313]/4/6/4/2[np-319]/4/2)",
+    #    :
+    #    :

data/examples/find-elements-and-cfis.rb CHANGED

@@ -23,10 +23,6 @@ def main(argv)
   epub = EPUB::Parser.parse(epub_path)
   epub.package.spine.each_itemref.with_index do |itemref, i|
-    itemref_step = {
-      :step => (i + 1) * 2,
-      :id => itemref.id
-    }
     assertion = itemref.id ? EPUB::CFI::IDAssertion.new(itemref.id) : nil
     itemref_step = EPUB::CFI::Step.new((i + 1) * 2, assertion)
     path_to_itemref = EPUB::CFI::Path.new([spine_step, itemref_step])

data/lib/epub/content_document/navigation.rb CHANGED

@@ -5,6 +5,8 @@ module EPUB
       def initialize
         @navigations = []
+        @hidden = false
+        @parent = nil
         super
       end

data/lib/epub/ocf/physical_container.rb CHANGED

@@ -7,7 +7,15 @@ module EPUB
   class OCF
     # @todo: Make thread save
     class PhysicalContainer
-      class NoEntry < StandardError; end
+      class NoEntry < StandardError
+        class << self
+          def from_error(error)
+            no_entry = new(error.message)
+            no_entry.set_backtrace error.backtrace
+            no_entry
+          end
+        end
+      end
       @adapter = ArchiveZip

data/lib/epub/ocf/physical_container/unpacked_directory.rb CHANGED

@@ -9,9 +9,7 @@ module EPUB
         def read(path_name)
           ::File.read(::File.join(@container_path, path_name))
         rescue ::Errno::ENOENT => error
-          no_entry = NoEntry.new(error.message)
-          no_entry.set_backtrace error.backtrace
-          raise no_entry
+          raise NoEntry.from_error(error)
         end
       end
     end

data/lib/epub/ocf/physical_container/unpacked_uri.rb CHANGED

@@ -20,9 +20,7 @@ module EPUB
         def read(path_name)
           (@container_path + path_name).read
         rescue ::OpenURI::HTTPError => error
-          no_entry = NoEntry.new(error.message)
-          no_entry.set_backtrace error.backtrace
-          raise no_entry
+          raise NoEntry.from_error(error)
         end
       end
     end

data/lib/epub/ocf/physical_container/zipruby.rb CHANGED

@@ -11,9 +11,7 @@ module EPUB
                 @archive = archive
                 yield self
               rescue ::Zip::Error => error
-                no_entry = NoEntry.new(error.message)
-                no_entry.set_backtrace error.backtrace
-                raise no_entry
+                raise NoEntry.from_error(error)
               ensure
                 @archive = nil
               end
@@ -28,9 +26,7 @@ module EPUB
             open {|container| container.read(path_name)}
           end
         rescue ::Zip::Error => error
-          no_entry = NoEntry.new(error.message)
-          no_entry.set_backtrace error.backtrace
-          raise no_entry
+          raise NoEntry.from_error(error)
         ensure
           @archive = nil
         end

data/lib/epub/parser/version.rb CHANGED

@@ -1,5 +1,5 @@
 module EPUB
   class Parser
-    VERSION = "0.2.7"
+    VERSION = "0.2.8"
   end
 end

data/lib/epub/publication/package/manifest.rb CHANGED

@@ -101,6 +101,7 @@ module EPUB
           def initialize
             @properties = Set.new
+            @full_path = nil
           end
           def properties=(props)

data/lib/epub/searcher.rb CHANGED

@@ -5,8 +5,12 @@ require 'epub/searcher/xhtml'
 module EPUB
   module Searcher
     class << self
-      def search(epub, word, **options)
-        Publication.search(epub.package, word, options)
+      def search_text(epub, word, **options)
+        Publication.search_text(epub.package, word, options)
+      end
+      def search_element(epub, css: nil, xpath: nil, namespaces: {})
+        Publication.search_element(epub.package, css: css, xpath: xpath, namespaces: namespaces)
       end
     end
   end

data/lib/epub/searcher/publication.rb CHANGED

@@ -4,29 +4,79 @@ module EPUB
   module Searcher
     class Publication
       class << self
-        def search(package, word, **options)
-          new(word).search(package, options)
+        def search_text(package, word, **options)
+          new(package).search_text(word, options)
+        end
+        def search_element(package, css: nil, xpath: nil, namespaces: {})
+          new(package).search_element(css: css, xpath: xpath, namespaces: namespaces)
         end
       end
-      def initialize(word)
-        @word = word
+      def initialize(package)
+        @package = package
       end
-      def search(package, algorithm: :seamless)
+      def search_text(word, algorithm: :seamless)
         results = []
-        spine = package.spine
+        spine = @package.spine
         spine_step = Result::Step.new(:element, 2, {:name => 'spine', :id => spine.id})
         spine.each_itemref.with_index do |itemref, index|
           itemref_step = Result::Step.new(:itemref, index, {:id => itemref.id})
-          XHTML::ALGORITHMS[algorithm].search(Nokogiri.XML(itemref.item.read), @word).each do |sub_result|
+          XHTML::ALGORITHMS[algorithm].search_text(Nokogiri.XML(itemref.item.read), word).each do |sub_result|
             results << Result.new([spine_step, itemref_step] + sub_result.parent_steps, sub_result.start_steps, sub_result.end_steps)
           end
         end
         results
       end
+      # @todo: Refactoring
+      def search_element(css: nil, xpath: nil, namespaces: {})
+        raise ArgumentError, 'Both css and xpath are nil' if css.nil? && xpath.nil?
+        namespaces = EPUB::NAMESPACES.merge(namespaces)
+        results = []
+        spine_step = EPUB::CFI::Step.new(EPUB::Publication::Package::CONTENT_MODELS.index(:spine) * 2)
+        @package.spine.each_itemref.with_index do |itemref, index|
+          assertion = itemref.id ? EPUB::CFI::IDAssertion.new(itemref.id) : nil
+          itemref_step = EPUB::CFI::Step.new((index + 1) * 2, assertion)
+          path_to_itemref = EPUB::CFI::Path.new([spine_step, itemref_step])
+          content_document = itemref.item.content_document
+          next unless content_document
+          doc = content_document.nokogiri
+          elems = if xpath
+                    doc.xpath(xpath, namespaces)
+                  else
+                    doc.css(css)
+                  end
+          elems.each do |elem|
+            path = find_path(elem)
+            results << {
+              location: EPUB::CFI::Location.new([path_to_itemref, path]),
+              package: @package,
+              element: elem
+            }
+          end
+        end
+        results
+      end
+      private
+      def find_path(elem)
+        steps = []
+        until elem.parent.document?
+          index = elem.parent.element_children.index(elem)
+          assertion = elem["id"] ? EPUB::CFI::IDAssertion.new(elem["id"]) : nil
+          steps.unshift EPUB::CFI::Step.new((index + 1) * 2, assertion)
+          elem = elem.parent
+        end
+        EPUB::CFI::Path.new(steps)
+      end
     end
   end
 end

data/lib/epub/searcher/result.rb CHANGED

@@ -1,3 +1,6 @@
+require 'epub/cfi'
+require 'epub/parser/cfi'
 module EPUB
   module Searcher
     class Result
@@ -9,7 +12,7 @@ module EPUB
         #   # Note that c here is not included in the first element of returned value.
         # @param steps1 [Array<Step>, Array<Array>]
         # @param steps2 [Array<Step>, Array<Array>]
-        # @return [Array<Array<Array>>] Thee arrays:
+        # @return [Array<Array<Array>>] Three arrays:
         #   1. "intersection" of +steps1+ and +steps2+. "intersection" here is not the term of mathmatics
         #   2. remaining steps of +steps1+
         #   3. remaining steps of +steps2+
@@ -41,25 +44,11 @@ module EPUB
         @parent_steps, @start_steps, @end_steps = parent_steps, start_steps, end_steps
       end
-      def to_xpath_and_offset(with_xmlns=false)
-        xpath = (@parent_steps + @start_steps).reduce('.') {|path, step|
-          case step.type
-          when :element
-            path + '/%s*[%d]' % [with_xmlns ? 'xhtml:' : nil, step.index + 1]
-          when :text
-            path + '/text()[%s]' % [step.index + 1]
-          else
-            path
-          end
-        }
-        [xpath, @start_steps.last.index]
-      end
-      def to_cfi_s
-        [@parent_steps, @start_steps, @end_steps].collect {|steps|
-          steps ? steps.collect(&:to_cfi_s).join : nil
+      def to_cfi
+        str = [@parent_steps, @start_steps, @end_steps].collect {|steps|
+          steps ? steps.collect(&:to_cfi).join : nil
         }.compact.join(',')
+        EPUB::CFI(str)
       end
       def ==(other)
@@ -80,7 +69,7 @@ module EPUB
             self.info == other.info
         end
-        def to_cfi_s
+        def to_cfi
           case type
           when :element
             '/%d%s' % [(index + 1) * 2, id_assertion]

data/lib/epub/searcher/xhtml.rb CHANGED

@@ -10,8 +10,8 @@ module EPUB
         # @param element [Nokogiri::XML::Element, Nokogiri::XML::Document]
         # @param word [String]
         # @return [Array<Result>]
-        def search(element, word)
-          new(element.respond_to?(:root) ? element.root : element).search(word)
+        def search_text(element, word)
+          new(element.respond_to?(:root) ? element.root : element).search_text(word)
         end
       end
@@ -23,7 +23,7 @@ module EPUB
       class Restricted < self
         # @param element [Nokogiri::XML::Element]
         # @return [Array<Result>]
-        def search(word, element=nil)
+        def search_text(word, element=nil)
           results = []
           elem_index = 0
@@ -35,7 +35,7 @@ module EPUB
                   results << Result.new([child_step], nil, nil)
                 end
               else
-                search(word, child).each do |sub_result|
+                search_text(word, child).each do |sub_result|
                   results << Result.new([child_step] + sub_result.parent_steps, sub_result.start_steps, sub_result.end_steps)
                 end
               end
@@ -62,7 +62,7 @@ module EPUB
           @indices = nil
         end
-        def search(word)
+        def search_text(word)
           unless @indices
             @indices, @content = build_indices(@element)
           end

data/test/helper.rb CHANGED

@@ -1,3 +1,4 @@
+Encoding.default_external = 'UTF-8'
 require 'simplecov'
 SimpleCov.start do
   add_filter '/test|deps/'

data/test/test_parser_cfi.rb CHANGED

@@ -18,6 +18,7 @@ class TestParserCFI < Test::Unit::TestCase
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[,y])',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[;s=b])',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[yyy;s=b])',
+    'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[^(;s=b])',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2[;s=b])',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/3:10)',
     'epubcfi(/6/4[chap01ref]!/4[body01]/16[svgimg])',
@@ -25,7 +26,8 @@ class TestParserCFI < Test::Unit::TestCase
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:0)',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3)',
     'epubcfi(/6/4[chap01ref]!/4[body01]/10[para05],/2/1:1,/3:4)',
-    'epubcfi(/6,:1,:3)'
+    'epubcfi(/6,:1,:3)',
+    'epubcfi(/6/4[chap01ref]!/4[body01]/10[mov01]~23.5@5.75:97.6)'
   ].reduce({}) {|data, cfi|
     data[cfi] = cfi
     data
@@ -35,4 +37,17 @@ class TestParserCFI < Test::Unit::TestCase
       @parser.parse(cfi)
     end
   end
+  data([
+    '/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[(;s=b]',
+    '/6/4[chap01ref]!/4[body01]/10[para05]/2/1:3[);s=b]'
+  ].reduce({}) {|data, cfi|
+    data[cfi] = cfi
+    data
+  })
+  def test_raise_error_on_parsing_invalid_cfi(cfi)
+    assert_raise Racc::ParseError do
+      EPUB::CFI(cfi)
+    end
+  end
 end

data/test/test_searcher.rb CHANGED

@@ -1,6 +1,7 @@
 # -*- coding: utf-8 -*-
 require_relative 'helper'
 require 'epub/searcher'
+require 'epub/parser/cfi'
 class TestSearcher < Test::Unit::TestCase
   class TestPublication < self
@@ -17,7 +18,7 @@ class TestSearcher < Test::Unit::TestCase
     end
     def test_no_result
-      assert_empty EPUB::Searcher::Publication.search(@package, 'no result')
+      assert_empty EPUB::Searcher::Publication.search_text(@package, 'no result')
     end
     def test_simple
@@ -26,13 +27,53 @@ class TestSearcher < Test::Unit::TestCase
           [[[:element, 2, {:name => 'spine', :id => nil}], [:itemref, 0, {:id => nil}], [:element, 0, {:name => 'head', :id => nil}], [:element, 0, {:name => 'title', :id => nil}], [:text, 0]], [[:character, 9]], [[:character, 16]]],
           [[[:element, 2, {:name => 'spine', :id => nil}], [:itemref, 0, {:id => nil}], [:element, 1, {:name => 'body', :id => nil}], [:element, 0, {:name => 'div', :id => nil}], [:element, 0, {:name => 'nav', :id => 'idid'}], [:element, 0, {:name => 'hgroup', :id => nil}], [:element, 1, {:name => 'h1', :id => nil}], [:text, 0]], [[:character, 9]], [[:character, 16]]]
         ]),
-        EPUB::Searcher::Publication.search(@package, 'Content')
+        EPUB::Searcher::Publication.search_text(@package, 'Content')
+      )
+    end
+    def test_search_element_xpath_without_namespaces
+      assert_equal(
+        [
+          "epubcfi(/4/2!/4/2/2[idid]/4/2/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/2/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/4/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/6/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/8/2)"
+        ],
+        EPUB::Searcher::Publication.search_element(@package, xpath: './/xhtml:a').collect {|result| result[:location]}.map(&:to_fragment)
+      )
+    end
+    def test_search_element_xpath_with_namespaces
+      assert_equal(
+        [
+          "epubcfi(/4/2!/4/2/2[idid]/4/2/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/2/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/4/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/6/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/8/2)"
+        ],
+        EPUB::Searcher::Publication.search_element(@package, xpath: './/customnamespace:a', namespaces: {'customnamespace' => 'http://www.w3.org/1999/xhtml'}).collect {|result| result[:location]}.map(&:to_fragment)
+      )
+    end
+    def test_search_element_css_selector
+      assert_equal(
+        [
+          "epubcfi(/4/2!/4/2/2[idid]/4/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/2)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/4)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/6)",
+          "epubcfi(/4/2!/4/2/2[idid]/4/4/4/8)"
+        ],
+        EPUB::Searcher::Publication.search_element(@package, css: 'ol > li').collect {|result| result[:location]}.map(&:to_fragment)
       )
     end
     class TesetResult < self
-      def test_to_cfi_s
-        assert_equal '/6/2!/4/2/2[idid]/2/4/1,:9,:16', EPUB::Searcher::Publication.search(@package, 'Content').last.to_cfi_s
+      def test_to_cfi
+        assert_equal 'epubcfi(/6/2!/4/2/2[idid]/2/4/1,:9,:16)', EPUB::Searcher::Publication.search_text(@package, 'Content').last.to_cfi.to_fragment
       end
     end
   end
@@ -48,35 +89,35 @@ class TestSearcher < Test::Unit::TestCase
     module TestSearch
       def test_no_result
-        assert_empty @searcher.search(@h1, 'no result')
+        assert_empty @searcher.search_text(@h1, 'no result')
       end
       def test_simple
-        assert_equal results([[[[:text, 0]], [[:character, 9]], [[:character, 16]]]]), @searcher.search(@h1, 'Content')
+        assert_equal results([[[[:text, 0]], [[:character, 9]], [[:character, 16]]]]), @searcher.search_text(@h1, 'Content')
       end
       def test_multiple_text_result
-        assert_equal results([[[[:text, 0]], [[:character, 6]], [[:character, 7]]], [[[:text, 0]], [[:character, 10]], [[:character, 11]]]]), @searcher.search(@h1, 'o')
+        assert_equal results([[[[:text, 0]], [[:character, 6]], [[:character, 7]]], [[[:text, 0]], [[:character, 10]], [[:character, 11]]]]), @searcher.search_text(@h1, 'o')
       end
       def test_text_after_element
         elem = Nokogiri.XML('<root><elem>inner</elem>after</root>')
-        assert_equal results([[[[:text, 1]], [[:character, 0]], [[:character, 5]]]]), @searcher.search(elem, 'after')
+        assert_equal results([[[[:text, 1]], [[:character, 0]], [[:character, 5]]]]), @searcher.search_text(elem, 'after')
       end
       def test_entity_reference
         elem = Nokogiri.XML('<root>before&lt;after</root>')
-        assert_equal results([[[[:text, 0]], [[:character, 6]], [[:character, 7]]]]), @searcher.search(elem, '<')
+        assert_equal results([[[[:text, 0]], [[:character, 6]], [[:character, 7]]]]), @searcher.search_text(elem, '<')
       end
       def test_nested_result
-        assert_equal results([[[[:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 0, {:name => 'a', :id => nil}], [:text, 0]], [[:character, 0]], [[:character, 3]]]]), @searcher.search(@nav, '第二節')
+        assert_equal results([[[[:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 0, {:name => 'a', :id => nil}], [:text, 0]], [[:character, 0]], [[:character, 3]]]]), @searcher.search_text(@nav, '第二節')
       end
       def test_img
-        assert_equal [result([[[:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 1, {:name => 'ol', :id => nil}], [:element, 2, {:name => 'li', :id => nil}], [:element, 0, {:name => 'a', :id => nil}], [:element, 0, {:name => 'img', :id => nil}]], nil, nil])], @searcher.search(@nav, '第三節')
+        assert_equal [result([[[:element, 1, {:name => 'ol', :id => nil}], [:element, 1, {:name => 'li', :id => nil}], [:element, 1, {:name => 'ol', :id => nil}], [:element, 2, {:name => 'li', :id => nil}], [:element, 0, {:name => 'a', :id => nil}], [:element, 0, {:name => 'img', :id => nil}]], nil, nil])], @searcher.search_text(@nav, '第三節')
       end
     end
@@ -99,27 +140,22 @@ class TestSearcher < Test::Unit::TestCase
       def test_seamless
         elem = Nokogiri.XML('<root>This <em>includes</em> a child element.</root>')
-        assert_equal results([[[], [[:text, 0], [:character, 0]], [[:text, 1], [:character, 17]]]]), @searcher.search(elem, 'This includes a child element.')
+        assert_equal results([[[], [[:text, 0], [:character, 0]], [[:text, 1], [:character, 17]]]]), @searcher.search_text(elem, 'This includes a child element.')
       end
     end
     class TestResult < self
       def setup
         super
-        @result = EPUB::Searcher::XHTML::Restricted.search(@doc, '第二節').first
-      end
-      def test_to_xpath_and_offset
-        assert_equal ['./*[2]/*[1]/*[1]/*[2]/*[2]/*[2]/*[2]/*[1]/text()[1]', 0], @result.to_xpath_and_offset
-        assert_equal ['./xhtml:*[2]/xhtml:*[1]/xhtml:*[1]/xhtml:*[2]/xhtml:*[2]/xhtml:*[2]/xhtml:*[2]/xhtml:*[1]/text()[1]', 0], @result.to_xpath_and_offset(true)
+        @result = EPUB::Searcher::XHTML::Restricted.search_text(@doc, '第二節').first
       end
-      def test_to_cfi_s
-        assert_equal '/4/2/2[idid]/4/4/4/4/2/1,:0,:3', @result.to_cfi_s
+      def test_to_cfi
+        assert_equal 'epubcfi(/4/2/2[idid]/4/4/4/4/2/1,:0,:3)', @result.to_cfi.to_fragment
       end
-      def test_to_cfi_s_img
-        assert_equal '/4/2/2[idid]/4/4/4/6/2/2', EPUB::Searcher::XHTML::Restricted.search(@doc, '第三節').first.to_cfi_s
+      def test_to_cfi_img
+        assert_equal 'epubcfi(/4/2/2[idid]/4/4/4/6/2/2)', EPUB::Searcher::XHTML::Restricted.search_text(@doc, '第三節').first.to_cfi.to_fragment
       end
     end
   end

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: epub-parser
 version: !ruby/object:Gem::Version
-  version: 0.2.7
+  version: 0.2.8
 platform: ruby
 authors:
 - KITAITI Makoto
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2016-07-30 00:00:00.000000000 Z
+date: 2017-02-07 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: rake
@@ -301,6 +301,7 @@ extra_rdoc_files: []
 files:
 - ".gemtest"
 - ".gitignore"
+- ".gitlab-ci.yml"
 - ".gitmodules"
 - ".travis.yml"
 - ".yardopts"
@@ -419,7 +420,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
       version: '0'
 requirements: []
 rubyforge_project:
-rubygems_version: 2.5.1
+rubygems_version: 2.6.8
 signing_key:
 specification_version: 4
 summary: EPUB 3 Parser