RubyGems - rbook - Versions diffs - 0.4.3 → 0.5 - Mend

rbook 0.4.3 → 0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

data/Rakefile +13 -176
metadata +57 -117
data/COPYING +0 -340
data/LICENSE +0 -13
data/README +0 -17
data/examples/gbip.rb +0 -12
data/examples/onix/stream_reader.rb +0 -13
data/examples/pacstream.rb +0 -13
data/examples/titlepage.rb +0 -14
data/examples/titlepage_with_proxy.rb +0 -14
data/examples/titlepage_www.rb +0 -18
data/examples/www/find_all.rb +0 -23
data/examples/www/find_cover_from_amazon.rb +0 -16
data/examples/www/find_url_from_rainbow.rb +0 -12
data/examples/www/list.rb +0 -13
data/lib/rbook/bisac.rb +0 -31
data/lib/rbook/bisac/message.rb +0 -99
data/lib/rbook/bisac/po.rb +0 -97
data/lib/rbook/bisac/po_line_item.rb +0 -33
data/lib/rbook/bisac/product.rb +0 -176
data/lib/rbook/errors.rb +0 -8
data/lib/rbook/gbip.rb +0 -21
data/lib/rbook/gbip/pos.rb +0 -118
data/lib/rbook/gbip/title.rb +0 -36
data/lib/rbook/gbip/warehouse.rb +0 -27
data/lib/rbook/isbn.rb +0 -255
data/lib/rbook/onix.rb +0 -70
data/lib/rbook/onix/contributor.rb +0 -60
data/lib/rbook/onix/lists.rb +0 -2
data/lib/rbook/onix/lists/contributor_role.rb +0 -10
data/lib/rbook/onix/lists/product_form.rb +0 -100
data/lib/rbook/onix/message.rb +0 -112
data/lib/rbook/onix/product.rb +0 -189
data/lib/rbook/onix/sales_restriction.rb +0 -51
data/lib/rbook/onix/stream_reader.rb +0 -120
data/lib/rbook/onix/stream_writer.rb +0 -40
data/lib/rbook/onix/supply_detail.rb +0 -68
data/lib/rbook/onix/xchar.rb +0 -98
data/lib/rbook/pacstream.rb +0 -64
data/lib/rbook/titlepage.rb +0 -37
data/lib/rbook/titlepage/client.rb +0 -126
data/lib/rbook/titlepage/titlepage_driver.rb +0 -137
data/lib/rbook/titlepage/titlepage_utils.rb +0 -379
data/lib/rbook/titlepage/wwwclient.rb +0 -96
data/lib/rbook/www.rb +0 -172
data/lib/rbook/www/aau_scraper.rb +0 -76
data/lib/rbook/www/amazon_uk_scraper.rb +0 -44
data/lib/rbook/www/ban_scraper.rb +0 -62
data/lib/rbook/www/base.rb +0 -87
data/lib/rbook/www/harper_au_scraper.rb +0 -56
data/lib/rbook/www/harper_us_scraper.rb +0 -55
data/lib/rbook/www/hha_scraper.rb +0 -50
data/lib/rbook/www/macmillan_scraper.rb +0 -62
data/lib/rbook/www/orbis_scraper.rb +0 -48
data/lib/rbook/www/oup_scraper.rb +0 -64
data/lib/rbook/www/paulist_scraper.rb +0 -53
data/lib/rbook/www/pearson_au_scraper.rb +0 -52
data/lib/rbook/www/penguin_scraper.rb +0 -45
data/lib/rbook/www/random_au_scraper.rb +0 -90
data/lib/rbook/www/random_us_scraper.rb +0 -59
data/lib/rbook/www/sas_scraper.rb +0 -54
data/lib/rbook/www/unireps_scraper.rb +0 -58
data/lib/rbook/www/wiley_us_scraper.rb +0 -54
data/test/data/abingdon.xml +0 -38931
data/test/data/augsburg.xml +0 -39009
data/test/data/bisac_po.txt +0 -112
data/test/data/chalice.xml +0 -10851
data/test/data/eerdsman.xml +0 -36942
data/test/data/invalid_no_product.xml +0 -9
data/test/data/not_xml.csv +0 -1
data/test/data/single_product.xml +0 -50
data/test/data/valid_bisac.txt +0 -213
data/test/data/xml_not_onix.xml +0 -7
data/test/mocks/titlepage_driver.rb +0 -111
data/test/unit/bisac/bisac_test.rb +0 -96
data/test/unit/bisac/po_line_item_test.rb +0 -38
data/test/unit/bisac/po_test.rb +0 -82
data/test/unit/isbn_test.rb +0 -153
data/test/unit/onix/contributor_test.rb +0 -50
data/test/unit/onix/message_test.rb +0 -119
data/test/unit/onix/product_test.rb +0 -101
data/test/unit/onix/sales_restriction_test.rb +0 -48
data/test/unit/onix/stream_reader_test.rb +0 -22
data/test/unit/onix/stream_writer_test.rb +0 -32
data/test/unit/onix/supply_detail_test.rb +0 -53
data/test/unit/onix/xchar_test.rb +0 -37
data/test/unit/titlepage_test.rb +0 -140

data/lib/rbook/www/base.rb DELETED

@@ -1,87 +0,0 @@
-require 'net/http'
-require 'uri'
-module RBook
-  module WWW
-  class Base
-    @@scrapers = []
-    # registers a new scraper with the library.
-    # classname - the class to add
-    def self.add_scraper(classname)
-      @@scrapers << classname
-    end
-    # find a scraper matching the requested id
-    # id - a scraper id as a symbol
-    def self.find_scraper(id)
-      @@scrapers.each do |scraper|
-        return scraper if scraper::SCRAPER_ID == id
-      end
-      return nil
-    end
-    # find any scrapers matching the requested ids
-    # ids - an array of scraper id's as symbols
-    def self.find_scrapers(ids)
-      ret = []
-      @@scrapers.each do |scraper|
-        ret << scraper if ids.include?(scraper::SCRAPER_ID)
-      end
-      return ret
-    end
-    # This method can be overwritten in each scraper. It should return a hash containing the binary data
-    # and mimetype of the largest cover image it can find for the requested isbn
-    def get_cover(isbn)
-      info = get_info(isbn)
-      return nil if info.nil?
-      return nil unless info.kind_of?(Hash)
-      link = info[:cover_large] || info[:cover_medium] || info[:cover_thumb]
-      return nil if link.nil?
-      begin
-        response = Net::HTTP.get_response URI.parse(link)
-          if response.code != "200"
-            raise response.code.to_s
-            return nil
-          else
-            result = {}
-            result[:data] = response.body
-            result[:content_type] = "image/jpeg"
-            return result
-          end
-      rescue
-        return nil
-      end
-    end
-    # This method can be overwritten in each scraper. It should return a hash of any information on
-    # the requested isbn it can find
-    def get_info(isbn)
-      nil
-    end
-    # This method can be overwritten in each scraper. It should return a link to the requested isbn
-    # on the targets website
-    def get_link(isbn)
-      nil
-    end
-    # return the symbol used to uniquely identify each scraper
-    def scraper_id
-      return SCRAPER_ID
-    end
-    def self.scrapers
-      @@scrapers
-    end
-  end
-end
-end

data/lib/rbook/www/harper_au_scraper.rb DELETED

@@ -1,56 +0,0 @@
-module RBook
-  module WWW
-  class HarperCollinsAUScraper < Base
-    SCRAPER_ID = :harper_au
-    SCRAPER_NAME = "Harper Collins Australia".freeze
-    SCRAPER_SITE = "http://www.harpercollins.com.au/".freeze
-    #add_publisher( self, "9780006400000", "9780006499999" )
-    #add_publisher( self, "9780007100000", "9780007199999" )
-    add_scraper( self )
-    def get_info(isbn)
-      raise ArgumentError, 'Supplied isbn is not valid' unless ISBN::valid_isbn?(isbn)
-      isbn = ISBN::convert_to_isbn13(isbn) unless ISBN::valid_isbn13?(isbn)
-      @protocol = "http://"
-      @host = "www.harpercollins.com.au"
-      @path = "/global_scripts/product_catalog/book_xml.asp?isbn="
-      @link = @protocol + @host + @path + ISBN::convert_to_isbn10(isbn)
-      rba = Scraper.define do
-        process "div.header", :title => :text
-        process "div.subtitle", :subtitle => :text
-        process "div.byline", :author => :text
-        process "img.bookJacket", :cover => "@src"
-        result :title, :subtitle, :author, :cover
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = rba.scrape(content)
-      if result.title.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:title] = result.title
-        info[:subtitle] = result.subtitle
-        info[:author] = result.author.gsub("by ","")
-        info[:cover] = result.cover
-        info[:link] = @link
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end

data/lib/rbook/www/harper_us_scraper.rb DELETED

@@ -1,55 +0,0 @@
-module RBook
-  module WWW
-  class HarperCollinsUSScraper < Base
-    SCRAPER_ID = :harper_us
-    SCRAPER_NAME = "Harper Collins United States".freeze
-    SCRAPER_SITE = "http://www.harpercollins.com/".freeze
-    #add_publisher( self, "9780060000000", "9780060999999" )
-    add_scraper( self )
-    def get_info(isbn)
-      raise ArgumentError, 'Supplied isbn is not valid' unless ISBN::valid_isbn?(isbn)
-      isbn = ISBN::convert_to_isbn13(isbn) unless ISBN::valid_isbn13?(isbn)
-      @protocol = "http://"
-      @host = "www.harpercollins.com"
-      @path = "/book/index.aspx?isbn="
-      @link = @protocol + @host + @path + isbn
-      rba = Scraper.define do
-        process "h1.bookTitle", :title => :text
-        process "h2.bookSubTitle", :subtitle => :text
-        process "h3.byLine", :author => :text
-        process "img.bookJacket", :cover => "@src"
-        result :title, :subtitle, :author, :cover
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = rba.scrape(content)
-      if result.title.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:title] = result.title
-        info[:subtitle] = result.subtitle
-        info[:author] = result.author.gsub("by ", "")
-        info[:cover_thumb] = result.cover
-        info[:cover_medium] = result.cover.gsub("medium", "large")
-        info[:link] = @link
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end

data/lib/rbook/www/hha_scraper.rb DELETED

@@ -1,50 +0,0 @@
-module RBook
-  module WWW
-  class HHAScraper < Base
-    SCRAPER_ID = :hha
-    SCRAPER_NAME = "Hodder Headline Australia".freeze
-    SCRAPER_SITE = "http://www.hha.com.au/".freeze
-    #add_publisher( self, "9780340800000", "9780340899999" )
-    #add_publisher( self, "9780755300000", "9780755399999" )
-    #add_publisher( self, "9780733600000", "9780733699999" )
-    add_scraper( self )
-    def get_info(isbn)
-      @protocol = "http://"
-      @host = "www.hha.com.au"
-      @path = "/books/"
-      @suffix = ".html"
-      @link = @protocol + @host + @path + ISBN::convert_to_isbn10(isbn) + @suffix
-      rba = Scraper.define do
-        process "h1.fiction", :title => :text
-        process "p.author", :author => :text
-        process "p.thumb>img", :cover_thumb => "@src"
-        result :title, :author, :cover_thumb
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = rba.scrape(content)
-      if result.cover_thumb.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:author] = result.author
-        info[:cover_thumb] = @protocol + @host + result.cover_thumb
-        info[:link] = @link
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end

data/lib/rbook/www/macmillan_scraper.rb DELETED

@@ -1,62 +0,0 @@
-module RBook
-  module WWW
-  class MacmillanScraper < Base
-    SCRAPER_ID = :macmillan
-    SCRAPER_NAME = "Pan Macmillan".freeze
-    SCRAPER_SITE = "http://www.panmacmillan.com.au/".freeze
-    #add_publisher( self, "9780312900000", "9780312999999" )
-    #add_publisher( self, "9780330400000", "9780330499999" )
-    #add_publisher( self, "9781403000000", "9781405099999" )
-    add_scraper( self )
-    def initialize
-      @url_protocol = "http://"
-      @url_host = "www.panmacmillan.com.au"
-      @url_path = "/display_title.asp?ISBN="
-      @url_suffix = "&Author=Barker,%20Robin"
-    end
-    def get_info(isbn)
-      isbn = ISBN::convert_to_isbn13(isbn)
-      return nil if isbn.nil?
-      mac = Scraper.define do
-        process "div.titlecontent>div.isbn>span", :isbn => :text
-        process "td[width=70%]>h1", :title => :text
-        process "a[title=Click on image to view a larger version]>img", :cover_medium => "@src"
-        process "a[title=Click on image to view a larger version]", :cover_large => "@href"
-        result :isbn, :title, :cover_medium, :cover_large
-      end
-      content = Net::HTTP.get URI.parse(get_link(isbn))
-      result = mac.scrape(content)
-      if result.title.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:title] = result.title
-        info[:cover_medium] = @url_protocol + @url_host + result.cover_medium.gsub("..", "") unless result.cover_medium.nil?
-        info[:cover_large] = @url_protocol + @url_host + result.cover_large.gsub("..", "") unless result.cover_large.nil?
-        info[:link] = get_link(isbn)
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-    def get_link(isbn)
-      return nil unless ISBN::valid_isbn?(isbn)
-      return @url_protocol + @url_host + @url_path + ISBN::convert_to_isbn10(isbn) + @url_suffix
-    end
-  end
-  end
-end

data/lib/rbook/www/orbis_scraper.rb DELETED

@@ -1,48 +0,0 @@
-module RBook
-  module WWW
-  class OrbisScraper < Base
-    SCRAPER_ID = :orbis
-    SCRAPER_NAME = "Orbis Books"
-    SCRAPER_SITE = "http://www.orbisbooks.com/"
-    #add_publisher( self, "978157070000", "9781570799999")
-    add_scraper( self )
-    def get_info(isbn)
-      @protocol = "http://"
-      @host = "www.maryknollmall.org"
-      @path = "/description.cfm?ISBN="
-      @grouped_isbn = ISBN::add_groups(ISBN::convert_to_isbn10(isbn))
-      @link = @protocol + @host + @path + @grouped_isbn
-      oup = Scraper.define do
-        process "tr>td[colspan=4]>font[size=3]", :description => :text # doesn't currently work
-        process "table>tr>td[rowspan=2]>img", :cover_thumb => "@src"
-        result :description, :cover_thumb
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = oup.scrape(content)
-      if result.cover_thumb.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:cover_thumb] = @protocol + @host + result.cover_thumb unless result.cover_thumb.nil?
-        info[:link] = @link
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end

data/lib/rbook/www/oup_scraper.rb DELETED

@@ -1,64 +0,0 @@
-module RBook
-  module WWW
-  class OUPScraper < Base
-    SCRAPER_ID = :oup
-    SCRAPER_NAME = "Oxford University Press"
-    SCRAPER_SITE = "http://au.oup.com/"
-    #add_publisher( self, "978019200000", "978019999999")
-    add_scraper( self )
-    def get_info(isbn)
-      isbn = ISBN::convert_to_isbn10(isbn)
-      @protocol = "http://"
-      @host = "au.oup.com"
-      @path = "/searchbuy/SearchBook.asp?isbn="
-      @link = @protocol + @host + @path + isbn
-      oup = Scraper.define do
-        process "div.isbn13", :isbn => :text
-        process "td.title", :title => :text
-        process "td.author", :author => :text
-        process "div.BookInfo", :misc => :text
-        process "td>p.blurb", :description => :text
-        process "td>img[width=100]", :cover => "@src"
-        result :isbn, :title, :author, :misc, :description, :cover
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = oup.scrape(content)
-      if result.isbn.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = result.isbn.gsub(/\ ISBN-13:\n/, "")
-        info[:title] = result.title
-        info[:author] = result.author
-        info[:description] = result.description
-        info[:cover_thumb] = @protocol + @host + result.cover
-        info[:link] = @link
-        tmp = result.misc.match(/\n(.+)\n(.+) pages\n(.+)\n(.+)\n(.+)/)
-        if !tmp.nil? && tmp.length == 5
-          info[:published] = tmp[1]
-          info[:pages] = tmp[2]
-          info[:format] = tmp[3]
-          info[:rrp] = tmp[4]
-        end
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end

data/lib/rbook/www/paulist_scraper.rb DELETED

@@ -1,53 +0,0 @@
-module RBook
-  module WWW
-  class PaulistScraper < Base
-    SCRAPER_ID = :paulist
-    SCRAPER_NAME = "Paulist Press".freeze
-    SCRAPER_SITE = "http://www.paulistpress.com/".freeze
-    #add_publisher( self, "9780809100000", "9780809199999" )
-    add_scraper( self )
-    def get_info(isbn)
-      raise ArgumentError, 'Supplied isbn is not valid' unless ISBN::valid_isbn?(isbn)
-      isbn = ISBN::convert_to_isbn13(isbn) unless ISBN::valid_isbn13?(isbn)
-      @protocol = "http://"
-      @host = "www.paulistpress.com"
-      @path = "/"
-      @abv_isbn = ISBN::convert_to_isbn10(isbn)[-5, 5]
-      @suffix = ".html"
-      @link = @protocol + @host + @path + @abv_isbn[0,4] + "-" + @abv_isbn[-1,1] + @suffix
-      rba = Scraper.define do
-        process "tr>td>h4", :title => :text
-        process "img[width=120][height=180]", :cover => "@src"
-        result :title, :cover
-      end
-      content = Net::HTTP.get URI.parse(@link)
-      result = rba.scrape(content)
-      if result.title.nil?
-        return nil
-      else
-        info = {}
-        info[:isbn] = isbn
-        info[:title] = result.title.gsub("Details for ", "")
-        info[:cover_thumb] = @protocol + @host + result.cover
-        info[:link] = @link
-        info[:from_name] = SCRAPER_NAME
-        info[:from_url] = SCRAPER_SITE
-        return info
-      end
-    end
-  end
-  end
-end