RubyGems - yayimdbs - Versions diffs - 0.1.8 → 0.1.9 - Mend

yayimdbs 0.1.8 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

data/lib/yay_imdbs.rb +29 -11
metadata +5 -35

data/lib/yay_imdbs.rb CHANGED

@@ -1,7 +1,15 @@
 # encoding: UTF-8
 require 'open-uri'
 require 'nokogiri'
-require 'active_support/all'
+begin
+  # Rails 3
+  require 'active_support/core_ext/object'
+  require 'active_support/core_ext/hash/indifferent_access.rb'
+rescue
+  # Rails 2.3
+  require 'active_support/all'
+end
 class YayImdbs
   IMDB_BASE_URL = 'http://www.imdb.com/'
@@ -74,10 +82,10 @@ class YayImdbs
     info_hash[:plot] = doc.xpath("//td[@id='overview-top']/p[2]").inner_text.strip
     found_info_divs = false
-    doc.xpath("//div[@class='txt-block']").each do |div|
-      next if div.xpath(".//h4").empty?
+    doc.xpath("//div/h4").each do |h4|
+      div = h4.parent
       found_info_divs = true
-      raw_key = div.xpath(".//h4").first.inner_text
+      raw_key = h4.inner_text
       key = raw_key.sub(':', '').strip.downcase
       value = div.inner_text[((div.inner_text =~ /#{Regexp.escape(raw_key)}/) + raw_key.length).. -1]
       value = value.gsub(/\302\240\302\273/u, '').strip.gsub(/(See more)|(see all)$/, '').strip
@@ -95,15 +103,24 @@ class YayImdbs
         else
           p "Unexpected runtime format #{value} for movie #{imdb_id}"
         end
-      elsif key == 'genre'
-        value = value.strip.split
+      elsif key == 'genres'
+        value = value.split('|').collect { |l| l.gsub(/[^a-zA-Z0-9\-]/, '') }
+        # Backwards compatibility hack
+        info_hash[:genre] = value
       elsif key == 'year'
         value = value.split('|').collect { |l| l.strip.to_i }.reject { |y| y <= 0 }
+        # TV shows can have multiple years
+        info_hash[:years] = value
+        value = value.sort.first
       elsif key == 'language'
-        value = value.split('|').collect { |l| l.strip }
+        value = value.split('|').collect { |l| l.gsub(/[^a-zA-Z0-9]/, '') }
       elsif key == 'taglines'
         # Backwards compatibility
         info_hash['tagline'] = value
+      elsif key == 'motion picture rating (mpaa)'
+        value = value.gsub(/See all certifications/, '').strip
+        # Backwards compatibility FIXME do with a map
+        info_hash['mpaa'] = value
       end
       info_hash[key.downcase.gsub(/\s/, '_')] = value
     end
@@ -117,7 +134,7 @@ class YayImdbs
     #scrap episodes if tv series
     if info_hash.has_key?('season')
-      self.scrap_episodes(doc, info_hash)
+      self.scrap_episodes(info_hash)
     end
     return info_hash
@@ -144,15 +161,16 @@ class YayImdbs
     end
    end
-   def self.scrap_episodes(doc, info_hash)
+   def self.scrap_episodes(info_hash)
       episodes = []
       doc = self.get_episodes_page(info_hash[:imdb_id])
       episode_divs = doc.css(".filter-all")
       episode_divs.each do |e_div|
         if e_div.xpath('.//h3').inner_text =~ /Season (\d+), Episode (\d+):/
           episode = {"series" => $1.to_i, "episode" => $2.to_i, "title" => $'.strip}
-          if e_div.xpath(".//td").inner_text =~ /(\d+ (January|February|March|April|May|June|July|August|September|October|November|December) \d{4})/
-            episode['date'] = Date.parse($1)
+          raw_date = e_div.xpath('.//span/strong').inner_text.strip
+          episode['date'] = Date.parse(raw_date)
+          if e_div.inner_text =~ /#{raw_date}/
             episode['plot'] = $'.strip
           end
           episodes << episode

metadata CHANGED

@@ -5,8 +5,8 @@ version: !ruby/object:Gem::Version
   segments:
   - 0
   - 1
-  - 8
-  version: 0.1.8
+  - 9
+  version: 0.1.9
 platform: ruby
 authors:
 - Sam Cavenagh
@@ -14,7 +14,7 @@ autorequire:
 bindir: bin
 cert_chain: []
-date: 2010-10-14 00:00:00 +11:00
+date: 2010-10-25 00:00:00 +11:00
 default_executable:
 dependencies:
 - !ruby/object:Gem::Dependency
@@ -47,40 +47,10 @@ dependencies:
         version: 3.0.0
   type: :runtime
   version_requirements: *id002
-- !ruby/object:Gem::Dependency
-  name: tzinfo
-  prerelease: false
-  requirement: &id003 !ruby/object:Gem::Requirement
-    none: false
-    requirements:
-    - - ">="
-      - !ruby/object:Gem::Version
-        segments:
-        - 0
-        - 3
-        - 22
-        version: 0.3.22
-  type: :runtime
-  version_requirements: *id003
-- !ruby/object:Gem::Dependency
-  name: i18n
-  prerelease: false
-  requirement: &id004 !ruby/object:Gem::Requirement
-    none: false
-    requirements:
-    - - ">="
-      - !ruby/object:Gem::Version
-        segments:
-        - 0
-        - 4
-        - 1
-        version: 0.4.1
-  type: :runtime
-  version_requirements: *id004
 - !ruby/object:Gem::Dependency
   name: rspec
   prerelease: false
-  requirement: &id005 !ruby/object:Gem::Requirement
+  requirement: &id003 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ">="
@@ -91,7 +61,7 @@ dependencies:
         - 0
         version: 2.0.0
   type: :development
-  version_requirements: *id005
+  version_requirements: *id003
 description: A simple imdb scraper built on Nokogiri for ruby 1.9+
 email: cavenaghweb@hotmail.com
 executables: []