RubyGems - newly - Versions diffs - 1.0.0 → 1.1.0 - Mend

newly 1.0.0 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

data/README.rdoc CHANGED Viewed

@@ -1,17 +1,18 @@
 = newly
-Fetching breaking news from websites
+==Fetching breaking news from websites
+* Based on Nokogiri https://github.com/sparklemotion/nokogiri
 == SYNOPSIS:
   # Fetching breaking news from some website
   reader = Newly.new('http://g1.globo.com/bahia/')
   news = reader.highlights(
                             selector: '#ultimas-regiao div, #ultimas-regiao ul li',
-                            url: 'a',
+                            href: 'a',
                             date: '.data-hora',
                             title: '.titulo',
                             subtitle: '.subtitulo',
-                            image: 'img')
+                            img: 'img')
   # Presentation News
   news.each do |n|

data/VERSION CHANGED Viewed

	@@ -1 +1 @@
1	- 1.0.0
1	+ 1.1.0

data/lib/newly.rb CHANGED Viewed

@@ -6,13 +6,9 @@ class Newly
   attr_reader :title, :selector, :url
-  def initialize(url, html_file=nil)
+  def initialize(url, selector=Nokogiri::HTML(open(url)))
     @url = url
-    if (html_file)
-      @selector = Nokogiri::HTML.parse(File.read(html_file))
-    else
-      @selector = Nokogiri::HTML(open(url))
-    end
+    @selector = selector
     @title = @selector.at_css("title").text
   end
@@ -20,25 +16,19 @@ class Newly
     news = Array.new
     @selector.css(args[:selector]).each do |item|
       if (item)
-        url = item.css(args[:url]).map { |doc| doc['href'] }.first if args[:url]
-        # doc = Nokogiri::HTML(open(url))
-        # keywords = doc.xpath("//meta[@name='Keywords']/@content") if doc
-        keywords = nil
+        href = item.css(args[:href]).map { |doc| doc['href'] }.first if args[:href]
         date = item.css(args[:date]).text if args[:date]
         title = item.css(args[:title]).text if args[:title]
         subtitle = item.css(args[:subtitle]).text if args[:subtitle]
-        image = item.css(args[:image]).map { |doc| doc['src'] }.first if args[:image]
+        img = item.css(args[:img]).map { |doc| doc['src'] }.first if args[:img]
         if (args[:host])
           host = args[:host]
           url = "#{host}/#{url}".gsub('../', '') if url
           image = "#{host}/#{image}".gsub('../', '') if image && image.include?('../')
         end
-        news << News.new(url: url, keywords: keywords, date: date, title: title, subtitle: subtitle, image: image)
+        news << News.new(url: href, keywords: keywords, date: date, title: title, subtitle: subtitle, image: img)
       end
     end
     news
   end
 end

data/newly.gemspec CHANGED Viewed

@@ -5,11 +5,11 @@
 Gem::Specification.new do |s|
   s.name = "newly"
-  s.version = "1.0.0"
+  s.version = "1.1.0"
   s.required_rubygems_version = Gem::Requirement.new(">= 0") if s.respond_to? :required_rubygems_version=
   s.authors = ["Alab\u{ea} Duarte"]
-  s.date = "2012-08-13"
+  s.date = "2012-08-14"
   s.description = "Fetching breaking news from websites"
   s.email = "alabeduarte@gmail.com"
   s.extra_rdoc_files = [

data/spec/newly_spec.rb CHANGED Viewed

@@ -2,10 +2,11 @@ require File.expand_path(File.dirname(__FILE__) + '/spec_helper')
 # require 'spec_helper'
 describe Newly do
-  let(:ec_bahia) { ec_bahia = Newly.new('http://www.ecbahia.com', 'spec/html/ecbahia.html') }
-  let(:g1) { g1_bahia = Newly.new('http://g1.globo.com', 'spec/html/g1.html') }
-  let(:g1_bahia) { g1_bahia = Newly.new('http://g1.globo.com/bahia/', 'spec/html/g1_bahia.html') }
-  let(:metro1) { g1_bahia = Newly.new('http://www.metro1.com.br/portal/?varSession=noticia&varEditoria=cidade', 'spec/html/metro1_cidade.html') }
+  let(:selector) { Nokogiri::HTML }
+  let(:ec_bahia) { Newly.new('http://www.ecbahia.com', parse('spec/html/ecbahia.html')) }
+  let(:g1) { Newly.new('http://g1.globo.com', parse('spec/html/g1.html')) }
+  let(:g1_bahia) { Newly.new('http://g1.globo.com/bahia/', parse('spec/html/g1_bahia.html')) }
+  let(:metro1) { Newly.new('http://www.metro1.com.br/portal/?varSession=noticia&varEditoria=cidade', parse('spec/html/metro1_cidade.html')) }
   it "should fetch ecbahia title" do
     ec_bahia.title.should == "ecbahia.com - \u00e9 goleada tricolor na internet!  (ecbahia, ecbahia.com, ecbahia.com.br, Esporte Clube Bahia)"
@@ -13,11 +14,11 @@ describe Newly do
   it "should fetch highlights from http://g1.globo.com/bahia" do
     highlights = g1_bahia.highlights( selector: '#ultimas-regiao div, #ultimas-regiao ul li',
-                                      url: 'a',
+                                      href: 'a',
                                       date: '.data-hora',
                                       title: '.titulo',
                                       subtitle: '.subtitulo',
-                                      image: 'img'
+                                      img: 'img'
                                       )
     highlights.should_not be_empty
   end
@@ -25,10 +26,10 @@ describe Newly do
   context "fetching news from http://g1.globo.com" do
     it "should fetch highlights news" do
       highlights = g1.highlights( selector: '#glb-corpo .glb-area .chamada-principal',
-                                        url: 'a',
+                                        href: 'a',
                                         title: '.chapeu',
                                         subtitle: '.subtitulo',
-                                        image: '.foto a img'
+                                        img: '.foto a img'
                                         )
       highlights.should_not be_empty
       highlights[0].url.should == 'http://g1.globo.com/mundo/noticia/2012/08/ira-encerra-resgate-apos-terremotos-e-revisa-mortos-para-227-diz-tv-estatal.html'
@@ -43,10 +44,10 @@ describe Newly do
     xit "should fetch keywords" do
       highlights = g1.highlights( selector: '#glb-corpo .glb-area .chamada-principal',
-                                        url: 'a',
+                                        href: 'a',
                                         title: '.chapeu',
                                         subtitle: '.subtitulo',
-                                        image: '.foto a img'
+                                        img: '.foto a img'
                                         )
       highlights[0].url.should == 'http://g1.globo.com/mundo/noticia/2012/08/ira-encerra-resgate-apos-terremotos-e-revisa-mortos-para-227-diz-tv-estatal.html'
       highlights[0].keywords.should == 'noticias, noticia, Mundo'
@@ -55,13 +56,18 @@ describe Newly do
   it "should fetch highlights from http://www.metro1.com.br" do
     highlights = metro1.highlights( selector: '#lista-de-resultados .resultado',
-                                      url: 'a',
+                                      href: 'a',
                                       date: '.resultado-data',
                                       title: '.resultado-titulo',
                                       subtitle: '.resultado-texto',
-                                      image: 'a img.img-resultado',
+                                      img: 'a img.img-resultado',
                                       host: 'http://www.metro1.com.br'
                                       )
     highlights.should_not be_empty
   end
+private
+  def parse(path)
+    selector.parse(File.read(path))
+  end
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: newly
 version: !ruby/object:Gem::Version
-  version: 1.0.0
+  version: 1.1.0
   prerelease:
 platform: ruby
 authors:
@@ -9,11 +9,11 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2012-08-13 00:00:00.000000000 Z
+date: 2012-08-14 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: nokogiri
-  requirement: &70275429701820 !ruby/object:Gem::Requirement
+  requirement: &70132223688900 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ! '>='
@@ -21,10 +21,10 @@ dependencies:
         version: '0'
   type: :runtime
   prerelease: false
-  version_requirements: *70275429701820
+  version_requirements: *70132223688900
 - !ruby/object:Gem::Dependency
   name: rspec
-  requirement: &70275429699520 !ruby/object:Gem::Requirement
+  requirement: &70132223687300 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ~>
@@ -32,10 +32,10 @@ dependencies:
         version: 2.8.0
   type: :development
   prerelease: false
-  version_requirements: *70275429699520
+  version_requirements: *70132223687300
 - !ruby/object:Gem::Dependency
   name: rdoc
-  requirement: &70275429697780 !ruby/object:Gem::Requirement
+  requirement: &70132223684620 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ~>
@@ -43,10 +43,10 @@ dependencies:
         version: '3.12'
   type: :development
   prerelease: false
-  version_requirements: *70275429697780
+  version_requirements: *70132223684620
 - !ruby/object:Gem::Dependency
   name: bundler
-  requirement: &70275429696240 !ruby/object:Gem::Requirement
+  requirement: &70132223715700 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ~>
@@ -54,10 +54,10 @@ dependencies:
         version: 1.1.5
   type: :development
   prerelease: false
-  version_requirements: *70275429696240
+  version_requirements: *70132223715700
 - !ruby/object:Gem::Dependency
   name: jeweler
-  requirement: &70275429694540 !ruby/object:Gem::Requirement
+  requirement: &70132223714340 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ~>
@@ -65,10 +65,10 @@ dependencies:
         version: 1.8.4
   type: :development
   prerelease: false
-  version_requirements: *70275429694540
+  version_requirements: *70132223714340
 - !ruby/object:Gem::Dependency
   name: simplecov
-  requirement: &70275429735780 !ruby/object:Gem::Requirement
+  requirement: &70132223712120 !ruby/object:Gem::Requirement
     none: false
     requirements:
     - - ! '>='
@@ -76,7 +76,7 @@ dependencies:
         version: '0'
   type: :development
   prerelease: false
-  version_requirements: *70275429735780
+  version_requirements: *70132223712120
 description: Fetching breaking news from websites
 email: alabeduarte@gmail.com
 executables: []
@@ -119,7 +119,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: -2351285680129146534
+      hash: 4551793471179022495
 required_rubygems_version: !ruby/object:Gem::Requirement
   none: false
   requirements: