RubyGems - linkedin-scraper - Versions diffs - 0.1.0 → 0.1.1 - Mend

linkedin-scraper 0.1.0 → 0.1.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (7)

checksums.yaml +4 -4
data/.gitignore +1 -0
data/.travis.yml +0 -1
data/bin/linkedin-scraper +1 -1
data/lib/linkedin-scraper/profile.rb +36 -78
data/lib/linkedin-scraper/version.rb +1 -1
metadata +4 -3

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 23c5331d7544944c0d719cac70b4b281f53c5de3
-  data.tar.gz: 84d78b9812b6f5f0b572481bdad5b550e6d39b16
+  metadata.gz: d72a6f4f56878e6396f87b2114ee75e73cb71fc4
+  data.tar.gz: 7ec26c6b44a2cec0551d544ecc72152683eb439a
 SHA512:
-  metadata.gz: 763a28b6d6a482f8534c3339ddedefcc31784000dce77eb129282b0cff4ee402a2c962e778d75b9925113830fa466058f6eee1dcad4378555d2a8db4bbc67e91
-  data.tar.gz: 0d7f262e9aa12896e33fd9d9abe347ceb95854fbb9b9eef600b0e04d5cd9a3c6de3ccd81c2fdf20d0968dfb64af94be9e3c3c4457f39f3b420d700192d2c224a
+  metadata.gz: f69f100f22938a93703177a2495ef439cdb7120c89d2d23ba231849a37a65a9b20173456d68421280faf572798b88e5271f042cb6a8fccba742bd5c2e48299c1
+  data.tar.gz: e2509eed12a03b23be0860b057c7031c9e467c26e8d2fe2048d7aefa381228ae3ef515fbc0708945a54c1f7e3912b24c0ebfeb3540cd6837350ad378971ea139

data/.gitignore CHANGED Viewed

@@ -18,3 +18,4 @@ test/version_tmp
 tmp
 .ruby-version
 .ruby-gemset
+.projectile

data/.travis.yml CHANGED Viewed

@@ -4,4 +4,3 @@ rvm:
   - 1.9.3
   - 1.9.2
   - jruby-19mode
-  - rbx-19mode

data/bin/linkedin-scraper CHANGED Viewed

@@ -2,4 +2,4 @@
 require_relative '../lib/linkedin-scraper'
 profile = Linkedin::Profile.new(ARGV[0])
-puts profile.to_json
+puts JSON.pretty_generate JSON.parse(profile.to_json)

data/lib/linkedin-scraper/profile.rb CHANGED Viewed

@@ -70,85 +70,51 @@ module Linkedin
     end
     def education
-      unless @education
-        @education = []
-        if @page.search('.position.education.vevent.vcard').first
-          @education = @page.search('.position.education.vevent.vcard').map do |item|
-            name   = item.at('h3').text.gsub(/\s+|\n/, ' ').strip      if item.at('h3')
-            desc   = item.at('h4').text.gsub(/\s+|\n/, ' ').strip      if item.at('h4')
-            period = item.at('.period').text.gsub(/\s+|\n/, ' ').strip if item.at('.period')
-            {:name => name, :description => desc, :period => period}
-          end
-        end
+      @education ||= @page.search('.position.education.vevent.vcard').map do |item|
+        name   = item.at('h3').text.gsub(/\s+|\n/, ' ').strip      if item.at('h3')
+        desc   = item.at('h4').text.gsub(/\s+|\n/, ' ').strip      if item.at('h4')
+        period = item.at('.period').text.gsub(/\s+|\n/, ' ').strip if item.at('.period')
+        {:name => name, :description => desc, :period => period}
       end
-      @education
     end
     def websites
-      unless @websites
-        @websites = []
-        if @page.search('.website').first
-          @websites = @page.search('.website').map do |site|
-            url = site.at('a')['href']
-            url = "http://www.linkedin.com#{url}"
-            CGI.parse(URI.parse(url).query)['url']
-          end.flatten!
-        end
+      @websites ||=  @page.search('.website').flat_map do |site|
+        url = "http://www.linkedin.com#{site.at('a')['href']}"
+        CGI.parse(URI.parse(url).query)['url']
       end
-      @websites
     end
     def groups
-      unless @groups
-        @groups = []
-        if page.search('.group-data').first
-          @groups = page.search('.group-data').map do |item|
-            name = item.text.gsub(/\s+|\n/, ' ').strip
-            link = "http://www.linkedin.com#{item.at('a')['href']}"
-            {:name => name, :link => link}
-          end
-        end
+      @groups ||= @page.search('.group-data').map do |item|
+        name = item.text.gsub(/\s+|\n/, ' ').strip
+        link = "http://www.linkedin.com#{item.at('a')['href']}"
+        {:name => name, :link => link}
       end
-      @groups
     end
     def organizations
-      unless @organizations
-        @organizations = []
-        if @page.search('ul.organizations/li.organization').first
-          @organizations = @page.search('ul.organizations/li.organization').map do |item|
-            name       = item.search('h3').text.gsub(/\s+|\n/, ' ').strip rescue nil
-            start_date, end_date = item.search('ul.specifics li').text.gsub(/\s+|\n/, ' ').strip.split(' to ')
-            start_date = Date.parse(start_date) rescue nil
-            end_date   = Date.parse(end_date)   rescue nil
-            {:name => name, :start_date => start_date, :end_date => end_date}
-          end
-        end
+      @organizations ||= @page.search('ul.organizations/li.organization').map do |item|
+        name       = item.search('h3').text.gsub(/\s+|\n/, ' ').strip rescue nil
+        start_date, end_date = item.search('ul.specifics li').text.gsub(/\s+|\n/, ' ').strip.split(' to ')
+        start_date = Date.parse(start_date) rescue nil
+        end_date   = Date.parse(end_date)   rescue nil
+        {:name => name, :start_date => start_date, :end_date => end_date}
       end
-      @organizations
     end
     def languages
-      unless @languages
-        @languages = []
-        if @page.at('ul.languages/li.language')
-          @languages = @page.search('ul.languages/li.language').map do |item|
-            language    = item.at('h3').text rescue nil
-            proficiency = item.at('span.proficiency').text.gsub(/\s+|\n/, ' ').strip rescue nil
-            {:language=> language, :proficiency => proficiency }
-          end
-        end
+      @languages ||= @page.search('ul.languages/li.language').map do |item|
+        language    = item.at('h3').text rescue nil
+        proficiency = item.at('span.proficiency').text.gsub(/\s+|\n/, ' ').strip rescue nil
+        {:language=> language, :proficiency => proficiency }
       end
-      @languages
     end
     def certifications
-      unless @certtifications
-        @certifications = []
-        if @page.at('ul.certifications/li.certification')
-          @certifications = @page.search('ul.certifications/li.certification').map do |item|
+        @certifications ||= @page.search('ul.certifications/li.certification').map do |item|
             name       = item.at('h3').text.gsub(/\s+|\n/, ' ').strip                         rescue nil
             authority  = item.at('.specifics/.org').text.gsub(/\s+|\n/, ' ').strip            rescue nil
             license    = item.at('.specifics/.licence-number').text.gsub(/\s+|\n/, ' ').strip rescue nil
@@ -156,27 +122,19 @@ module Linkedin
             {:name => name, :authority => authority, :license => license, :start_date => start_date}
           end
-        end
-      end
-      @certifications
     end
     def recommended_visitors
-      unless @recommended_visitors
-        @recommended_visitors = []
-        if @page.at('.browsemap/.content/ul/li')
-          @recommended_visitors = @page.search('.browsemap/.content/ul/li').map do |visitor|
-            v = {}
-            v[:link]    = visitor.at('a')['href']
-            v[:name]    = visitor.at('strong/a').text
-            v[:title]   = visitor.at('.headline').text.gsub('...',' ').split(' at ').first
-            v[:company] = visitor.at('.headline').text.gsub('...',' ').split(' at ')[1]
-            v
-          end
-        end
+      @recommended_visitors ||= @page.search('.browsemap/.content/ul/li').map do |visitor|
+        v = {}
+        v[:link]    = visitor.at('a')['href']
+        v[:name]    = visitor.at('strong/a').text
+        v[:title]   = visitor.at('.headline').text.gsub('...',' ').split(' at ').first
+        v[:company] = visitor.at('.headline').text.gsub('...',' ').split(' at ')[1]
+        v
       end
-      @recommended_visitors
     end
     def to_json
@@ -196,11 +154,11 @@ module Linkedin
           company[:title]       = node.at('h3').text.gsub(/\s+|\n/, ' ').strip if node.at('h3')
           company[:company]     = node.at('h4').text.gsub(/\s+|\n/, ' ').strip if node.at('h4')
           company[:description] = node.at(".description.#{type}-position").text.gsub(/\s+|\n/, ' ').strip if node.at(".description.#{type}-position")
-          start_date  = node.at('.dtstart').text.gsub(/\s+|\n/, ' ').strip rescue nil
+          start_date  = node.at('.dtstart')['title'] rescue nil
           company[:start_date] = parse_date(start_date) rescue nil
-          end_date = node.at('.dtend').text.gsub(/\s+|\n/, ' ').strip rescue nil
-          end_date ||= node.at('.dtstamp').text.gsub(/\s+|\n/, ' ').strip rescue nil
+          end_date = node.at('.dtend')['title'] rescue nil
           company[:end_date] = parse_date(end_date) rescue nil
           company_link = node.at('h4/strong/a')['href'] if node.at('h4/strong/a')

data/lib/linkedin-scraper/version.rb CHANGED Viewed

@@ -1,5 +1,5 @@
 module Linkedin
   module Scraper
-    VERSION = '0.1.0'
+    VERSION = '0.1.1'
   end
 end

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: linkedin-scraper
 version: !ruby/object:Gem::Version
-  version: 0.1.0
+  version: 0.1.1
 platform: ruby
 authors:
 - Yatish Mehta
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-11-13 00:00:00.000000000 Z
+date: 2014-03-25 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: mechanize
@@ -93,7 +93,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
       version: '0'
 requirements: []
 rubyforge_project:
-rubygems_version: 2.1.2
+rubygems_version: 2.1.11
 signing_key:
 specification_version: 4
 summary: when a url of  public linkedin profile page is given it scrapes the entire
@@ -102,3 +102,4 @@ test_files:
 - spec/fixtures/jgrevich.html
 - spec/linkedin-scraper/profile_spec.rb
 - spec/spec_helper.rb
+has_rdoc: