RubyGems - linkedindata - Versions diffs - 0.0.1 - Mend

linkedindata 0.0.1

Files changed (2) hide show

data/lib/linkedindata.rb +69 -0
metadata +47 -0

data/lib/linkedindata.rb ADDED Viewed

@@ -0,0 +1,69 @@
+require 'mechanize'
+require 'linkedin-scraper'
+require 'json'
+class LinkedinData # Collects company entries from LinkedIn profiles found by Googling the given terms; getData returns them as a JSON string.
+  def initialize(input) # input: the search terms; concatenated onto the Google query string in search
+   @input = input
+   @output = Array.new # accumulates the entries pushed by scrape
+  end
+  # Submits the query "site:linkedin.com/pub <input>" through form "f" on google.com and hands the result page to examine.
+  def search
+    agent = Mechanize.new
+    gform = agent.get("http://google.com").form("f")
+    gform.q = "site:linkedin.com/pub " + @input
+    page = agent.submit(gform, gform.buttons.first) # submit using the form's first button
+    examine(page)
+  end
+  # Examines a search page: scrapes every LinkedIn result link on it and may recurse into a further results page (see the start= check).
+  def examine(page)
+    startindex = 0 # most recent "start=" offset seen among this page's links
+    page.links.each do |link| # NOTE(review): link.href is called unguarded below; if a link's href can be nil this raises - confirm
+      if (link.href.include? "linkedin.com") && (!link.href.include? "webcache") && (!link.href.include? "site:linkedin.com/pub+") # LinkedIn link that is neither a "webcache" link nor one echoing the query
+        saveurl = link.href.split("?q=")
+        if saveurl[1] # only hrefs that actually contain "?q=" carry a target URL
+          url = saveurl[1].split("&") # the target URL is the text between "?q=" and the next "&"
+          scrape(url[0])
+        end
+      end
+      if (link.href.include? "&sa=N") && (link.href.include? "&start=") # presumably Google's pagination links - TODO confirm
+        url1 = link.href.split("&start=")
+        url2 = url1[1].split("&sa=N") # url2[0] is the text between "&start=" and "&sa=N", read as the offset
+        if url2[0].to_i < startindex # offset lower than the previous one; presumably the "Next" link repeating an earlier offset - TODO confirm
+          agent = Mechanize.new # fresh agent for the follow-up request
+          examine(agent.get("http://google.com" + link.href)) # href is appended to the host, so it is treated as a relative path
+        else startindex = url2[0].to_i # otherwise just remember this offset
+        end
+      end
+    end
+  end
+  # Fetches the profile at url via Linkedin::Profile.get_profile and pushes one entry per current and past company, each tagged with :name.
+  def scrape(url)
+    profile = Linkedin::Profile.get_profile(url)
+    if profile # a falsy profile is skipped silently
+      profile.current_companies.each do |c|
+        c.merge!(:name => profile.first_name + " " + profile.last_name) # adds "first last" to the entry in place
+        @output.push(c)
+      end
+      profile.past_companies.each do |c|
+        c.merge!(:name => profile.first_name + " " + profile.last_name) # same tagging as for current companies
+        @output.push(c)
+      end
+    end
+  end
+  # Runs search (which fills @output as a side effect) and returns @output serialized with to_json.
+  def getData
+    search
+    return @output.to_json
+  end
+end

metadata ADDED Viewed

@@ -0,0 +1,47 @@
+--- !ruby/object:Gem::Specification
+name: linkedindata
+version: !ruby/object:Gem::Version
+  version: 0.0.1
+  prerelease:
+platform: ruby
+authors:
+- M. C. McGrath
+autorequire:
+bindir: bin
+cert_chain: []
+date: 2014-01-07 00:00:00.000000000 Z
+dependencies: [] # NOTE(review): empty, although lib/linkedindata.rb requires 'mechanize' and 'linkedin-scraper' - confirm whether they should be declared
+description: Scrapes all LinkedIn profiles including terms you specify.
+email: shidash@shidash.com
+executables: []
+extensions: []
+extra_rdoc_files: []
+files:
+- lib/linkedindata.rb
+homepage: https://github.com/Shidash/LinkedInData
+licenses:
+- GPL
+post_install_message:
+rdoc_options: []
+require_paths:
+- lib
+required_ruby_version: !ruby/object:Gem::Requirement
+  none: false
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0' # ">= 0": no lower bound on the Ruby version
+required_rubygems_version: !ruby/object:Gem::Requirement
+  none: false
+  requirements:
+  - - ! '>='
+    - !ruby/object:Gem::Version
+      version: '0' # ">= 0": no lower bound on the RubyGems version
+requirements: []
+rubyforge_project:
+rubygems_version: 1.8.23
+signing_key:
+specification_version: 3
+summary: Get all LinkedIn profiles including terms you specify
+test_files: []
+has_rdoc: