RubyGems - linkedindata - Versions diffs - 0.0.11 → 0.0.12 - Mend

linkedindata 0.0.11 → 0.0.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3)

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 94bb03be0b7d5757a4ec8175b829db45bf1ea0d5
-  data.tar.gz: c51b94a00043330d9ba9b821c7ecdb47a11b3340
+  metadata.gz: 8f7c5ffe3de4948c6b28d505079581a10825ea91
+  data.tar.gz: 05df543799dd12fbc1e6c25671f539d5644aefab
 SHA512:
-  metadata.gz: 306b9d008c6f5958357ff94b2b07379e5bbf66631a343133d7471c459a5eaf66a5e6fd3d5d8cdeb6caca3d6b56873718c7f07ee049f2c4c329f8f106105dd6a4
-  data.tar.gz: 15d39ed929395b149807868875a614c188a22bacf773d546cc5fce84080ab8db732558bd29de5e9819f12ccb429c21c4a10c85544dd02e48bec4bc4a649df4ad
+  metadata.gz: a62b36e080463295eb988c37e8538f2f0181561f1fa48b7e61f0f8c13334990953c830fafd7db852fbaddace5f7c204ea441becc3f9c7995b372bb7feff90dc6
+  data.tar.gz: 7d1c02373a972dbaf6851179b46fcee58c30e04a321cfa54143ef5b96b053b973b4b9123531a95722393d02953d2050ecbc45ccbec34f6dd7b46faa4108e77b0

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: linkedindata
 version: !ruby/object:Gem::Version
-  version: 0.0.11
+  version: 0.0.12
 platform: ruby
 authors:
 - M. C. McGrath
@@ -15,8 +15,7 @@ email: shidash@shidash.com
 executables: []
 extensions: []
 extra_rdoc_files: []
-files:
-- lib/linkedindata.rb
+files: []
 homepage: https://github.com/transparencytoolkit/linkedindata
 licenses:
 - GPL

data/lib/linkedindata.rb DELETED Viewed

@@ -1,85 +0,0 @@
-require 'mechanize'
-require 'linkedin-scraper'
-require 'json'
-require 'nokogiri'
-require 'open-uri'
-load 'parseprofile.rb'
-require 'pry'
-require 'urlarchiver'
-class LinkedinData
-  def initialize(input, todegree)
-    @input = input
-    @output = Array.new
-    @startindex = 10
-  end
-  # Searches for profiles on Google
-  def search
-    agent = Mechanize.new
-    agent.user_agent_alias = 'Linux Firefox'
-    gform = agent.get("http://google.com").form("f")
-    gform.q = "site:linkedin.com/pub " + @input
-    page = agent.submit(gform, gform.buttons.first)
-    examine(page)
-  end
-  # Examines a search page
-  def examine(page)
-    # Separate getting profile links and going to next page
-      # Method for getting links to all result pages
-      # Different method for getting all profile links on page and scraping (split to new thread for this)
-         # Has own output set, merge into full one at end (make sure threadsafe)
-    # Have own input and output
-    page.links.each do |link|
-      if (link.href.include? "linkedin.com") && (!link.href.include? "webcache") && (!link.href.include? "site:linkedin.com/pub+")
-        saveurl = link.href.split("?q=")
-        if saveurl[1]
-          url = saveurl[1].split("&")
-          begin
-            scrape(url[0])
-          rescue
-          end
-        end
-      end
-      # Find the link to the next page and go to it
-      if (link.href.include? "&sa=N") && (link.href.include? "&start=")
-        url1 = link.href.split("&start=")
-        url2 = url1[1].split("&sa=N")
-        if url2[0].to_i == @startindex
-          sleep(rand(5..10))
-          @startindex += 10
-          agent = Mechanize.new
-          examine(agent.get("http://google.com" + link.href))
-        end
-      end
-    end
-  end
-  # Scrapes profile
-  def scrape(url)
-    # Download profile and rescue on error
-    begin
-      url.gsub!("https", "http")
-      profile = Linkedin::Profile.get_profile(url)
-    rescue
-    end
-    # Parse profile if returned
-    if profile
-      p = ParseProfile.new(profile, url)
-      @output.concat(p.parse)
-    end
-  end
-  # Gets all data and returns in JSON
-  def getData
-    search
-    formatted_json = JSON.pretty_generate(@output)
-    return formatted_json
-  end
-end