linkedincrawler 0.0.14 → 0.0.15

Sign up to get free protection for your applications and to get access to all the features.
Files changed (3)
  1. checksums.yaml +4 -4
  2. data/lib/linkedincrawler.rb +9 -3
  3. metadata +2 -2
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 9cab546fac1482b262f2435257af20d645b7a2ca
4
- data.tar.gz: 8a18d774dbaf1791b13a104b85bd96edd3400dc9
3
+ metadata.gz: d133e662b783dcf61594013b375ddec17cb22102
4
+ data.tar.gz: 4c477ee0f284c4bc13171d25c747cf9f2b42c090
5
5
  SHA512:
6
- metadata.gz: fb059768cdaf5204cfef18ca7fc8ec8670c0ed4bed5346fc984ab57a44eb6d7fa988e8e2b584920b1f500a20257196fcf45bedaafdf86197887e3ad232fe398c
7
- data.tar.gz: e6b09adb74fec01250746172e372e82b5277badda83c8156d8c60049945d36bdafcc528e5bf69f2063c219cfc3508c771138d363a0226742ac45aa25a0eb00e7
6
+ metadata.gz: 47a121927417ce0d195d5be681d533f35c88613710f104d540e032bc9539ebd25840163eda54c75a63caeb27924f1fc65fd767042e5e18664d4c0fd13809e01e
7
+ data.tar.gz: 87f53246bb4d98c67683525ea32095729a453502e0426f87268edd949809fea93ea27da0f288598a1698202b433e7a75f660c64820a2bb66b2605a56ad8d563c
@@ -6,7 +6,7 @@ require 'selenium-webdriver'
6
6
  require 'pry'
7
7
 
8
8
  class LinkedinCrawler
9
- def initialize(search_terms, retry_limit, requests, requests_google, solver_details)
9
+ def initialize(search_terms, retry_limit, requests, requests_google, requests_google2, solver_details)
10
10
  @search_terms = search_terms
11
11
  @output = Array.new
12
12
 
@@ -15,6 +15,7 @@ class LinkedinCrawler
15
15
 
16
16
  @requests = requests
17
17
  @requests_google = requests_google
18
+ @requests_google2 = requests_google2
18
19
  @solver_details = solver_details
19
20
  end
20
21
 
@@ -23,9 +24,13 @@ class LinkedinCrawler
23
24
  # Run Google search
24
25
  g = GeneralScraper.new("site:linkedin.com/pub -site:linkedin.com/pub/dir/", @search_terms, @requests_google, @solver_details)
25
26
  urls = g.getURLs
26
-
27
+
28
+ # Look for new LI urls
29
+ g2 = GeneralScraper.new("site:linkedin.com/in", @search_terms, @requests_google2, @solver_details)
30
+ urls = JSON.parse(urls) + JSON.parse(g2.getURLs)
31
+
27
32
  # Scrape each resulting LinkedIn page
28
- JSON.parse(urls).each do |profile|
33
+ urls.each do |profile|
29
34
  if check_right_page(profile)
30
35
  scrape(profile)
31
36
  end
@@ -85,3 +90,4 @@ class LinkedinCrawler
85
90
  JSON.pretty_generate(@output)
86
91
  end
87
92
  end
93
+
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: linkedincrawler
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.14
4
+ version: 0.0.15
5
5
  platform: ruby
6
6
  authors:
7
7
  - M. C. McGrath
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2015-12-06 00:00:00.000000000 Z
11
+ date: 2016-03-16 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description: Crawls public LinkedIn profiles via Google
14
14
  email: shidash@shidash.com