linkedincrawler 0.0.5 → 0.0.6

Sign up to get free protection for your applications and to get access to all the features.
Files changed (3) hide show
  1. checksums.yaml +4 -4
  2. data/lib/linkedincrawler.rb +18 -5
  3. metadata +1 -1
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: c1933a4a905a2b52b2d3b888d54c4d8d044ec7c5
4
- data.tar.gz: 771175b55c592fc4bf14317a1c63cc76efb4ecd9
3
+ metadata.gz: 99433021962017d0dc2ef40342127cce06abac54
4
+ data.tar.gz: 4a0a0a5441e6a9bcdb76ce69b9fb1be8f3647619
5
5
  SHA512:
6
- metadata.gz: a427d86d2ddc648e1bb6362b93f97ffb56e1f68420ce418d6b4754062e752b8961b8e4e72da6a465c990d69367097e37e1d3a9ac054394e077de6449ca1fe62d
7
- data.tar.gz: 23618949f1ce1bd4eaf16589bed5078e6cc840b36f8c8624f6e477e0f89890c48ac1c5efa5a8d2d191119689509f5284090714c8380693d1ae7fc93bd014c92f
6
+ metadata.gz: ec59a52e5c73cdf9f3d91bd4e7936a2957c7671ee92d5566f06ba64ae230380ecfcb00aa52093bed3c84b5909309f1b1f41d3b40d78968b66a116c8215f149ba
7
+ data.tar.gz: 1bafd3d56a9b3ad9422a25ef2118cb610aaa229eb899c63a070fa46c8c933b65052402f8191246421fbaa8983910591a3fbb38bce704d48f0c6e1457a8b7f549
@@ -19,11 +19,21 @@ class LinkedinCrawler
19
19
  def search
20
20
  # Run Google search
21
21
  g = GeneralScraper.new("site:linkedin.com/pub -site:linkedin.com/pub/dir/", @search_terms, @proxy_list)
22
-
23
- # Scrape each resulting LinkedIn page
24
- JSON.parse(g.getURLs).each do |profile|
25
- if profile.include?(".linkedin.") && !profile.include?("/search")
26
- scrape(profile)
22
+ begin
23
+ urls = g.getURLs
24
+ rescue # Search again if it didn't work the first time
25
+ search
26
+ end
27
+
28
+ # Search again if it didn't run
29
+ if urls.length == 0 || urls.empty?
30
+ search
31
+ else
32
+ # Scrape each resulting LinkedIn page
33
+ JSON.parse(urls).each do |profile|
34
+ if profile.include?(".linkedin.") && !profile.include?("/search")
35
+ scrape(profile)
36
+ end
27
37
  end
28
38
  end
29
39
 
@@ -64,3 +74,6 @@ class LinkedinCrawler
64
74
  JSON.pretty_generate(@output)
65
75
  end
66
76
  end
77
+ c = LinkedinCrawler.new("remotely piloted aircraft", 5, "/home/shidash/proxylist2", [3, 5])
78
+ c.search
79
+ File.write("test.json", c.gen_json)
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: linkedincrawler
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.5
4
+ version: 0.0.6
5
5
  platform: ruby
6
6
  authors:
7
7
  - M. C. McGrath