linkedin-scraper-v2 0.1.8 → 0.1.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/bin/linkedin-scraper +1 -1
- metadata +17 -37
- data/.gitignore +0 -23
- data/.rubocop.yml +0 -11
- data/.travis.yml +0 -8
- data/Gemfile +0 -4
- data/LICENSE +0 -22
- data/README.md +0 -272
- data/Rakefile +0 -3
- data/lib/linkedin_scraper.rb +0 -5
- data/lib/linkedin_scraper/profile.rb +0 -252
- data/lib/linkedin_scraper/version.rb +0 -5
- data/linkedin-scraper.gemspec +0 -22
- data/spec/fixtures/jeffweiner08.html +0 -308
- data/spec/linkedin_scraper/profile_spec.rb +0 -110
- data/spec/spec_helper.rb +0 -17
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 735f35e301624a85934837627b44373effea2af1
|
4
|
+
data.tar.gz: a04506d29ca7979008d95d29c4085d9e97050dd7
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 8b73e4a9f0ecfeca8dc062e10096460db3ff20b80eedf283f870b31f4ff2e46c68e3f64411d7d5edecdab15ef69c6c239a1b2a29335c11721f8935f01dae5e70
|
7
|
+
data.tar.gz: 00506fb9daa0e52e702c57e0f383288442f34f951bed871cc2dab889e1d94198caac93b1cc82db9950a96616eec0747abb884df60d91fc3cd580f611024d9cd8
|
data/bin/linkedin-scraper
CHANGED
metadata
CHANGED
@@ -1,83 +1,67 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: linkedin-scraper-v2
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.
|
4
|
+
version: 0.1.9
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Yatish Mehta
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2015-10-
|
11
|
+
date: 2015-10-07 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: mechanize
|
15
15
|
requirement: !ruby/object:Gem::Requirement
|
16
16
|
requirements:
|
17
|
-
- -
|
17
|
+
- - '>='
|
18
18
|
- !ruby/object:Gem::Version
|
19
|
-
version: '
|
19
|
+
version: '0'
|
20
20
|
type: :runtime
|
21
21
|
prerelease: false
|
22
22
|
version_requirements: !ruby/object:Gem::Requirement
|
23
23
|
requirements:
|
24
|
-
- -
|
24
|
+
- - '>='
|
25
25
|
- !ruby/object:Gem::Version
|
26
|
-
version: '
|
26
|
+
version: '0'
|
27
27
|
- !ruby/object:Gem::Dependency
|
28
28
|
name: rspec
|
29
29
|
requirement: !ruby/object:Gem::Requirement
|
30
30
|
requirements:
|
31
|
-
- -
|
31
|
+
- - '>='
|
32
32
|
- !ruby/object:Gem::Version
|
33
|
-
version: '
|
33
|
+
version: '0'
|
34
34
|
type: :development
|
35
35
|
prerelease: false
|
36
36
|
version_requirements: !ruby/object:Gem::Requirement
|
37
37
|
requirements:
|
38
|
-
- -
|
38
|
+
- - '>='
|
39
39
|
- !ruby/object:Gem::Version
|
40
|
-
version: '
|
40
|
+
version: '0'
|
41
41
|
- !ruby/object:Gem::Dependency
|
42
42
|
name: rake
|
43
43
|
requirement: !ruby/object:Gem::Requirement
|
44
44
|
requirements:
|
45
|
-
- -
|
45
|
+
- - '>='
|
46
46
|
- !ruby/object:Gem::Version
|
47
|
-
version: '
|
47
|
+
version: '0'
|
48
48
|
type: :development
|
49
49
|
prerelease: false
|
50
50
|
version_requirements: !ruby/object:Gem::Requirement
|
51
51
|
requirements:
|
52
|
-
- -
|
52
|
+
- - '>='
|
53
53
|
- !ruby/object:Gem::Version
|
54
|
-
version: '
|
55
|
-
description: 'Scrapes the
|
54
|
+
version: '0'
|
55
|
+
description: 'Scrapes the linkedin profile when a url is given '
|
56
56
|
email:
|
57
57
|
executables:
|
58
58
|
- linkedin-scraper
|
59
59
|
extensions: []
|
60
60
|
extra_rdoc_files: []
|
61
61
|
files:
|
62
|
-
- .gitignore
|
63
|
-
- .rubocop.yml
|
64
|
-
- .travis.yml
|
65
|
-
- Gemfile
|
66
|
-
- LICENSE
|
67
|
-
- README.md
|
68
|
-
- Rakefile
|
69
62
|
- bin/linkedin-scraper
|
70
|
-
- lib/linkedin_scraper.rb
|
71
|
-
- lib/linkedin_scraper/profile.rb
|
72
|
-
- lib/linkedin_scraper/version.rb
|
73
|
-
- linkedin-scraper.gemspec
|
74
|
-
- spec/fixtures/jeffweiner08.html
|
75
|
-
- spec/linkedin_scraper/.DS_Store
|
76
|
-
- spec/linkedin_scraper/profile_spec.rb
|
77
|
-
- spec/spec_helper.rb
|
78
63
|
homepage: https://github.com/yatishmehta27/linkedin-scraper
|
79
|
-
licenses:
|
80
|
-
- MIT
|
64
|
+
licenses: []
|
81
65
|
metadata: {}
|
82
66
|
post_install_message:
|
83
67
|
rdoc_options: []
|
@@ -100,8 +84,4 @@ signing_key:
|
|
100
84
|
specification_version: 4
|
101
85
|
summary: when a url of public linkedin profile page is given it scrapes the entire
|
102
86
|
page and converts into a accessible object
|
103
|
-
test_files:
|
104
|
-
- spec/fixtures/jeffweiner08.html
|
105
|
-
- spec/linkedin_scraper/.DS_Store
|
106
|
-
- spec/linkedin_scraper/profile_spec.rb
|
107
|
-
- spec/spec_helper.rb
|
87
|
+
test_files: []
|
data/.gitignore
DELETED
@@ -1,23 +0,0 @@
|
|
1
|
-
*.gem
|
2
|
-
*.rbc
|
3
|
-
.bundle
|
4
|
-
.config
|
5
|
-
.rspec
|
6
|
-
.yardoc
|
7
|
-
Gemfile.lock
|
8
|
-
InstalledFiles
|
9
|
-
_yardoc
|
10
|
-
coverage
|
11
|
-
doc/
|
12
|
-
lib/bundler/man
|
13
|
-
pkg
|
14
|
-
rdoc
|
15
|
-
spec/reports
|
16
|
-
test/tmp
|
17
|
-
test/version_tmp
|
18
|
-
tmp
|
19
|
-
.ruby-version
|
20
|
-
.ruby-gemset
|
21
|
-
.projectile
|
22
|
-
*.DS_Store
|
23
|
-
.idea/*
|
data/.rubocop.yml
DELETED
data/.travis.yml
DELETED
data/Gemfile
DELETED
data/LICENSE
DELETED
@@ -1,22 +0,0 @@
|
|
1
|
-
Copyright (c) 2012 Yatish Mehta
|
2
|
-
|
3
|
-
MIT License
|
4
|
-
|
5
|
-
Permission is hereby granted, free of charge, to any person obtaining
|
6
|
-
a copy of this software and associated documentation files (the
|
7
|
-
"Software"), to deal in the Software without restriction, including
|
8
|
-
without limitation the rights to use, copy, modify, merge, publish,
|
9
|
-
distribute, sublicense, and/or sell copies of the Software, and to
|
10
|
-
permit persons to whom the Software is furnished to do so, subject to
|
11
|
-
the following conditions:
|
12
|
-
|
13
|
-
The above copyright notice and this permission notice shall be
|
14
|
-
included in all copies or substantial portions of the Software.
|
15
|
-
|
16
|
-
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
17
|
-
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
18
|
-
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
19
|
-
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
20
|
-
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
21
|
-
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
22
|
-
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
data/README.md
DELETED
@@ -1,272 +0,0 @@
|
|
1
|
-
[](http://travis-ci.org/yatish27/linkedin-scraper)
|
2
|
-
[](http://badge.fury.io/rb/linkedin-scraper)
|
3
|
-
|
4
|
-
Linkedin Scraper
|
5
|
-
================
|
6
|
-
|
7
|
-
Linkedin-scraper is a gem for scraping linkedin public profiles.
|
8
|
-
Given the URL of the profile, it gets the name, country, title, area, current companies, past companies,
|
9
|
-
organizations, skills, groups, etc
|
10
|
-
|
11
|
-
|
12
|
-
## Installation
|
13
|
-
|
14
|
-
Install the gem from RubyGems:
|
15
|
-
|
16
|
-
gem install linkedin-scraper
|
17
|
-
|
18
|
-
This gem is tested on 1.9.2, 1.9.3, 2.0.0, JRuby1.9, rbx1.9,
|
19
|
-
|
20
|
-
## Usage
|
21
|
-
|
22
|
-
|
23
|
-
Initialize a scraper instance
|
24
|
-
|
25
|
-
profile = Linkedin::Profile.get_profile("http://www.linkedin.com/in/jeffweiner08")
|
26
|
-
|
27
|
-
The returning object responds to the following methods
|
28
|
-
|
29
|
-
|
30
|
-
profile.first_name # The first name of the contact
|
31
|
-
|
32
|
-
profile.last_name # The last name of the contact
|
33
|
-
|
34
|
-
profile.name # The full name of the profile
|
35
|
-
|
36
|
-
profile.title # The job title
|
37
|
-
|
38
|
-
profile.summary # The summary of the profile
|
39
|
-
|
40
|
-
profile.location # The location of the contact
|
41
|
-
|
42
|
-
profile.country # The country of the contact
|
43
|
-
|
44
|
-
profile.industry # The domain for which the contact belongs
|
45
|
-
|
46
|
-
profile.picture # The profile picture link of profile
|
47
|
-
|
48
|
-
profile.skills # Array of skills of the profile
|
49
|
-
|
50
|
-
profile.organizations # Array organizations of the profile
|
51
|
-
|
52
|
-
profile.education # Array of hashes for education
|
53
|
-
|
54
|
-
profile.websites # Array of websites
|
55
|
-
|
56
|
-
profile.groups # Array of groups
|
57
|
-
|
58
|
-
profile.languages # Array of languages
|
59
|
-
|
60
|
-
profile.certifications # Array of certifications
|
61
|
-
|
62
|
-
profile.number_of_connections # The number of connections as a string
|
63
|
-
|
64
|
-
|
65
|
-
For current and past companies it also provides the details of the companies like company size, industry, address, etc
|
66
|
-
|
67
|
-
profile.current_companies
|
68
|
-
|
69
|
-
[
|
70
|
-
[0] {
|
71
|
-
:current_company => "LinkedIn",
|
72
|
-
:current_title => "CEO",
|
73
|
-
:current_company_url => "http://www.linkedin.com",
|
74
|
-
:description => nil,
|
75
|
-
:linkedin_company_url => "http://www.linkedin.com/company/linkedin?trk=ppro_cprof",
|
76
|
-
:url => "http://www.linkedin.com",
|
77
|
-
:type => "Public Company",
|
78
|
-
:company_size => "1001-5000 employees",
|
79
|
-
:website => "http://www.linkedin.com",
|
80
|
-
:industry => "Internet",
|
81
|
-
:founded => "2003",
|
82
|
-
:address => "2029 Stierlin Court Mountain View, CA 94043 United States"
|
83
|
-
},
|
84
|
-
[1] {
|
85
|
-
:current_company => "Intuit",
|
86
|
-
:current_title => "Member, Board of Directors",
|
87
|
-
:current_company_url => "http://network.intuit.com/",
|
88
|
-
:description => nil,
|
89
|
-
:linkedin_company_url => "http://www.linkedin.com/company/intuit?trk=ppro_cprof",
|
90
|
-
:url => "http://network.intuit.com/",
|
91
|
-
:type => "Public Company",
|
92
|
-
:company_size => "5001-10,000 employees",
|
93
|
-
:website => "http://network.intuit.com/",
|
94
|
-
:industry => "Computer Software",
|
95
|
-
:founded => "1983",
|
96
|
-
:address => "2632 Marine Way Mountain View, CA 94043 United States"
|
97
|
-
},
|
98
|
-
[2] {
|
99
|
-
:current_company => "DonorsChoose",
|
100
|
-
:current_title => "Member, Board of Directors",
|
101
|
-
:current_company_url => "http://www.donorschoose.org",
|
102
|
-
:description => nil,
|
103
|
-
:linkedin_company_url => "http://www.linkedin.com/company/donorschoose.org?trk=ppro_cprof",
|
104
|
-
:url => "http://www.donorschoose.org",
|
105
|
-
:type => "Nonprofit",
|
106
|
-
:company_size => "51-200 employees",
|
107
|
-
:website => "http://www.donorschoose.org",
|
108
|
-
:industry => "Nonprofit Organization Management",
|
109
|
-
:founded => "2000",
|
110
|
-
:address => "213 West 35th Street 2nd Floor East New York, NY 10001 United States"
|
111
|
-
},
|
112
|
-
[3] {
|
113
|
-
:current_company => "Malaria No More",
|
114
|
-
:current_title => "Member, Board of Directors",
|
115
|
-
:current_company_url => nil,
|
116
|
-
:description => nil
|
117
|
-
},
|
118
|
-
[4] {
|
119
|
-
:current_company => "Venture For America",
|
120
|
-
:current_title => "Member, Advisory Board",
|
121
|
-
:current_company_url => "http://ventureforamerica.org/",
|
122
|
-
:description => nil,
|
123
|
-
:linkedin_company_url => "http://www.linkedin.com/company/venture-for-america?trk=ppro_cprof",
|
124
|
-
:url => "http://ventureforamerica.org/",
|
125
|
-
:type => "Nonprofit",
|
126
|
-
:company_size => "1-10 employees",
|
127
|
-
:website => "http://ventureforamerica.org/",
|
128
|
-
:industry => "Nonprofit Organization Management",
|
129
|
-
:founded => "2011"
|
130
|
-
}
|
131
|
-
]
|
132
|
-
|
133
|
-
|
134
|
-
profile.past_companies
|
135
|
-
[
|
136
|
-
[0] {
|
137
|
-
:past_company => "Accel Partners",
|
138
|
-
:past_title => "Executive in Residence",
|
139
|
-
:past_company_website => "http://www.facebook.com/accel",
|
140
|
-
:description => nil,
|
141
|
-
:linkedin_company_url => "http://www.linkedin.com/company/accel-partners?trk=ppro_cprof",
|
142
|
-
:url => "http://www.facebook.com/accel",
|
143
|
-
:type => "Partnership",
|
144
|
-
:company_size => "51-200 employees",
|
145
|
-
:website => "http://www.facebook.com/accel",
|
146
|
-
:industry => "Venture Capital & Private Equity",
|
147
|
-
:address => "428 University Palo Alto, CA 94301 United States"
|
148
|
-
},
|
149
|
-
[1] {
|
150
|
-
:past_company => "Greylock",
|
151
|
-
:past_title => "Executive in Residence",
|
152
|
-
:past_company_website => "http://www.greylock.com",
|
153
|
-
:description => nil,
|
154
|
-
:linkedin_company_url => "http://www.linkedin.com/company/greylock-partners?trk=ppro_cprof",
|
155
|
-
:url => "http://www.greylock.com",
|
156
|
-
:type => "Partnership",
|
157
|
-
:company_size => "51-200 employees",
|
158
|
-
:website => "http://www.greylock.com",
|
159
|
-
:industry => "Venture Capital & Private Equity",
|
160
|
-
:address => "2550 Sand Hill Road Menlo Park, CA 94025 United States"
|
161
|
-
},
|
162
|
-
[2] {
|
163
|
-
:past_company => "Yahoo!",
|
164
|
-
:past_title => "Executive Vice President Network Division",
|
165
|
-
:past_company_website => "http://www.yahoo.com",
|
166
|
-
:description => nil,
|
167
|
-
:linkedin_company_url => "http://www.linkedin.com/company/yahoo?trk=ppro_cprof",
|
168
|
-
:url => "http://www.yahoo.com",
|
169
|
-
:type => "Public Company",
|
170
|
-
:company_size => "10,001+ employees",
|
171
|
-
:website => "http://www.yahoo.com",
|
172
|
-
:industry => "Internet",
|
173
|
-
:founded => "1994",
|
174
|
-
:address => "701 First Avenue Sunnyvale, CA 94089 United States"
|
175
|
-
},
|
176
|
-
[3] {
|
177
|
-
:past_company => "Windsor Media",
|
178
|
-
:past_title => "Founding Partner",
|
179
|
-
:past_company_website => nil,
|
180
|
-
:description => nil
|
181
|
-
},
|
182
|
-
[4] {
|
183
|
-
:past_company => "Warner Bros.",
|
184
|
-
:past_title => "Vice President Online",
|
185
|
-
:past_company_website => "http://www.warnerbros.com/",
|
186
|
-
:description => nil,
|
187
|
-
:linkedin_company_url => "http://www.linkedin.com/company/warner-bros.-entertainment-group-of-companies?trk=ppro_cprof",
|
188
|
-
:url => "http://www.warnerbros.com/",
|
189
|
-
:type => "Public Company",
|
190
|
-
:company_size => "10,001+ employees",
|
191
|
-
:website => "http://www.warnerbros.com/",
|
192
|
-
:industry => "Entertainment",
|
193
|
-
:address => "4000 Warner Boulevard Burbank, CA 91522 United States"
|
194
|
-
}
|
195
|
-
]
|
196
|
-
|
197
|
-
|
198
|
-
profile.recommended_visitors
|
199
|
-
#It is the list of visitors "Viewers of this profile also viewed..."
|
200
|
-
[
|
201
|
-
[0] {
|
202
|
-
:link => "http://www.linkedin.com/in/barackobama?trk=pub-pbmap",
|
203
|
-
:name => "Barack Obama",
|
204
|
-
:title => "President of the United States of ",
|
205
|
-
:company => nil
|
206
|
-
},
|
207
|
-
[1] {
|
208
|
-
:link => "http://www.linkedin.com/in/marissamayer?trk=pub-pbmap",
|
209
|
-
:name => "Marissa Mayer",
|
210
|
-
:title => "Yahoo!, President & CEO",
|
211
|
-
:company => nil
|
212
|
-
},
|
213
|
-
[2] {
|
214
|
-
:link => "http://www.linkedin.com/pub/sean-parker/0/1/826?trk=pub-pbmap",
|
215
|
-
:name => "Sean Parker",
|
216
|
-
:title => nil,
|
217
|
-
:company => nil
|
218
|
-
},
|
219
|
-
[3] {
|
220
|
-
:link => "http://www.linkedin.com/pub/eduardo-saverin/0/70a/31b?trk=pub-pbmap",
|
221
|
-
:name => "Eduardo Saverin",
|
222
|
-
:title => nil,
|
223
|
-
:company => nil
|
224
|
-
},
|
225
|
-
[4] {
|
226
|
-
:link => "http://www.linkedin.com/in/rbranson?trk=pub-pbmap",
|
227
|
-
:name => "Richard Branson",
|
228
|
-
:title => "Founder",
|
229
|
-
:company => "Virgin Group"
|
230
|
-
},
|
231
|
-
[5] {
|
232
|
-
:link => "http://www.linkedin.com/in/reidhoffman?trk=pub-pbmap",
|
233
|
-
:name => "Reid Hoffman",
|
234
|
-
:title => "Entrepreneur. Product Strategist. ",
|
235
|
-
:company => nil
|
236
|
-
},
|
237
|
-
[6] {
|
238
|
-
:link => "http://www.linkedin.com/in/mdell?trk=pub-pbmap",
|
239
|
-
:name => "Michael Dell",
|
240
|
-
:title => "Chairman and CEO",
|
241
|
-
:company => "Dell"
|
242
|
-
},
|
243
|
-
[7] {
|
244
|
-
:link => "http://www.linkedin.com/in/mittromney?trk=pub-pbmap",
|
245
|
-
:name => "Mitt Romney",
|
246
|
-
:title => "Believe in America",
|
247
|
-
:company => nil
|
248
|
-
},
|
249
|
-
[8] {
|
250
|
-
:link => "http://www.linkedin.com/pub/sheryl-sandberg/2/665/512?trk=pub-pbmap",
|
251
|
-
:name => "Sheryl Sandberg",
|
252
|
-
:title => nil,
|
253
|
-
:company => nil
|
254
|
-
}
|
255
|
-
]
|
256
|
-
|
257
|
-
|
258
|
-
The gem also comes with a binary and can be used from the command line to get a json response of the scraped data.
|
259
|
-
It takes the url as the first argument.
|
260
|
-
|
261
|
-
linkedin-scraper http://www.linkedin.com/in/jeffweiner08
|
262
|
-
|
263
|
-
## Contributing
|
264
|
-
|
265
|
-
Bug reports and pull requests are welcome on GitHub at https://github.com/yatish27/linkedin-scraper.
|
266
|
-
This project is intended to be a safe, welcoming space for collaboration, and contributors are expected to adhere to the
|
267
|
-
[Contributor Covenant](contributor-covenant.org) code of conduct.
|
268
|
-
|
269
|
-
|
270
|
-
## License
|
271
|
-
|
272
|
-
The gem is available as open source under the terms of the [MIT License](http://opensource.org/licenses/MIT).
|