indeed_jobsearch 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 48a417eb30492ea9329635a4fae28b13515f5a00
4
+ data.tar.gz: 0360b731a2836dd40edf76fd8f9b6e5f8176fabc
5
+ SHA512:
6
+ metadata.gz: be27a299b329ff062ad46602140fd81e1c687e5375e0299013e585ecfa9c5f2c8efcf5ce28c59895a67dae28fce1a7388f6b662c69b68f2034922294754f8300
7
+ data.tar.gz: 1c4de759974a4c9fc1ca41826e5ecd2d28dfb4e84c6b183259d35c35600ecf4bdb110f527ca69aa477f0356a2b73a75349e9fb8cab06245fd53ea7cb66662222
data/.gitignore ADDED
@@ -0,0 +1,9 @@
1
+ /.bundle/
2
+ /.yardoc
3
+ /Gemfile.lock
4
+ /_yardoc/
5
+ /coverage/
6
+ /doc/
7
+ /pkg/
8
+ /spec/reports/
9
+ /tmp/
data/.rspec ADDED
@@ -0,0 +1,2 @@
1
+ --format documentation
2
+ --color
data/.travis.yml ADDED
@@ -0,0 +1,3 @@
1
+ language: ruby
2
+ rvm:
3
+ - 2.1.5
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in indeed_jobsearch.gemspec
4
+ gemspec
data/Guardfile ADDED
@@ -0,0 +1,70 @@
1
+ # A sample Guardfile
2
+ # More info at https://github.com/guard/guard#readme
3
+
4
+ ## Uncomment and set this to only include directories you want to watch
5
+ # directories %w(app lib config test spec features) \
6
+ # .select{|d| Dir.exists?(d) ? d : UI.warning("Directory #{d} does not exist")}
7
+
8
+ ## Note: if you are using the `directories` clause above and you are not
9
+ ## watching the project directory ('.'), then you will want to move
10
+ ## the Guardfile to a watched dir and symlink it back, e.g.
11
+ #
12
+ # $ mkdir config
13
+ # $ mv Guardfile config/
14
+ # $ ln -s config/Guardfile .
15
+ #
16
+ # and, you'll have to watch "config/Guardfile" instead of "Guardfile"
17
+
18
+ # Note: The cmd option is now required due to the increasing number of ways
19
+ # rspec may be run, below are examples of the most common uses.
20
+ # * bundler: 'bundle exec rspec'
21
+ # * bundler binstubs: 'bin/rspec'
22
+ # * spring: 'bin/rspec' (This will use spring if running and you have
23
+ # installed the spring binstubs per the docs)
24
+ # * zeus: 'zeus rspec' (requires the server to be started separately)
25
+ # * 'just' rspec: 'rspec'
26
+
guard :rspec, cmd: "bundle exec rspec" do
  require "guard/rspec/dsl"
  dsl = Guard::RSpec::Dsl.new(self)

  # Feel free to open issues for suggestions and improvements

  # RSpec files
  rspec = dsl.rspec
  watch(rspec.spec_helper) { rspec.spec_dir }
  watch(rspec.spec_support) { rspec.spec_dir }
  watch(rspec.spec_files)

  # Ruby files
  ruby = dsl.ruby
  dsl.watch_spec_files_for(ruby.lib_files)

  # Rails files
  rails = dsl.rails(view_extensions: %w[erb haml slim])
  dsl.watch_spec_files_for(rails.app_files)
  dsl.watch_spec_files_for(rails.views)

  # A controller change maps to its routing, controller and acceptance specs.
  watch(rails.controllers) do |match|
    name = match[1]
    [
      "routing/#{name}_routing",
      "controllers/#{name}_controller",
      "acceptance/#{name}"
    ].map { |path| rspec.spec.call(path) }
  end

  # Rails config changes
  watch(rails.spec_helper) { rspec.spec_dir }
  watch(rails.routes) { "#{rspec.spec_dir}/routing" }
  watch(rails.app_controller) { "#{rspec.spec_dir}/controllers" }

  # Capybara features specs
  watch(rails.view_dirs) { |match| rspec.spec.call("features/#{match[1]}") }
  watch(rails.layouts) { |match| rspec.spec.call("features/#{match[1]}") }

  # Turnip features and steps
  watch(%r{^spec/acceptance/(.+)\.feature$})
  watch(%r{^spec/acceptance/steps/(.+)_steps\.rb$}) do |match|
    # Use the first matching feature file, else fall back to the acceptance directory.
    Dir[File.join("**/#{match[1]}.feature")].first || "spec/acceptance"
  end
end
data/README.md ADDED
@@ -0,0 +1,45 @@
1
+ # IndeedJobsearch [![Coverage Status](https://coveralls.io/repos/andrew-carroll/indeed_jobsearch/badge.svg?branch=master&service=github)](https://coveralls.io/github/andrew-carroll/indeed_jobsearch?branch=master) [![Build Status](https://circleci.com/gh/andrew-carroll/indeed_jobsearch.svg?style=shield&circle-token=5f73b0fc84e352ec3c03acb0771526d80326f5b8)](https://circleci.com/gh/andrew-carroll/indeed_jobsearch) [![Code Climate](https://codeclimate.com/github/andrew-carroll/indeed_jobsearch/badges/gpa.svg)](https://codeclimate.com/github/andrew-carroll/indeed_jobsearch)
2
+
3
+ A client library for searching Indeed jobs without using the official API. This has a couple of advantages: it requires no authorization, and it can fetch search results for third-party job ads. If you are looking for a client library for the official API, use [Indeed's official gem](https://github.com/indeedlabs/indeed-ruby) instead.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ ```ruby
10
+ gem 'indeed_jobsearch'
11
+ ```
12
+
13
+ And then execute:
14
+
15
+ $ bundle
16
+
17
+ Or install it yourself as:
18
+
19
+ $ gem install indeed_jobsearch
20
+
21
+ ## Usage
22
+
23
+ ```ruby
24
+ require 'indeed_jobsearch'
25
+ search = IndeedJobsearch::Search.new(job_title, city)
26
+ results = search.page(1) # sends start=10 (page_number * 10); page(0) sends start=0
27
+ ```
28
+
29
+ This will return an array of SearchResult objects with the following readable attributes:
30
+ * Job title
31
+ * Company
32
+ * Location
33
+ * Time the job was posted
34
+ * Time the job was scraped
35
+ * Job URL
36
+
37
+ **Please note that this library does not enforce rate limiting. Please be courteous and limit usage to an appropriate rate.**
38
+
39
+ ## Contributing
40
+
41
+ 1. Fork it ( https://github.com/andrew-carroll/indeed_jobsearch/fork )
42
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
43
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
44
+ 4. Push to the branch (`git push origin my-new-feature`)
45
+ 5. Create a new Pull Request
data/Rakefile ADDED
@@ -0,0 +1 @@
1
+ require "bundler/gem_tasks"
data/bin/console ADDED
@@ -0,0 +1,14 @@
1
+ #!/usr/bin/env ruby
2
+
3
+ require "bundler/setup"
4
+ require "indeed_jobsearch"
5
+
6
+ # You can add fixtures and/or initialization code here to make experimenting
7
+ # with your gem easier. You can also use a different console, if you like.
8
+
9
+ # (If you use this, don't forget to add pry to your Gemfile!)
10
+ # require "pry"
11
+ # Pry.start
12
+
13
+ require "irb"
14
+ IRB.start
data/bin/setup ADDED
@@ -0,0 +1,7 @@
1
+ #!/bin/bash
2
+ set -euo pipefail
3
+ IFS=$'\n\t'
4
+
5
+ bundle install
6
+
7
+ # Do any other automated setup that you need to do here
data/circle.yml ADDED
@@ -0,0 +1,3 @@
1
+ machine:
2
+ ruby:
3
+ version: 2.1.2
@@ -0,0 +1,33 @@
# coding: utf-8
# Put lib/ on the load path so the version constant can be read at build time.
lib = File.expand_path('../lib', __FILE__)
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
require 'indeed_jobsearch/version'

# Gem specification for indeed_jobsearch.
Gem::Specification.new do |spec|
  spec.name          = "indeed_jobsearch"
  spec.version       = IndeedJobsearch::VERSION
  spec.authors       = ["Andrew Carroll"]
  spec.email         = ["mrandrewcarroll@gmail.com"]

  spec.summary       = %q{Unofficial API for searching Indeed jobs.}
  spec.homepage      = "http://github.com/andrew-carroll/indeed_jobsearch"

  # Ship every git-tracked file except tests/specs/features.
  spec.files         = `git ls-files -z`.split("\x0").reject { |f| f.match(%r{^(test|spec|features)/}) }

  # bin/ only holds development scripts (console, setup). Looking for
  # executables in exe/ keeps those scripts from being installed onto the
  # user's PATH as gem commands; bin/setup is a bash script and cannot be
  # loaded through the Ruby wrapper RubyGems generates for executables.
  spec.bindir        = "exe"
  spec.executables   = spec.files.grep(%r{^exe/}) { |f| File.basename(f) }
  spec.require_paths = ["lib"]

  spec.required_ruby_version = '>= 2.1.2'

  # Development-only tooling.
  spec.add_development_dependency "bundler", "~> 1.9"
  spec.add_development_dependency "rake", "~> 10.0"
  spec.add_development_dependency "rspec", "~> 3.3.0"
  spec.add_development_dependency "guard-rspec", "~> 4.6.4"
  spec.add_development_dependency "pry", "~> 0.10.1"
  spec.add_development_dependency "pry-remote", "~> 0.1.8"
  spec.add_development_dependency "pry-nav", "~> 0.2.4"
  spec.add_development_dependency "simplecov", "~> 0.10.0"
  spec.add_development_dependency "coveralls", "~> 0.8.2"

  # Runtime dependencies.
  spec.add_runtime_dependency "mechanize", "~> 2.7.3"
  spec.add_runtime_dependency "activesupport", "~> 4.2.3"
  spec.add_runtime_dependency "retryable", "~> 2.0.2"
end
@@ -0,0 +1,11 @@
1
+ require "mechanize"
2
+ require "indeed_jobsearch/version"
3
+ require "indeed_jobsearch/search"
4
+ require "indeed_jobsearch/search_page"
5
+ require "indeed_jobsearch/search_result"
6
+ require "indeed_jobsearch/search_results_fetcher"
7
+ require "indeed_jobsearch/search_result_node"
8
+
9
+ module IndeedJobsearch
10
+ # Namespace for the gem; its classes are defined in the files required above.
11
+ end
@@ -0,0 +1,12 @@
module IndeedJobsearch
  # A search described by a query string and a location.
  class Search
    attr_reader :query, :location

    # @param query    search terms (the README passes a job title)
    # @param location where to search (the README passes a city)
    def initialize(query, location)
      @query = query
      @location = location
    end

    # Fetches one page of results by delegating to SearchResultsFetcher.
    #
    # @param page_number page index, forwarded to the fetcher unchanged
    # @return whatever SearchResultsFetcher.fetch returns
    def page(page_number)
      SearchResultsFetcher.fetch(@query, @location, page_number)
    end
  end
end
@@ -0,0 +1,19 @@
module IndeedJobsearch
  # Downloads one Indeed results page and wraps each result element.
  class SearchPage
    attr_reader :nodes

    # Performs the HTTP GET immediately through a fresh Mechanize agent and
    # stores one SearchResultNode per element matching the `.result` selector.
    def initialize(query, location, page_number)
      browser = Mechanize.new
      @page = browser.get(query_url(query, location, page_number))
      @nodes = @page.search('.result').map { |element| SearchResultNode.new(element) }
    end

    private

    # Builds the search URL. Query and location are CGI-escaped; the `start`
    # offset sent to the site is page_number * 10.
    def query_url(query, location, page_number)
      escaped_query = CGI.escape(query)
      escaped_location = CGI.escape(location)
      offset = page_number * 10
      "http://www.indeed.com/jobs?q=#{escaped_query}&l=#{escaped_location}&start=#{offset}"
    end
  end
end
@@ -0,0 +1,8 @@
module IndeedJobsearch
  # Read-only record describing a single job posting.
  class SearchResult
    attr_reader :job_title, :company, :location,
                :time_since_posting, :time_scraped, :url

    # All six keyword arguments are required and stored exactly as given.
    def initialize(job_title:, company:, location:, time_since_posting:, time_scraped:, url:)
      @job_title = job_title
      @company = company
      @location = location
      @time_since_posting = time_since_posting
      @time_scraped = time_scraped
      @url = url
    end
  end
end
@@ -0,0 +1,16 @@
module IndeedJobsearch
  # Thin wrapper around one result element that exposes the lookups the
  # fetcher needs.
  class SearchResultNode
    # @param node an object responding to `search(selector)`
    def initialize(node)
      @node = node
    end

    # Returns the whitespace-stripped text of whatever matches `selector`
    # inside the wrapped node.
    def text(selector)
      matches = @node.search(selector)
      matches.text.strip
    end

    # Returns the `href` value of the first element carrying
    # data-tn-element=jobTitle. Raises NoMethodError when no such element
    # (or no href attribute) is present.
    def url
      title_link = @node.search('[data-tn-element=jobTitle]').first
      title_link.attribute('href').value
    end
  end
end
@@ -0,0 +1,23 @@
module IndeedJobsearch
  # Converts one results page into SearchResult objects.
  module SearchResultsFetcher
    # Loads the requested page and builds a SearchResult for each of its nodes.
    #
    # @param query       search terms, passed to SearchPage unchanged
    # @param location    search location, passed to SearchPage unchanged
    # @param page_number page index, passed to SearchPage unchanged
    # @return [Array<SearchResult>] one entry per node on the page
    def self.fetch(query, location, page_number)
      SearchPage.new(query, location, page_number).nodes.map do |node|
        search_result(node)
      end
    end

    # Internal helper: builds a SearchResult from a single result node.
    #
    # A bare `private` keyword does not apply to `def self.` methods, so this
    # helper has always been publicly callable; it is kept that way for
    # backward compatibility rather than pretending to be private.
    #
    # @param node an object responding to `text(selector)` and `url`
    # @return [SearchResult]
    def self.search_result(node)
      SearchResult.new(
        job_title: node.text('.jobtitle'),
        company: node.text('.company'),
        location: node.text('.location'),
        time_since_posting: node.text('.date'),
        time_scraped: Time.now,
        # node.url is appended to the site root as-is.
        url: 'http://www.indeed.com' + node.url
      )
    end
  end
end
@@ -0,0 +1,3 @@
module IndeedJobsearch
  # Gem version string; frozen so the constant cannot be mutated in place.
  VERSION = "0.1.0".freeze
end
metadata ADDED
@@ -0,0 +1,231 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: indeed_jobsearch
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - Andrew Carroll
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2015-08-28 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '1.9'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '1.9'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '10.0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '10.0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: 3.3.0
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: 3.3.0
55
+ - !ruby/object:Gem::Dependency
56
+ name: guard-rspec
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - "~>"
60
+ - !ruby/object:Gem::Version
61
+ version: 4.6.4
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - "~>"
67
+ - !ruby/object:Gem::Version
68
+ version: 4.6.4
69
+ - !ruby/object:Gem::Dependency
70
+ name: pry
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - "~>"
74
+ - !ruby/object:Gem::Version
75
+ version: 0.10.1
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - "~>"
81
+ - !ruby/object:Gem::Version
82
+ version: 0.10.1
83
+ - !ruby/object:Gem::Dependency
84
+ name: pry-remote
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - "~>"
88
+ - !ruby/object:Gem::Version
89
+ version: 0.1.8
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - "~>"
95
+ - !ruby/object:Gem::Version
96
+ version: 0.1.8
97
+ - !ruby/object:Gem::Dependency
98
+ name: pry-nav
99
+ requirement: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - "~>"
102
+ - !ruby/object:Gem::Version
103
+ version: 0.2.4
104
+ type: :development
105
+ prerelease: false
106
+ version_requirements: !ruby/object:Gem::Requirement
107
+ requirements:
108
+ - - "~>"
109
+ - !ruby/object:Gem::Version
110
+ version: 0.2.4
111
+ - !ruby/object:Gem::Dependency
112
+ name: simplecov
113
+ requirement: !ruby/object:Gem::Requirement
114
+ requirements:
115
+ - - "~>"
116
+ - !ruby/object:Gem::Version
117
+ version: 0.10.0
118
+ type: :development
119
+ prerelease: false
120
+ version_requirements: !ruby/object:Gem::Requirement
121
+ requirements:
122
+ - - "~>"
123
+ - !ruby/object:Gem::Version
124
+ version: 0.10.0
125
+ - !ruby/object:Gem::Dependency
126
+ name: coveralls
127
+ requirement: !ruby/object:Gem::Requirement
128
+ requirements:
129
+ - - "~>"
130
+ - !ruby/object:Gem::Version
131
+ version: 0.8.2
132
+ type: :development
133
+ prerelease: false
134
+ version_requirements: !ruby/object:Gem::Requirement
135
+ requirements:
136
+ - - "~>"
137
+ - !ruby/object:Gem::Version
138
+ version: 0.8.2
139
+ - !ruby/object:Gem::Dependency
140
+ name: mechanize
141
+ requirement: !ruby/object:Gem::Requirement
142
+ requirements:
143
+ - - "~>"
144
+ - !ruby/object:Gem::Version
145
+ version: 2.7.3
146
+ type: :runtime
147
+ prerelease: false
148
+ version_requirements: !ruby/object:Gem::Requirement
149
+ requirements:
150
+ - - "~>"
151
+ - !ruby/object:Gem::Version
152
+ version: 2.7.3
153
+ - !ruby/object:Gem::Dependency
154
+ name: activesupport
155
+ requirement: !ruby/object:Gem::Requirement
156
+ requirements:
157
+ - - "~>"
158
+ - !ruby/object:Gem::Version
159
+ version: 4.2.3
160
+ type: :runtime
161
+ prerelease: false
162
+ version_requirements: !ruby/object:Gem::Requirement
163
+ requirements:
164
+ - - "~>"
165
+ - !ruby/object:Gem::Version
166
+ version: 4.2.3
167
+ - !ruby/object:Gem::Dependency
168
+ name: retryable
169
+ requirement: !ruby/object:Gem::Requirement
170
+ requirements:
171
+ - - "~>"
172
+ - !ruby/object:Gem::Version
173
+ version: 2.0.2
174
+ type: :runtime
175
+ prerelease: false
176
+ version_requirements: !ruby/object:Gem::Requirement
177
+ requirements:
178
+ - - "~>"
179
+ - !ruby/object:Gem::Version
180
+ version: 2.0.2
181
+ description:
182
+ email:
183
+ - mrandrewcarroll@gmail.com
184
+ executables:
185
+ - console
186
+ - setup
187
+ extensions: []
188
+ extra_rdoc_files: []
189
+ files:
190
+ - ".gitignore"
191
+ - ".rspec"
192
+ - ".travis.yml"
193
+ - Gemfile
194
+ - Guardfile
195
+ - README.md
196
+ - Rakefile
197
+ - bin/console
198
+ - bin/setup
199
+ - circle.yml
200
+ - indeed_jobsearch.gemspec
201
+ - lib/indeed_jobsearch.rb
202
+ - lib/indeed_jobsearch/search.rb
203
+ - lib/indeed_jobsearch/search_page.rb
204
+ - lib/indeed_jobsearch/search_result.rb
205
+ - lib/indeed_jobsearch/search_result_node.rb
206
+ - lib/indeed_jobsearch/search_results_fetcher.rb
207
+ - lib/indeed_jobsearch/version.rb
208
+ homepage: http://github.com/andrew-carroll/indeed_jobsearch
209
+ licenses: []
210
+ metadata: {}
211
+ post_install_message:
212
+ rdoc_options: []
213
+ require_paths:
214
+ - lib
215
+ required_ruby_version: !ruby/object:Gem::Requirement
216
+ requirements:
217
+ - - ">="
218
+ - !ruby/object:Gem::Version
219
+ version: 2.1.2
220
+ required_rubygems_version: !ruby/object:Gem::Requirement
221
+ requirements:
222
+ - - ">="
223
+ - !ruby/object:Gem::Version
224
+ version: '0'
225
+ requirements: []
226
+ rubyforge_project:
227
+ rubygems_version: 2.2.2
228
+ signing_key:
229
+ specification_version: 4
230
+ summary: Unofficial API for searching Indeed jobs.
231
+ test_files: []