woot 0.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/.gitignore ADDED
@@ -0,0 +1,7 @@
1
+ .DS_Store
2
+ *.sw?
3
+ coverage
4
+ lib/.cookie
5
+ rdoc
6
+ pkg
7
+ sandbox
data/MIT-LICENSE ADDED
@@ -0,0 +1,20 @@
1
+ Copyright (c) 2009 Sean Huber (shuber@huberry.com)
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining
4
+ a copy of this software and associated documentation files (the
5
+ "Software"), to deal in the Software without restriction, including
6
+ without limitation the rights to use, copy, modify, merge, publish,
7
+ distribute, sublicense, and/or sell copies of the Software, and to
8
+ permit persons to whom the Software is furnished to do so, subject to
9
+ the following conditions:
10
+
11
+ The above copyright notice and this permission notice shall be
12
+ included in all copies or substantial portions of the Software.
13
+
14
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
16
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
18
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
19
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
20
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.rdoc ADDED
@@ -0,0 +1,40 @@
1
+ = woot
2
+
3
+ Scrapes woot.com sites with Ruby
4
+
5
+ == Installation
6
+
7
+ gem install woot --source http://gemcutter.org
8
+
9
+ == Usage
10
+
11
+ Simply call <tt>Woot.scrape</tt> and optionally specify the woot subdomain (e.g. www, shirt, kids, wine, etc).
12
+ Defaults to www.
13
+
14
+ data = Woot.scrape
15
+ puts data.title
16
+ puts data.price
17
+
18
+ data = Woot.scrape(:shirt)
19
+ puts data.title
20
+
21
+ == Note on Patches/Pull Requests
22
+
23
+ * Fork the project.
24
+ * Make your feature addition or bug fix.
25
+ * Add tests for it. This is important so I don't break it in a
26
+ future version unintentionally.
27
+ * Commit, do not mess with rakefile, version, or history.
28
+ (if you want to have your own version, that is fine but
29
+ bump version in a commit by itself I can ignore when I pull)
30
+ * Send me a pull request. Bonus points for topic branches.
31
+
32
+ == Todo
33
+
34
+ * sellout.woot.com support
35
+ * woot-off quantities
36
+ * build gem
37
+
38
+ == Copyright
39
+
40
+ Copyright (c) 2009 Sean Huber. See MIT-LICENSE for details.
data/Rakefile ADDED
@@ -0,0 +1,57 @@
# Rake tasks for the woot gem: packaging (Jeweler), tests, coverage (RCov)
# and RDoc generation. Optional tools degrade gracefully when not installed.
require 'rubygems'
require 'rake'

# Gem packaging tasks. Jeweler is optional: without it the remaining tasks
# still load and only a hint is printed.
begin
  require 'jeweler'
  Jeweler::Tasks.new do |gem|
    gem.name = 'woot'
    gem.summary = 'Scrapes woot.com sites'
    gem.description = 'Scrapes woot.com sites'
    gem.email = 'shuber@huberry.com'
    gem.homepage = 'http://github.com/shuber/woot'
    gem.authors = ['Sean Huber']
    gem.add_dependency 'scrapi'
    gem.add_development_dependency 'shoulda'
    # gem is a Gem::Specification... see http://www.rubygems.org/read/chapter/20 for additional settings
  end
rescue LoadError
  puts 'Jeweler (or a dependency) not available. Install it with: sudo gem install jeweler'
end

# Unit tests: every test/**/*_test.rb file, with lib/ and test/ on the load path.
require 'rake/testtask'
Rake::TestTask.new(:test) do |test|
  test.libs << 'lib' << 'test'
  test.pattern = 'test/**/*_test.rb'
  test.verbose = true
end

# Coverage report. When RCov is missing, the :rcov task still exists but
# aborts with installation instructions.
begin
  require 'rcov/rcovtask'
  Rcov::RcovTask.new do |test|
    test.libs << 'test'
    test.pattern = 'test/**/*_test.rb'
    test.verbose = true
  end
rescue LoadError
  task :rcov do
    abort 'RCov is not available. In order to run rcov, you must: sudo gem install spicycode-rcov'
  end
end

# :check_dependencies is not defined anywhere in this Rakefile (presumably it
# comes from Jeweler::Tasks -- confirm). Only hook it in when it exists, so
# `rake test` keeps working when Jeweler could not be loaded.
task :test => :check_dependencies if Rake::Task.task_defined?(:check_dependencies)

task :default => :test

# RDoc generation. Prefer the task shipped with RDoc itself; fall back to the
# legacy Rake location for old toolchains that do not provide rdoc/task.
begin
  require 'rdoc/task'
  rdoc_task_class = RDoc::Task
rescue LoadError
  require 'rake/rdoctask'
  rdoc_task_class = Rake::RDocTask
end

rdoc_task_class.new do |rdoc|
  # Strip the trailing newline of the VERSION file so it does not end up in the title.
  version = File.exist?('VERSION') ? File.read('VERSION').strip : ''

  rdoc.rdoc_dir = 'rdoc'
  rdoc.title = "woot #{version}"
  rdoc.rdoc_files.include('README*')
  rdoc.rdoc_files.include('lib/**/*.rb')
end
data/VERSION ADDED
@@ -0,0 +1 @@
1
+ 0.0.0
data/init.rb ADDED
@@ -0,0 +1 @@
1
+ require 'woot'
data/lib/woot.rb ADDED
@@ -0,0 +1,33 @@
require 'uri'

# Scrapes the current deal from a woot.com site (www, shirt, kids, wine, ...).
#
#   data = Woot.scrape(:shirt)
#   puts data.title
class Woot
  DOMAIN = 'woot.com'

  # Fetches http://<subdomain>.woot.com/ and extracts every attribute declared
  # in Woot.selectors.
  #
  # subdomain - Symbol or String naming the woot site (default: :www).
  #
  # Returns the object built by the scraper's +result+ declaration, exposing
  # one value per attribute name listed in Woot.selectors.
  def self.scrape(subdomain = :www)
    # Loaded on first use so that Woot.selectors stays usable without scrapi,
    # and so that callers who only `require 'woot'` do not hit a NameError.
    require 'scrapi'

    # Locals (not method calls) because the block handed to Scraper.define
    # runs against the scraper being defined, not against Woot.
    mapping = selectors(subdomain)
    attribute_names = mapping.values.map { |results| results.keys }.flatten

    scraper = Scraper.define do
      mapping.each { |pattern, results| process pattern, results }
      result(*attribute_names)
    end

    scraper.scrape(URI.parse("http://#{subdomain}.#{DOMAIN}/"))
  end

  # Builds the scraping rules for a woot site.
  #
  # subdomain - Symbol or String used as the host prefix when rebuilding the
  #             purchase URL (default: :www).
  #
  # Returns a fresh Hash mapping a CSS selector String to a Hash of
  # { attribute name Symbol => extractor }, where the extractor is :text,
  # an '@attribute' String, or a proc receiving the matched element.
  def self.selectors(subdomain = :www)
    {
      'h2.fn' => { :title => :text },
      'span.amount' => { :price => :text },
      'ul#shippingOptions' => { :shipping => :text },
      'img.photo' => { :image => '@src' },
      # The href wraps the image URL in a call of the form ...('URL'); -- pull
      # out the quoted URL, or nil when href is missing or has another shape.
      'div.hproduct>a' => { :alternate_image => proc { |element| element.attributes['href'].to_s[/\('([^']+)'\);/, 1] } },
      'a.url' => { :url => '@href' },
      # Keep only the digits of the link's first child node content.
      'li.comments>a' => { :comments_url => '@href', :comments_count => proc { |element| element.children[0].content.gsub(/\D/, '') } },
      'div.story>h2' => { :header => :text },
      'div.story>h3' => { :sub_header => :text },
      'div.writeUp' => { :writeup => :text },
      'div.specs' => { :specs => :text },
      'div.productDescription>dl' => { :details => :text },
      'a#ctl00_ctl00_ContentPlaceHolderLeadIn_ContentPlaceHolderLeadIn_SaleControl_HyperLinkWantOne' => { :purchase_url => proc do |element|
        href = element.attributes['href']
        # Drop any scheme and host (only at the very start of the string) and
        # re-root the path on the requested subdomain; nil when there is no href.
        "http://#{subdomain}.#{DOMAIN}#{href.sub(%r{\Ahttps?://[^/]+}, '')}" if href
      end }
    }
  end
end
data/test/test_helper.rb ADDED
@@ -0,0 +1,25 @@
1
+ require 'rubygems'
2
+ require 'test/unit'
3
+ require 'shoulda'
4
+ require 'scrapi'
5
+ Tidy.path = ENV['TIDY_PATH'] if ENV['TIDY_PATH']
6
+
7
+ $LOAD_PATH.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
8
+ $LOAD_PATH.unshift(File.dirname(__FILE__))
9
+ require 'woot'
10
+
# Class-level fixtures shared by every test case in the suite.
class Test::Unit::TestCase
  class << self
    # Every attribute name declared by Woot.selectors (default subdomain), flattened.
    def attributes
      @attributes ||= Woot.selectors.values.map { |results| results.keys }.flatten
    end

    # Attributes that are allowed to come back blank.
    def possible_blank_attributes
      @possible_blank_attributes ||= [:purchase_url]
    end

    # Woot subdomains exercised by the suite.
    def subdomains
      @subdomains ||= [:www, :wine, :shirt, :kids] # TODO: sellout
    end
  end
end
data/test/woot_test.rb ADDED
@@ -0,0 +1,24 @@
require 'test_helper'

# Integration tests for Woot.scrape: for each subdomain listed in the test
# helper, the site is scraped in +setup+ (so these tests need network access)
# and every attribute declared by Woot.selectors is checked on the result.
class WootTest < Test::Unit::TestCase

  subdomains.each do |subdomain|
    context "When parsing http://#{subdomain}.#{Woot::DOMAIN}/ it" do
      setup { @woot = Woot.scrape(subdomain) }

      attributes.each do |attribute|
        should "have a key for #{attribute}" do
          # Member names are compared as strings on both sides: Struct#members
          # returns strings on Ruby 1.8 but symbols on 1.9 and later.
          # NOTE(review): assumes the scrape result is Struct-like -- confirm.
          member_names = @woot.members.map { |member| member.to_s }
          assert member_names.include?(attribute.to_s)
        end

        # Attributes allowed to be blank only need to exist, not to hold a value.
        unless possible_blank_attributes.include?(attribute)
          should "have a value for #{attribute}" do
            value = @woot.send(attribute)
            assert !value.nil?
            assert !value.empty?
          end
        end
      end
    end
  end

end
metadata ADDED
@@ -0,0 +1,83 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: woot
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Sean Huber
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+
12
+ date: 2009-10-30 00:00:00 -07:00
13
+ default_executable:
14
+ dependencies:
15
+ - !ruby/object:Gem::Dependency
16
+ name: scrapi
17
+ type: :runtime
18
+ version_requirement:
19
+ version_requirements: !ruby/object:Gem::Requirement
20
+ requirements:
21
+ - - ">="
22
+ - !ruby/object:Gem::Version
23
+ version: "0"
24
+ version:
25
+ - !ruby/object:Gem::Dependency
26
+ name: shoulda
27
+ type: :development
28
+ version_requirement:
29
+ version_requirements: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ">="
32
+ - !ruby/object:Gem::Version
33
+ version: "0"
34
+ version:
35
+ description: Scrapes woot.com sites
36
+ email: shuber@huberry.com
37
+ executables: []
38
+
39
+ extensions: []
40
+
41
+ extra_rdoc_files:
42
+ - README.rdoc
43
+ files:
44
+ - .gitignore
45
+ - MIT-LICENSE
46
+ - README.rdoc
47
+ - Rakefile
48
+ - VERSION
49
+ - init.rb
50
+ - lib/woot.rb
51
+ - test/test_helper.rb
52
+ - test/woot_test.rb
53
+ has_rdoc: true
54
+ homepage: http://github.com/shuber/woot
55
+ licenses: []
56
+
57
+ post_install_message:
58
+ rdoc_options:
59
+ - --charset=UTF-8
60
+ require_paths:
61
+ - lib
62
+ required_ruby_version: !ruby/object:Gem::Requirement
63
+ requirements:
64
+ - - ">="
65
+ - !ruby/object:Gem::Version
66
+ version: "0"
67
+ version:
68
+ required_rubygems_version: !ruby/object:Gem::Requirement
69
+ requirements:
70
+ - - ">="
71
+ - !ruby/object:Gem::Version
72
+ version: "0"
73
+ version:
74
+ requirements: []
75
+
76
+ rubyforge_project:
77
+ rubygems_version: 1.3.5
78
+ signing_key:
79
+ specification_version: 3
80
+ summary: Scrapes woot.com sites
81
+ test_files:
82
+ - test/test_helper.rb
83
+ - test/woot_test.rb