olek-libcraigscrape 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (70)
  1. data/CHANGELOG +94 -0
  2. data/COPYING +674 -0
  3. data/COPYING.LESSER +165 -0
  4. data/README +89 -0
  5. data/Rakefile +125 -0
  6. data/bin/craig_report_schema.yml +68 -0
  7. data/bin/craigwatch +581 -0
  8. data/bin/report_mailer/craigslist_report.html.erb +17 -0
  9. data/bin/report_mailer/craigslist_report.plain.erb +18 -0
  10. data/lib/geo_listings.rb +144 -0
  11. data/lib/libcraigscrape.rb +217 -0
  12. data/lib/listings.rb +160 -0
  13. data/lib/posting.rb +324 -0
  14. data/lib/scraper.rb +212 -0
  15. data/test/geolisting_samples/geo_listing_ca070209.html +76 -0
  16. data/test/geolisting_samples/geo_listing_ca_sk070209.html +31 -0
  17. data/test/geolisting_samples/geo_listing_cn070209.html +35 -0
  18. data/test/geolisting_samples/geo_listing_us070209.html +355 -0
  19. data/test/geolisting_samples/hierarchy_test071009/index.html +31 -0
  20. data/test/geolisting_samples/hierarchy_test071009/us/fl/ft%20myers%20%5C/%20SW%20florida/index.html +46 -0
  21. data/test/geolisting_samples/hierarchy_test071009/us/fl/ft%20myers%20%5C/index.html +46 -0
  22. data/test/geolisting_samples/hierarchy_test071009/us/fl/index.html +46 -0
  23. data/test/geolisting_samples/hierarchy_test071009/us/fl/miami/index.html +46 -0
  24. data/test/geolisting_samples/hierarchy_test071009/us/fl/miami/nonsense/index.html +46 -0
  25. data/test/geolisting_samples/hierarchy_test071009/us/fl/miami/nonsense/more-nonsense/index.html +46 -0
  26. data/test/geolisting_samples/hierarchy_test071009/us/fl/nonexist/index.html +46 -0
  27. data/test/geolisting_samples/hierarchy_test071009/us/fl/nonsense/index.html +46 -0
  28. data/test/geolisting_samples/hierarchy_test071009/us/fl/south%20florida/index.html +46 -0
  29. data/test/geolisting_samples/hierarchy_test071009/us/index.html +355 -0
  30. data/test/google.html +8 -0
  31. data/test/libcraigscrape_test_helpers.rb +37 -0
  32. data/test/listing_samples/category_output.html +231 -0
  33. data/test/listing_samples/category_output_2.html +217 -0
  34. data/test/listing_samples/empty_listings.html +128 -0
  35. data/test/listing_samples/fortmyers_art_index.060909/1046596324.html +93 -0
  36. data/test/listing_samples/fortmyers_art_index.060909/1053085283.html +92 -0
  37. data/test/listing_samples/fortmyers_art_index.060909/1112522674.html +89 -0
  38. data/test/listing_samples/fortmyers_art_index.060909/823516079.html +92 -0
  39. data/test/listing_samples/fortmyers_art_index.060909/825684735.html +89 -0
  40. data/test/listing_samples/fortmyers_art_index.060909/891513957.html +94 -0
  41. data/test/listing_samples/fortmyers_art_index.060909/897549505.html +99 -0
  42. data/test/listing_samples/fortmyers_art_index.060909/960826026.html +89 -0
  43. data/test/listing_samples/fortmyers_art_index.060909/993256300.html +89 -0
  44. data/test/listing_samples/fortmyers_art_index.060909/fortmyers_art_index500.060909.html +237 -0
  45. data/test/listing_samples/fortmyers_art_index.060909/fortmyers_art_index600.060909.html +132 -0
  46. data/test/listing_samples/long_search_output.html +137 -0
  47. data/test/listing_samples/mia_fua_index8900.5.21.09.html +226 -0
  48. data/test/listing_samples/mia_search_kitten.3.15.10.html +149 -0
  49. data/test/listing_samples/miami_search_sss_rack.6.18.09/miami_search_sss_rack1000.6.18.09.html +144 -0
  50. data/test/listing_samples/miami_search_sss_rack.6.18.09/miami_search_sss_rack900.6.18.09.html +146 -0
  51. data/test/listing_samples/new_listing_span.4.17.10.html +769 -0
  52. data/test/listing_samples/short_search_output.html +133 -0
  53. data/test/post_samples/1207457727.html +92 -0
  54. data/test/post_samples/brw_reb_1224008903.html +101 -0
  55. data/test/post_samples/posting0.html +91 -0
  56. data/test/post_samples/posting1.html +106 -0
  57. data/test/post_samples/posting1796890756-061710.html +2318 -0
  58. data/test/post_samples/posting1808219423.html +2473 -0
  59. data/test/post_samples/posting1938291834-090610.html +188 -0
  60. data/test/post_samples/posting2.html +107 -0
  61. data/test/post_samples/posting3.html +92 -0
  62. data/test/post_samples/posting4.html +993 -0
  63. data/test/post_samples/posting5.html +38 -0
  64. data/test/post_samples/sfbay_art_1223614914.html +94 -0
  65. data/test/post_samples/this_post_has_been_deleted_by_its_author.html +37 -0
  66. data/test/post_samples/this_post_has_expired.html +48 -0
  67. data/test/test_craigslist_geolisting.rb +521 -0
  68. data/test/test_craigslist_listing.rb +362 -0
  69. data/test/test_craigslist_posting.rb +426 -0
  70. metadata +273 -0
metadata ADDED
@@ -0,0 +1,273 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: olek-libcraigscrape
3
+ version: !ruby/object:Gem::Version
4
+ hash: 21
5
+ prerelease:
6
+ segments:
7
+ - 1
8
+ - 0
9
+ - 1
10
+ version: 1.0.1
11
+ platform: ruby
12
+ authors:
13
+ - Chris DeRose, DeRose Technologies, Inc.
14
+ autorequire:
15
+ bindir: bin
16
+ cert_chain: []
17
+
18
+ date: 2011-07-02 00:00:00 -04:00
19
+ default_executable:
20
+ dependencies:
21
+ - !ruby/object:Gem::Dependency
22
+ name: nokogiri
23
+ prerelease: false
24
+ requirement: &id001 !ruby/object:Gem::Requirement
25
+ none: false
26
+ requirements:
27
+ - - ">="
28
+ - !ruby/object:Gem::Version
29
+ hash: 15
30
+ segments:
31
+ - 1
32
+ - 4
33
+ - 4
34
+ version: 1.4.4
35
+ type: :runtime
36
+ version_requirements: *id001
37
+ - !ruby/object:Gem::Dependency
38
+ name: htmlentities
39
+ prerelease: false
40
+ requirement: &id002 !ruby/object:Gem::Requirement
41
+ none: false
42
+ requirements:
43
+ - - ">="
44
+ - !ruby/object:Gem::Version
45
+ hash: 63
46
+ segments:
47
+ - 4
48
+ - 0
49
+ - 0
50
+ version: 4.0.0
51
+ type: :runtime
52
+ version_requirements: *id002
53
+ - !ruby/object:Gem::Dependency
54
+ name: activesupport
55
+ prerelease: false
56
+ requirement: &id003 !ruby/object:Gem::Requirement
57
+ none: false
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ hash: 3
62
+ segments:
63
+ - 2
64
+ - 3
65
+ - 0
66
+ version: 2.3.0
67
+ - - <
68
+ - !ruby/object:Gem::Version
69
+ hash: 5
70
+ segments:
71
+ - 3
72
+ version: "3"
73
+ type: :runtime
74
+ version_requirements: *id003
75
+ - !ruby/object:Gem::Dependency
76
+ name: activerecord
77
+ prerelease: false
78
+ requirement: &id004 !ruby/object:Gem::Requirement
79
+ none: false
80
+ requirements:
81
+ - - ">="
82
+ - !ruby/object:Gem::Version
83
+ hash: 3
84
+ segments:
85
+ - 2
86
+ - 3
87
+ - 0
88
+ version: 2.3.0
89
+ - - <
90
+ - !ruby/object:Gem::Version
91
+ hash: 5
92
+ segments:
93
+ - 3
94
+ version: "3"
95
+ type: :runtime
96
+ version_requirements: *id004
97
+ - !ruby/object:Gem::Dependency
98
+ name: actionmailer
99
+ prerelease: false
100
+ requirement: &id005 !ruby/object:Gem::Requirement
101
+ none: false
102
+ requirements:
103
+ - - ">="
104
+ - !ruby/object:Gem::Version
105
+ hash: 3
106
+ segments:
107
+ - 2
108
+ - 3
109
+ - 0
110
+ version: 2.3.0
111
+ - - <
112
+ - !ruby/object:Gem::Version
113
+ hash: 5
114
+ segments:
115
+ - 3
116
+ version: "3"
117
+ type: :runtime
118
+ version_requirements: *id005
119
+ - !ruby/object:Gem::Dependency
120
+ name: kwalify
121
+ prerelease: false
122
+ requirement: &id006 !ruby/object:Gem::Requirement
123
+ none: false
124
+ requirements:
125
+ - - ">="
126
+ - !ruby/object:Gem::Version
127
+ hash: 7
128
+ segments:
129
+ - 0
130
+ - 7
131
+ - 2
132
+ version: 0.7.2
133
+ type: :runtime
134
+ version_requirements: *id006
135
+ - !ruby/object:Gem::Dependency
136
+ name: sqlite3
137
+ prerelease: false
138
+ requirement: &id007 !ruby/object:Gem::Requirement
139
+ none: false
140
+ requirements:
141
+ - - ">="
142
+ - !ruby/object:Gem::Version
143
+ hash: 3
144
+ segments:
145
+ - 0
146
+ version: "0"
147
+ type: :runtime
148
+ version_requirements: *id007
149
+ description: quick, easy, craigslist parsing library that takes the monotony out of working with craigslist posts and listings
150
+ email: cderose@derosetechnologies.com
151
+ executables:
152
+ - craigwatch
153
+ extensions: []
154
+
155
+ extra_rdoc_files:
156
+ - README
157
+ - CHANGELOG
158
+ - COPYING
159
+ - COPYING.LESSER
160
+ - bin/craigwatch
161
+ files:
162
+ - lib/libcraigscrape.rb
163
+ - test/post_samples/1207457727.html
164
+ - CHANGELOG
165
+ - COPYING
166
+ - COPYING.LESSER
167
+ - bin/craigwatch
168
+ - bin/craig_report_schema.yml
169
+ - bin/report_mailer/craigslist_report.html.erb
170
+ - bin/report_mailer/craigslist_report.plain.erb
171
+ - test/geolisting_samples/geo_listing_ca070209.html
172
+ - test/geolisting_samples/geo_listing_ca_sk070209.html
173
+ - test/geolisting_samples/geo_listing_cn070209.html
174
+ - test/geolisting_samples/geo_listing_us070209.html
175
+ - test/geolisting_samples/hierarchy_test071009/index.html
176
+ - test/geolisting_samples/hierarchy_test071009/us/fl/ft%20myers%20%5C/%20SW%20florida/index.html
177
+ - test/geolisting_samples/hierarchy_test071009/us/fl/ft%20myers%20%5C/index.html
178
+ - test/geolisting_samples/hierarchy_test071009/us/fl/index.html
179
+ - test/geolisting_samples/hierarchy_test071009/us/fl/miami/index.html
180
+ - test/geolisting_samples/hierarchy_test071009/us/fl/miami/nonsense/index.html
181
+ - test/geolisting_samples/hierarchy_test071009/us/fl/miami/nonsense/more-nonsense/index.html
182
+ - test/geolisting_samples/hierarchy_test071009/us/fl/nonexist/index.html
183
+ - test/geolisting_samples/hierarchy_test071009/us/fl/nonsense/index.html
184
+ - test/geolisting_samples/hierarchy_test071009/us/fl/south%20florida/index.html
185
+ - test/geolisting_samples/hierarchy_test071009/us/index.html
186
+ - test/google.html
187
+ - test/libcraigscrape_test_helpers.rb
188
+ - test/listing_samples/category_output.html
189
+ - test/listing_samples/category_output_2.html
190
+ - test/listing_samples/empty_listings.html
191
+ - test/listing_samples/fortmyers_art_index.060909/1046596324.html
192
+ - test/listing_samples/fortmyers_art_index.060909/1053085283.html
193
+ - test/listing_samples/fortmyers_art_index.060909/1112522674.html
194
+ - test/listing_samples/fortmyers_art_index.060909/823516079.html
195
+ - test/listing_samples/fortmyers_art_index.060909/825684735.html
196
+ - test/listing_samples/fortmyers_art_index.060909/891513957.html
197
+ - test/listing_samples/fortmyers_art_index.060909/897549505.html
198
+ - test/listing_samples/fortmyers_art_index.060909/960826026.html
199
+ - test/listing_samples/fortmyers_art_index.060909/993256300.html
200
+ - test/listing_samples/fortmyers_art_index.060909/fortmyers_art_index500.060909.html
201
+ - test/listing_samples/fortmyers_art_index.060909/fortmyers_art_index600.060909.html
202
+ - test/listing_samples/long_search_output.html
203
+ - test/listing_samples/mia_fua_index8900.5.21.09.html
204
+ - test/listing_samples/mia_search_kitten.3.15.10.html
205
+ - test/listing_samples/miami_search_sss_rack.6.18.09/miami_search_sss_rack1000.6.18.09.html
206
+ - test/listing_samples/miami_search_sss_rack.6.18.09/miami_search_sss_rack900.6.18.09.html
207
+ - test/listing_samples/new_listing_span.4.17.10.html
208
+ - test/listing_samples/short_search_output.html
209
+ - README
210
+ - test/post_samples/brw_reb_1224008903.html
211
+ - test/post_samples/posting0.html
212
+ - test/post_samples/posting1.html
213
+ - test/post_samples/posting1796890756-061710.html
214
+ - test/post_samples/posting1808219423.html
215
+ - test/post_samples/posting1938291834-090610.html
216
+ - test/post_samples/posting2.html
217
+ - test/post_samples/posting3.html
218
+ - test/post_samples/posting4.html
219
+ - test/post_samples/posting5.html
220
+ - test/post_samples/sfbay_art_1223614914.html
221
+ - test/post_samples/this_post_has_been_deleted_by_its_author.html
222
+ - test/post_samples/this_post_has_expired.html
223
+ - test/test_craigslist_geolisting.rb
224
+ - test/test_craigslist_listing.rb
225
+ - test/test_craigslist_posting.rb
226
+ - lib/geo_listings.rb
227
+ - Rakefile
228
+ - lib/listings.rb
229
+ - lib/posting.rb
230
+ - lib/scraper.rb
231
+ has_rdoc: true
232
+ homepage: http://www.derosetechnologies.com/community/libcraigscrape
233
+ licenses: []
234
+
235
+ post_install_message:
236
+ rdoc_options:
237
+ - --quiet
238
+ - --title
239
+ - The libcraigscrape Reference
240
+ - --main
241
+ - README
242
+ - --inline-source
243
+ require_paths:
244
+ - lib
245
+ required_ruby_version: !ruby/object:Gem::Requirement
246
+ none: false
247
+ requirements:
248
+ - - ">="
249
+ - !ruby/object:Gem::Version
250
+ hash: 3
251
+ segments:
252
+ - 0
253
+ version: "0"
254
+ required_rubygems_version: !ruby/object:Gem::Requirement
255
+ none: false
256
+ requirements:
257
+ - - ">="
258
+ - !ruby/object:Gem::Version
259
+ hash: 3
260
+ segments:
261
+ - 0
262
+ version: "0"
263
+ requirements: []
264
+
265
+ rubyforge_project: libcraigwatch
266
+ rubygems_version: 1.6.2
267
+ signing_key:
268
+ specification_version: 3
269
+ summary: quick, easy, craigslist parsing library that takes the monotony out of working with craigslist posts and listings
270
+ test_files:
271
+ - test/test_craigslist_geolisting.rb
272
+ - test/test_craigslist_listing.rb
273
+ - test/test_craigslist_posting.rb