microformats2 2.0.0.pre4 → 2.0.0.pre5
Sign up to get free protection for your applications and to get access to all the features.
- data/README.md +2 -2
- data/lib/microformats2.rb +4 -7
- data/lib/microformats2/parser.rb +25 -0
- data/lib/microformats2/version.rb +1 -1
- data/microformats2.gemspec +1 -1
- data/spec/lib/microformats2/parser_spec.rb +41 -0
- data/spec/lib/microformats2_spec.rb +3 -0
- data/spec/spec_helper.rb +1 -0
- metadata +9 -8
data/README.md
CHANGED
@@ -10,7 +10,7 @@ A work in progress.
|
|
10
10
|
|
11
11
|
Implemented:
|
12
12
|
|
13
|
-
* [parsing depth first, doc order](parse_a_document_for_microformats)
|
13
|
+
* [parsing depth first, doc order](http://microformats.org/wiki/microformats2-parsing#parse_a_document_for_microformats)
|
14
14
|
* [parsing a p- property](http://microformats.org/wiki/microformats2-parsing#parsing_a_p-_property)
|
15
15
|
* [parsing a u- property](http://microformats.org/wiki/microformats2-parsing#parsing_a_u-_property)
|
16
16
|
* [parsing a dt- property](http://microformats.org/wiki/microformats2-parsing#parsing_a_dt-_property)
|
@@ -33,7 +33,7 @@ Not Implemented:
|
|
33
33
|
|
34
34
|
## Current Version
|
35
35
|
|
36
|
-
2.0.0.pre4
|
36
|
+
2.0.0.pre5
|
37
37
|
|
38
38
|
|
39
39
|
## Requirements
|
data/lib/microformats2.rb
CHANGED
@@ -4,6 +4,7 @@ require "json"
|
|
4
4
|
require "active_support/inflector"
|
5
5
|
|
6
6
|
require "microformats2/version"
|
7
|
+
require "microformats2/parser"
|
7
8
|
require "microformats2/format_parser"
|
8
9
|
require "microformats2/property_parser"
|
9
10
|
require "microformats2/collection"
|
@@ -22,17 +23,13 @@ require "microformats2/implied_property/url"
|
|
22
23
|
module Microformats2
|
23
24
|
class << self
|
24
25
|
def parse(html)
|
25
|
-
|
26
|
-
document = Nokogiri::HTML(html)
|
27
|
-
Collection.new(document).parse
|
26
|
+
Parser.new.parse(html)
|
28
27
|
end
|
29
28
|
|
30
29
|
def read_html(html)
|
31
|
-
|
32
|
-
rescue Errno::ENOENT, Errno::ENAMETOOLONG => e
|
33
|
-
html
|
30
|
+
Parser.new.read_html(html)
|
34
31
|
end
|
35
32
|
end # class << self
|
36
33
|
|
37
34
|
class InvalidPropertyPrefix < StandardError; end
|
38
|
-
end
|
35
|
+
end
|
@@ -0,0 +1,25 @@
|
|
1
|
+
module Microformats2
|
2
|
+
class Parser
|
3
|
+
attr_reader :http_headers, :http_body
|
4
|
+
|
5
|
+
def initialize
|
6
|
+
@http_headers = {}
|
7
|
+
end
|
8
|
+
|
9
|
+
def parse(html, headers={})
|
10
|
+
html = read_html(html, headers)
|
11
|
+
document = Nokogiri::HTML(html)
|
12
|
+
Collection.new(document).parse
|
13
|
+
end
|
14
|
+
|
15
|
+
def read_html(html, headers={})
|
16
|
+
open(html, headers) do |response|
|
17
|
+
@http_headers = response.meta if response.respond_to?(:meta)
|
18
|
+
@http_body = response.read
|
19
|
+
end
|
20
|
+
@http_body
|
21
|
+
rescue Errno::ENOENT, Errno::ENAMETOOLONG => e
|
22
|
+
@http_body = html
|
23
|
+
end
|
24
|
+
end
|
25
|
+
end
|
data/microformats2.gemspec
CHANGED
@@ -26,5 +26,5 @@ Gem::Specification.new do |gem|
|
|
26
26
|
gem.add_development_dependency "guard-rspec", "~> 2.1.0"
|
27
27
|
gem.add_development_dependency "rb-fsevent", "~> 0.9.1"
|
28
28
|
gem.add_development_dependency "simplecov", "~> 0.7.1"
|
29
|
-
gem.add_development_dependency "
|
29
|
+
gem.add_development_dependency "webmock", "~> 1.12.3"
|
30
30
|
end
|
@@ -0,0 +1,41 @@
|
|
1
|
+
require "spec_helper"
|
2
|
+
require "microformats2"
|
3
|
+
|
4
|
+
describe Microformats2::Parser do
|
5
|
+
let(:parser) { Microformats2::Parser.new }
|
6
|
+
|
7
|
+
describe "#http_headers" do
|
8
|
+
it "starts as a blank hash" do
|
9
|
+
parser.http_headers.should eq({})
|
10
|
+
end
|
11
|
+
|
12
|
+
describe "open file" do
|
13
|
+
before do
|
14
|
+
parser.parse("spec/support/lib/microformats2/simple.html")
|
15
|
+
end
|
16
|
+
|
17
|
+
it "doesn't save #http_headers" do
|
18
|
+
parser.http_headers.should eq({})
|
19
|
+
end
|
20
|
+
it "saves #http_body" do
|
21
|
+
parser.http_body.should include "<!DOCTYPE html>"
|
22
|
+
end
|
23
|
+
end
|
24
|
+
|
25
|
+
describe "http response" do
|
26
|
+
before do
|
27
|
+
stub_request(:get, "http://www.example.com/").
|
28
|
+
with(:headers => {"Accept"=>"*/*", "User-Agent"=>"Ruby"}).
|
29
|
+
to_return(:status => 200, :body => "abc", :headers => {"Content-Length" => 3})
|
30
|
+
parser.parse("http://www.example.com")
|
31
|
+
end
|
32
|
+
|
33
|
+
it "saves #http_headers" do
|
34
|
+
parser.http_headers.should eq({"content-length" => "3"})
|
35
|
+
end
|
36
|
+
it "saves #http_body" do
|
37
|
+
parser.http_body.should eq("abc")
|
38
|
+
end
|
39
|
+
end
|
40
|
+
end
|
41
|
+
end
|
@@ -23,6 +23,9 @@ describe Microformats2 do
|
|
23
23
|
Microformats2.read_html(html).should include "<div class=\"h-card\">"
|
24
24
|
end
|
25
25
|
it "can be a url to html" do
|
26
|
+
stub_request(:get, "http://google.com/").
|
27
|
+
with(:headers => {'Accept'=>'*/*', 'User-Agent'=>'Ruby'}).
|
28
|
+
to_return(:status => 200, :body => "google", :headers => {})
|
26
29
|
html = "http://google.com"
|
27
30
|
Microformats2.read_html(html).should include "google"
|
28
31
|
end
|
data/spec/spec_helper.rb
CHANGED
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: microformats2
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 2.0.0.pre4
|
4
|
+
version: 2.0.0.pre5
|
5
5
|
prerelease: 6
|
6
6
|
platform: ruby
|
7
7
|
authors:
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date: 2013-
|
12
|
+
date: 2013-07-02 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: nokogiri
|
@@ -140,13 +140,13 @@ dependencies:
|
|
140
140
|
- !ruby/object:Gem::Version
|
141
141
|
version: 0.7.1
|
142
142
|
- !ruby/object:Gem::Dependency
|
143
|
-
name:
|
143
|
+
name: webmock
|
144
144
|
requirement: !ruby/object:Gem::Requirement
|
145
145
|
none: false
|
146
146
|
requirements:
|
147
147
|
- - ~>
|
148
148
|
- !ruby/object:Gem::Version
|
149
|
-
version: 1.
|
149
|
+
version: 1.12.3
|
150
150
|
type: :development
|
151
151
|
prerelease: false
|
152
152
|
version_requirements: !ruby/object:Gem::Requirement
|
@@ -154,7 +154,7 @@ dependencies:
|
|
154
154
|
requirements:
|
155
155
|
- - ~>
|
156
156
|
- !ruby/object:Gem::Version
|
157
|
-
version: 1.
|
157
|
+
version: 1.12.3
|
158
158
|
description: parses HTML for microformats and return a collection of dynamically defined
|
159
159
|
Ruby objects
|
160
160
|
email:
|
@@ -179,6 +179,7 @@ files:
|
|
179
179
|
- lib/microformats2/implied_property/name.rb
|
180
180
|
- lib/microformats2/implied_property/photo.rb
|
181
181
|
- lib/microformats2/implied_property/url.rb
|
182
|
+
- lib/microformats2/parser.rb
|
182
183
|
- lib/microformats2/property.rb
|
183
184
|
- lib/microformats2/property/date_time.rb
|
184
185
|
- lib/microformats2/property/embedded.rb
|
@@ -192,6 +193,7 @@ files:
|
|
192
193
|
- spec/lib/microformats2/implied_property/name_spec.rb
|
193
194
|
- spec/lib/microformats2/implied_property/photo_spec.rb
|
194
195
|
- spec/lib/microformats2/implied_property/url_spec.rb
|
196
|
+
- spec/lib/microformats2/parser_spec.rb
|
195
197
|
- spec/lib/microformats2_spec.rb
|
196
198
|
- spec/spec_helper.rb
|
197
199
|
- spec/support/cases/microformat2-node.jit.su/h-adr/h-adr-0.html
|
@@ -371,9 +373,6 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
371
373
|
- - ! '>='
|
372
374
|
- !ruby/object:Gem::Version
|
373
375
|
version: '0'
|
374
|
-
segments:
|
375
|
-
- 0
|
376
|
-
hash: 2813270681629112276
|
377
376
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
378
377
|
none: false
|
379
378
|
requirements:
|
@@ -391,6 +390,7 @@ test_files:
|
|
391
390
|
- spec/lib/microformats2/implied_property/name_spec.rb
|
392
391
|
- spec/lib/microformats2/implied_property/photo_spec.rb
|
393
392
|
- spec/lib/microformats2/implied_property/url_spec.rb
|
393
|
+
- spec/lib/microformats2/parser_spec.rb
|
394
394
|
- spec/lib/microformats2_spec.rb
|
395
395
|
- spec/spec_helper.rb
|
396
396
|
- spec/support/cases/microformat2-node.jit.su/h-adr/h-adr-0.html
|
@@ -558,3 +558,4 @@ test_files:
|
|
558
558
|
- spec/support/lib/microformats2/nested-property.js
|
559
559
|
- spec/support/lib/microformats2/simple.html
|
560
560
|
- spec/support/lib/microformats2/simple.js
|
561
|
+
has_rdoc:
|