rdig 0.3.8 → 0.3.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
metadata
CHANGED
|
@@ -1,13 +1,12 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: rdig
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
|
|
5
|
-
prerelease:
|
|
4
|
+
prerelease: false
|
|
6
5
|
segments:
|
|
7
6
|
- 0
|
|
8
7
|
- 3
|
|
9
|
-
- 8
|
|
10
|
-
version: 0.3.8
|
|
8
|
+
- 9
|
|
9
|
+
version: 0.3.9
|
|
11
10
|
platform: ruby
|
|
12
11
|
authors:
|
|
13
12
|
- Jens Kraemer
|
|
@@ -22,11 +21,9 @@ dependencies:
|
|
|
22
21
|
name: ferret
|
|
23
22
|
prerelease: false
|
|
24
23
|
requirement: &id001 !ruby/object:Gem::Requirement
|
|
25
|
-
none: false
|
|
26
24
|
requirements:
|
|
27
25
|
- - ">="
|
|
28
26
|
- !ruby/object:Gem::Version
|
|
29
|
-
hash: 63
|
|
30
27
|
segments:
|
|
31
28
|
- 0
|
|
32
29
|
- 11
|
|
@@ -38,11 +35,9 @@ dependencies:
|
|
|
38
35
|
name: hpricot
|
|
39
36
|
prerelease: false
|
|
40
37
|
requirement: &id002 !ruby/object:Gem::Requirement
|
|
41
|
-
none: false
|
|
42
38
|
requirements:
|
|
43
39
|
- - ">="
|
|
44
40
|
- !ruby/object:Gem::Version
|
|
45
|
-
hash: 7
|
|
46
41
|
segments:
|
|
47
42
|
- 0
|
|
48
43
|
- 6
|
|
@@ -53,11 +48,9 @@ dependencies:
|
|
|
53
48
|
name: htmlentities
|
|
54
49
|
prerelease: false
|
|
55
50
|
requirement: &id003 !ruby/object:Gem::Requirement
|
|
56
|
-
none: false
|
|
57
51
|
requirements:
|
|
58
52
|
- - ">="
|
|
59
53
|
- !ruby/object:Gem::Version
|
|
60
|
-
hash: 63
|
|
61
54
|
segments:
|
|
62
55
|
- 4
|
|
63
56
|
- 0
|
|
@@ -67,8 +60,8 @@ dependencies:
|
|
|
67
60
|
version_requirements: *id003
|
|
68
61
|
description: Website crawler and fulltext indexer.
|
|
69
62
|
email: jk@jkraemer.net
|
|
70
|
-
executables:
|
|
71
|
-
|
|
63
|
+
executables:
|
|
64
|
+
- rdig
|
|
72
65
|
extensions: []
|
|
73
66
|
|
|
74
67
|
extra_rdoc_files:
|
|
@@ -97,24 +90,6 @@ files:
|
|
|
97
90
|
- lib/rdig/search.rb
|
|
98
91
|
- lib/rdig/url_filters.rb
|
|
99
92
|
- lib/rdig.rb
|
|
100
|
-
- test/fixtures/html/custom_tag_selectors.html
|
|
101
|
-
- test/fixtures/html/entities.html
|
|
102
|
-
- test/fixtures/html/frameset.html
|
|
103
|
-
- test/fixtures/html/imagemap.html
|
|
104
|
-
- test/fixtures/html/simple.html
|
|
105
|
-
- test/fixtures/pdf/simple.pdf
|
|
106
|
-
- test/fixtures/word/simple.doc
|
|
107
|
-
- test/test_helper.rb
|
|
108
|
-
- test/unit/crawler_fs_test.rb
|
|
109
|
-
- test/unit/etag_filter_test.rb
|
|
110
|
-
- test/unit/file_document_test.rb
|
|
111
|
-
- test/unit/hpricot_content_extractor_test.rb
|
|
112
|
-
- test/unit/http_document_test.rb
|
|
113
|
-
- test/unit/pdf_content_extractor_test.rb
|
|
114
|
-
- test/unit/rdig_test.rb
|
|
115
|
-
- test/unit/searcher_test.rb
|
|
116
|
-
- test/unit/url_filters_test.rb
|
|
117
|
-
- test/unit/word_content_extractor_test.rb
|
|
118
93
|
has_rdoc: true
|
|
119
94
|
homepage: http://github.com/jkraemer/rdig/
|
|
120
95
|
licenses: []
|
|
@@ -126,27 +101,23 @@ rdoc_options:
|
|
|
126
101
|
require_paths:
|
|
127
102
|
- lib
|
|
128
103
|
required_ruby_version: !ruby/object:Gem::Requirement
|
|
129
|
-
none: false
|
|
130
104
|
requirements:
|
|
131
105
|
- - ">="
|
|
132
106
|
- !ruby/object:Gem::Version
|
|
133
|
-
hash: 3
|
|
134
107
|
segments:
|
|
135
108
|
- 0
|
|
136
109
|
version: "0"
|
|
137
110
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
138
|
-
none: false
|
|
139
111
|
requirements:
|
|
140
112
|
- - ">="
|
|
141
113
|
- !ruby/object:Gem::Version
|
|
142
|
-
hash: 3
|
|
143
114
|
segments:
|
|
144
115
|
- 0
|
|
145
116
|
version: "0"
|
|
146
117
|
requirements: []
|
|
147
118
|
|
|
148
119
|
rubyforge_project: rdig
|
|
149
|
-
rubygems_version: 1.
|
|
120
|
+
rubygems_version: 1.3.6
|
|
150
121
|
signing_key:
|
|
151
122
|
specification_version: 3
|
|
152
123
|
summary: Crawler and content extractor for building a full text index of a website's contents. Uses Ferret for indexing.
|