xapian-indexer 1.2.3.1 → 1.2.3.2

Sign up to get free protection for your applications and to get access to all the features.
@@ -95,7 +95,12 @@ module Xapian
95
95
  html.search("form").remove
96
96
  html.css('.noindex').remove
97
97
 
98
- result[:content] = html.at('html/body').inner_text
98
+
99
+ body = html.at('html/body')
100
+
101
+ if body
102
+ result[:content] = body.inner_text.gsub(/\s+/, " ")
103
+ end
99
104
 
100
105
  return result
101
106
  end
@@ -135,7 +135,6 @@ module Xapian
135
135
  @database.replace_document(resource.name_digest, doc)
136
136
  else
137
137
  @logger.warn "Resource was not indexable #{resource.name}!"
138
- @logger.warn "Links = #{(fetch.links || []).map(&block).compact.inspect}"
139
138
  end
140
139
  else
141
140
  @logger.warn "Could not fetch resource #{resource.name}!"
@@ -19,7 +19,7 @@ module Xapian
19
19
  MAJOR = 1
20
20
  MINOR = 2
21
21
  TINY = 3
22
- REV = 1
22
+ REV = 2
23
23
 
24
24
  STRING = [MAJOR, MINOR, TINY, REV].join('.')
25
25
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: xapian-indexer
3
3
  version: !ruby/object:Gem::Version
4
- hash: 65
4
+ hash: 71
5
5
  prerelease: false
6
6
  segments:
7
7
  - 1
8
8
  - 2
9
9
  - 3
10
- - 1
11
- version: 1.2.3.1
10
+ - 2
11
+ version: 1.2.3.2
12
12
  platform: ruby
13
13
  authors:
14
14
  - Samuel Williams
@@ -16,10 +16,23 @@ autorequire:
16
16
  bindir: bin
17
17
  cert_chain: []
18
18
 
19
- date: 2010-12-19 00:00:00 +13:00
19
+ date: 2010-12-22 00:00:00 +13:00
20
20
  default_executable:
21
- dependencies: []
22
-
21
+ dependencies:
22
+ - !ruby/object:Gem::Dependency
23
+ name: xapian-core
24
+ prerelease: false
25
+ requirement: &id001 !ruby/object:Gem::Requirement
26
+ none: false
27
+ requirements:
28
+ - - ">="
29
+ - !ruby/object:Gem::Version
30
+ hash: 3
31
+ segments:
32
+ - 0
33
+ version: "0"
34
+ type: :runtime
35
+ version_requirements: *id001
23
36
  description:
24
37
  email: samuel.williams@oriontransfer.co.nz
25
38
  executables: []
@@ -69,6 +82,6 @@ rubyforge_project:
69
82
  rubygems_version: 1.3.7
70
83
  signing_key:
71
84
  specification_version: 3
72
- summary: Xapian is a framework for fast full-text searching.
85
+ summary: Xapian::Indexer provides a flexible spider for indexing resources.
73
86
  test_files: []
74
87