xapian-indexer 1.2.3.1 → 1.2.3.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -95,7 +95,12 @@ module Xapian
95
95
  html.search("form").remove
96
96
  html.css('.noindex').remove
97
97
 
98
- result[:content] = html.at('html/body').inner_text
98
+
99
+ body = html.at('html/body')
100
+
101
+ if body
102
+ result[:content] = body.inner_text.gsub(/\s+/, " ")
103
+ end
99
104
 
100
105
  return result
101
106
  end
@@ -135,7 +135,6 @@ module Xapian
135
135
  @database.replace_document(resource.name_digest, doc)
136
136
  else
137
137
  @logger.warn "Resource was not indexable #{resource.name}!"
138
- @logger.warn "Links = #{(fetch.links || []).map(&block).compact.inspect}"
139
138
  end
140
139
  else
141
140
  @logger.warn "Could not fetch resource #{resource.name}!"
@@ -19,7 +19,7 @@ module Xapian
19
19
  MAJOR = 1
20
20
  MINOR = 2
21
21
  TINY = 3
22
- REV = 1
22
+ REV = 2
23
23
 
24
24
  STRING = [MAJOR, MINOR, TINY, REV].join('.')
25
25
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: xapian-indexer
3
3
  version: !ruby/object:Gem::Version
4
- hash: 65
4
+ hash: 71
5
5
  prerelease: false
6
6
  segments:
7
7
  - 1
8
8
  - 2
9
9
  - 3
10
- - 1
11
- version: 1.2.3.1
10
+ - 2
11
+ version: 1.2.3.2
12
12
  platform: ruby
13
13
  authors:
14
14
  - Samuel Williams
@@ -16,10 +16,23 @@ autorequire:
16
16
  bindir: bin
17
17
  cert_chain: []
18
18
 
19
- date: 2010-12-19 00:00:00 +13:00
19
+ date: 2010-12-22 00:00:00 +13:00
20
20
  default_executable:
21
- dependencies: []
22
-
21
+ dependencies:
22
+ - !ruby/object:Gem::Dependency
23
+ name: xapian-core
24
+ prerelease: false
25
+ requirement: &id001 !ruby/object:Gem::Requirement
26
+ none: false
27
+ requirements:
28
+ - - ">="
29
+ - !ruby/object:Gem::Version
30
+ hash: 3
31
+ segments:
32
+ - 0
33
+ version: "0"
34
+ type: :runtime
35
+ version_requirements: *id001
23
36
  description:
24
37
  email: samuel.williams@oriontransfer.co.nz
25
38
  executables: []
@@ -69,6 +82,6 @@ rubyforge_project:
69
82
  rubygems_version: 1.3.7
70
83
  signing_key:
71
84
  specification_version: 3
72
- summary: Xapian is a framework for fast full-text searching.
85
+ summary: Xapian::Indexer provides a flexible spider for indexing resources.
73
86
  test_files: []
74
87