keyword-filter 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (2) hide show
  1. data/lib/keyword-filter.rb +32 -0
  2. metadata +55 -0
@@ -0,0 +1,32 @@
1
+ #!/usr/bin/ruby
2
+
3
+ # file: keywords-filter.rb
4
+
5
+ require 'rexml/document'
6
+ include REXML
7
+
8
+ class KeywordFilter
9
+ include REXML
10
+
11
+ def initialize(s)
12
+ @keywords = XPath.match(Document.new(open(s)).root, 'records/keyword/phrase/text()')
13
+ end
14
+
15
+ def filter(raw_s)
16
+ s = raw_s.gsub(/\b(#{@keywords.join('|')})\b/i,'<f>\0</f>')
17
+ doc = Document.new("<root>#{s}</root>")
18
+ filtered_words = XPath.match(doc.root, '*')
19
+
20
+ filtered_words.empty? ? raw_s : doc.root
21
+ end
22
+
23
+ def open(s)
24
+ if s[/^https?:\/\//] then # open a file from a url
25
+ buffer = Kernel.open(s, 'UserAgent' => 'KeywordsFilter-Reader').read
26
+ elsif s[/\</] # input xml string
27
+ buffer = s
28
+ else # local file
29
+ buffer = File.open(s,'r').read
30
+ end
31
+ end
32
+ end
metadata ADDED
@@ -0,0 +1,55 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: keyword-filter
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors: []
7
+
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+
12
+ date: 2010-11-13 00:00:00 +00:00
13
+ default_executable:
14
+ dependencies: []
15
+
16
+ description:
17
+ email:
18
+ executables: []
19
+
20
+ extensions: []
21
+
22
+ extra_rdoc_files: []
23
+
24
+ files:
25
+ - lib/keyword-filter.rb
26
+ has_rdoc: true
27
+ homepage:
28
+ licenses: []
29
+
30
+ post_install_message:
31
+ rdoc_options: []
32
+
33
+ require_paths:
34
+ - lib
35
+ required_ruby_version: !ruby/object:Gem::Requirement
36
+ requirements:
37
+ - - ">="
38
+ - !ruby/object:Gem::Version
39
+ version: "0"
40
+ version:
41
+ required_rubygems_version: !ruby/object:Gem::Requirement
42
+ requirements:
43
+ - - ">="
44
+ - !ruby/object:Gem::Version
45
+ version: "0"
46
+ version:
47
+ requirements: []
48
+
49
+ rubyforge_project:
50
+ rubygems_version: 1.3.5
51
+ signing_key:
52
+ specification_version: 3
53
+ summary: keyword-filter
54
+ test_files: []
55
+