solr-client 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,17 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
data/Gemfile ADDED
@@ -0,0 +1,3 @@
1
+ source 'https://rubygems.org'
2
+
3
+ gemspec
data/LICENSE ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2012 zzzhc
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
@@ -0,0 +1,39 @@
1
+ # Solr::Client
2
+
3
+ A fast Solr client for Ruby.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'solr-client'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install solr-client
18
+
19
+ ## Usage
20
+
21
+ ``` ruby
22
+ solr_base_url = "http://localhost:8983/solr"
23
+ solr_client = Solr::Client.new(solr_base_url)
24
+ solr_client.core = "article"
25
+ rows = mysql.query("select * from article order by id asc limit 100")
26
+ rows.each do |row|
27
+ solr_client.add(row)
28
+ end
29
+ solr_client.commit
30
+ solr_client.stop
31
+ ```
32
+
33
+ ## Contributing
34
+
35
+ 1. Fork it
36
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
37
+ 3. Commit your changes (`git commit -am 'Added some feature'`)
38
+ 4. Push to the branch (`git push origin my-new-feature`)
39
+ 5. Create new Pull Request
@@ -0,0 +1,2 @@
1
+ #!/usr/bin/env rake
2
+ require "bundler/gem_tasks"
@@ -0,0 +1,300 @@
1
+ require 'curb'
2
+ require 'thread'
3
+ require 'cgi'
4
+ require 'time'
5
+
6
+ module Solr
7
+
8
# Builds the XML bodies of Solr update messages (add / delete).
# Intended to be mixed into a class; the escaping helpers are private.
module Codec

  # Attributes that may be copied from an options hash onto the <add> element.
  ALLOWED_ADD_ATTRS = [:overwrite, :commitWithin]

  # Serializes one document (a Hash) or an Array of documents into an
  # <add> message.
  #
  # data::      Hash of field name => value (or Array of values), or an
  #             Array of such hashes. Fields whose value is nil are skipped.
  # add_attrs:: Hash; only the keys listed in ALLOWED_ADD_ATTRS with a
  #             non-nil value are emitted as attributes of <add>, every
  #             other key is ignored.
  #
  # Returns the XML as a String.
  def to_docs(data, add_attrs={})
    # compact drops the nil entries produced for ignored keys so they do not
    # turn into stray spaces inside the <add> tag.
    attrs = add_attrs.map do |k, v|
      "#{k}=\"#{h(v)}\"" if ALLOWED_ADD_ATTRS.include?(k) && !v.nil?
    end.compact.join(" ")
    attrs = " " + attrs unless attrs.empty?

    content = String.new('<?xml version="1.0" encoding="UTF-8"?>')
    content << "<add#{attrs}>"

    data = [data] unless data.is_a?(Array)
    data.each do |doc|
      content << '<doc>'
      doc.each do |field_key, field_values|
        next if field_values.nil?
        field_values = [field_values] unless field_values.is_a?(Array)
        field_values.each do |field_value|
          field_value = solr_time(field_value) if time_like?(field_value)
          content << '<field name="' << h(field_key) << '">'
          content << h(field_value)
          content << '</field>'
        end
      end
      content << '</doc>'
    end
    content << '</add>'
  end

  # Builds a <delete> message with one <id> element per given id.
  # Accepts ids as separate arguments, as arrays, or a mix of both.
  def to_delete_by_id(*ids)
    content = String.new('<?xml version="1.0" encoding="UTF-8"?><delete>')
    ids.flatten.each { |id| content << '<id>' << h(id) << '</id>' }
    content << '</delete>'
  end

  # Builds a <delete> message with one <query> element per given query.
  # Accepts queries as separate arguments, as arrays, or a mix of both.
  def to_delete_by_query(*queries)
    content = String.new('<?xml version="1.0" encoding="UTF-8"?><delete>')
    queries.flatten.each { |query| content << '<query>' << h(query) << '</query>' }
    content << '</delete>'
  end

  private

  # XML/HTML-escapes the string form of +s+.
  def h(s)
    CGI.escapeHTML(s.to_s)
  end

  # URL-encodes the string form of +s+.
  def escape(s)
    CGI.escape(s.to_s)
  end

  # True for values that must be rendered as a timestamp.
  def time_like?(value)
    case value
    when Time, DateTime then true
    else false
    end
  end

  # Formats a Time/DateTime as "YYYY-MM-DDTHH:MM:SSZ". The trailing "Z"
  # denotes UTC, so the value is converted to UTC first (on a copy; the
  # caller's object is left untouched).
  def solr_time(value)
    utc = value.respond_to?(:getutc) ? value.getutc : value.new_offset(0)
    utc.strftime("%Y-%m-%dT%H:%M:%SZ")
  end

end
65
+
66
# One HTTP request plus the outcome recorded when it completes.
#
# A request built without a block is synchronous (see #sync?); one built
# with a block is asynchronous and the block is called with the request
# itself from #on_complete.
class Request
  # url::      target URL
  # callback:: completion block, nil for synchronous requests
  # body::     raw response body, nil until the request completed
  # code::     HTTP response code, nil until the request completed
  attr_reader :url, :callback, :body, :code

  # url::  target URL.
  # data:: request body, or an object responding to #call that produces
  #        the body lazily (see #data). nil means no body.
  def initialize(url, data = nil, &block)
    @url, @data, @callback = url, data, block
    @finished = false
  end

  # True when no completion block was given.
  def sync?
    @callback.nil?
  end

  # Records the outcome from +curl+ (read through #body_str and
  # #response_code) and then invokes the completion block, if any.
  def on_complete(curl)
    @finished = true
    @body = curl.body_str
    @code = curl.response_code
    @callback.call(self) if @callback
  end

  # The request body. A callable body is invoked on first access and
  # replaced by its result, so it is built at most once.
  def data
    @data = @data.call if @data.respond_to?(:call)
    @data
  end

  # True once #on_complete has run.
  def finished?
    @finished
  end

  # True when the recorded HTTP response code is 200.
  def success?
    @code == 200
  end

  # The response: a parsed Response when the URL asked for wt=ruby,
  # otherwise the raw body. Returns nil while no body has been recorded
  # yet, instead of trying to parse a missing body.
  def response
    return @body if @body.nil? || url !~ /wt=ruby/
    @response ||= Response.new(@body)
  end

end
107
+
108
# Parsed form of a Solr response requested with wt=ruby.
class Response

  # status::    "status" from the response header
  # qtime::     "QTime" from the response header
  # params::    "params" from the response header ({} when absent)
  # rows::      "rows" request parameter as an Integer (0 when absent)
  # docs::      "docs" of the response section ([] when absent)
  # start::     "start" of the response section; falls back to the "start"
  #             request parameter (as an Integer) when the section has none
  # num_found:: "numFound" of the response section (nil when absent)
  attr_reader :status, :docs, :start, :num_found, :qtime, :params, :rows

  # body:: String holding the Ruby-literal response text.
  def initialize(body)
    # SECURITY(review): eval executes whatever text the server returned.
    # Only use this against a trusted Solr instance over a trusted
    # connection; a safe parser should replace this call.
    data = eval(body)

    # The header may omit "params" and the payload may have no "response"
    # section at all; default both instead of failing on nil.
    header = data["responseHeader"] || {}
    @status = header["status"]
    @qtime = header["QTime"]
    @params = header["params"] || {}
    @rows = @params["rows"].to_i

    response = data["response"] || {}
    @docs = response["docs"] || []
    @num_found = response["numFound"]
    @start = response.key?("start") ? response["start"] : @params["start"].to_i
  end

  # True when the header status is 0.
  def success?
    @status == 0
  end

end
131
+
132
# Solr HTTP client.
#
# Every request method takes an optional block. Without a block the request
# is performed immediately and the finished Request is returned. With a
# block the request is queued, sent from a background thread through a
# Curl::Multi handle, and the block is called with the Request once it
# completes.
#
# Common +options+ keys (see #real_url):
#   :url    - full URL to use instead of the computed one
#   :core   - core name, overriding #core
#   :action - handler name, "update" by default
#
# see http://wiki.apache.org/solr/UpdateXmlMessages
class Client

  VERSION = "0.0.1"

  include Codec

  # Default core name used when building URLs (may be nil).
  attr_accessor :core

  # base_url:: Solr base URL; one trailing slash is removed.
  # options::  :max_connects - passed to Curl::Multi#max_connects= and used
  #            as the threshold for #full? (default 10).
  def initialize(base_url, options = {})
    @base_url = base_url.gsub(/\/$/, '')
    @max_connects = options[:max_connects] || 10
    @stop = false
    @queue = Queue.new
    @multi = Curl::Multi.new
    @multi.max_connects = @max_connects
  end

  # execute a search request.
  # [query] query parameters, keys:
  #   q: query
  #   qt: query type
  #   fq: filter query
  #   fl: specify a set of fields to return, * means all fields
  #   sort: sort method, default value is score desc
  #   start: offset in result set
  #   rows: maximum number of documents to return, default value is 10
  #   defType: specify the query parser
  #
  # An Array value is sent as one repeated parameter per element.
  # The :wt parameter is always forced to "ruby". Neither +query+ nor
  # +options+ is modified.
  #
  # ref:
  #   http://wiki.apache.org/solr/CoreQueryParameters
  #   http://wiki.apache.org/solr/CommonQueryParameters
  #
  def select(query, options={}, &block)
    # merge returns copies, so the caller's hashes stay untouched.
    params = query.merge(:wt => "ruby")
    url = real_url(options.merge(:action => "select"))
    execute Request.new(append_query(url, to_query_string(params)), &block)
  end

  # Sends commit=true to the update URL.
  def commit(options = {}, &block)
    execute Request.new(append_query(real_url(options), "commit=true"), &block)
  end

  # Sends rollback=true to the update URL.
  def rollback(options = {}, &block)
    execute Request.new(append_query(real_url(options), "rollback=true"), &block)
  end

  # Sends optimize=true to the update URL.
  def optimize(options = {}, &block)
    execute Request.new(append_query(real_url(options), "optimize=true"), &block)
  end

  # Deletes every document (delete by the query "*:*").
  def delete_all(options = {}, &block)
    delete_by_query("*:*", options, &block)
  end

  # Deletes by id; +id+ may be a single id or an Array of ids.
  def delete_by_id(id, options = {}, &block)
    data = to_delete_by_id(id)
    execute Request.new(real_url(options), data, &block)
  end

  # Deletes by query; +query+ may be a single query or an Array of queries.
  def delete_by_query(query, options = {}, &block)
    data = to_delete_by_query(query)
    execute Request.new(real_url(options), data, &block)
  end

  # Adds one document (Hash) or an Array of documents. +options+ is also
  # handed to Codec#to_docs, which picks the <add> attributes out of it.
  def add(docs, options = {}, &block)
    # Serialized lazily: the XML is only built when the request body is
    # first read, not while the request waits in the queue.
    data = lambda { to_docs(docs, options) }
    execute Request.new(real_url(options), data, &block)
  end

  # Marks the client as stopped and waits for the background thread, if one
  # was started, to finish the queued requests.
  def stop
    @stop = true
    if @thread
      # nil wakes the worker up if it is blocked waiting on the queue.
      @queue.push nil
      @thread.join
      @thread = nil
    end
  end

  # Stops the client and makes it usable for asynchronous requests again.
  def reset
    stop
    @stop = false
  end

  # True when more requests are queued than max_connects.
  def full?
    @queue.size > @max_connects
  end

  private

  # Performs +request+ right away when it is synchronous, otherwise queues
  # it for the background thread. Returns the request.
  # Raises RuntimeError for an asynchronous request on a stopped client.
  def execute(request)
    if request.sync?
      curl = build_curl(request)
      curl.perform
      request.on_complete(curl)
    else
      raise "please call reset before performing solr request on a stopped client!" if @stop
      @queue.push request
      ensure_thread_start
    end
    request
  end

  # options[:url] when given, otherwise base_url[/core]/action.
  def real_url(options = {})
    return options[:url] if options[:url]
    action = options[:action] || "update"
    core = options[:core] || self.core
    core ? "#{@base_url}/#{core}/#{action}" : "#{@base_url}/#{action}"
  end

  # Appends +query_string+ to +url+ with the right separator: "?" when the
  # URL has no query part yet, nothing when it already ends in "?" or "&",
  # and "&" otherwise.
  def append_query(url, query_string)
    separator =
      if !url.include?('?')
        '?'
      elsif url.end_with?('?', '&')
        ''
      else
        '&'
      end
    "#{url}#{separator}#{query_string}"
  end

  # URL-encodes +params+ as key=value pairs joined by "&".
  def to_query_string(params)
    params.flat_map do |key, value|
      values = value.is_a?(Array) ? value : [value]
      values.map { |v| "#{escape(key)}=#{escape(v)}" }
    end.join("&")
  end

  # Builds the Curl::Easy handle for +request+; the body is posted only
  # when the request has one.
  def build_curl(request)
    Curl::Easy.new do |curl|
      curl.url = request.url
      curl.headers["Content-Type"] = "application/xml; charset=UTF-8"
      curl.headers["Expect"] = ""
      body = request.data
      curl.post_body = body if body
    end
  end

  # Starts the background thread unless a live one exists. A worker that
  # died (for example because a callback raised) is replaced; otherwise
  # later requests would stay in the queue forever.
  def ensure_thread_start
    return @thread if @thread && @thread.alive?
    @thread = Thread.new do
      run
    end
  end

  # Hands +request+ to the multi handle; nil (the wake-up marker pushed by
  # #stop) is ignored.
  def send_request(request)
    return unless request
    curl = build_curl(request)
    curl.on_complete do |easy|
      on_idle
      request.on_complete(easy)
    end
    @multi.add(curl)
  end

  # Worker loop: runs until the client is stopped and the queue is empty.
  def run
    while !@stop || !empty?
      # Queue#pop blocks until a request (or the nil marker) is available.
      send_request(@queue.pop)
      @multi.perform do
        on_idle
      end
    end
  end

  # Feeds one more queued request to the multi handle when possible.
  def on_idle
    if !@stop && !empty? && !busy?
      send_request(@queue.pop)
    end
  end

  # True when no request is waiting in the queue.
  def empty?
    @queue.size == 0
  end

  # True when the multi handle holds more than twice max_connects requests.
  def busy?
    @multi.requests.size > @max_connects * 2
  end

end
299
+ end
300
+
@@ -0,0 +1,19 @@
1
+ # -*- encoding: utf-8 -*-
2
+ require File.expand_path('../lib/solr-client', __FILE__)
3
+
4
# Gem specification for solr-client.
Gem::Specification.new do |gem|
  gem.authors       = ["zzzhc"]
  gem.email         = ["zzzhc.starfire@gmail.com"]
  gem.description   = %q{fast solr client for ruby}
  gem.summary       = %q{a high performance, little memory footprint solr client for ruby}
  gem.homepage      = "https://github.com/freewheel/solr-client"
  # The repository ships an MIT LICENSE file; declare it in the gem too.
  gem.license       = "MIT"

  # Split on newlines only, so file names containing spaces stay intact.
  gem.files         = `git ls-files`.split("\n")
  gem.executables   = gem.files.grep(%r{^bin/}).map{ |f| File.basename(f) }
  gem.test_files    = gem.files.grep(%r{^(test|spec|features)/})
  gem.name          = "solr-client"
  gem.require_paths = ["lib"]
  gem.version       = Solr::Client::VERSION

  gem.add_dependency 'curb', '>= 0.8.1'
end
metadata ADDED
@@ -0,0 +1,69 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: solr-client
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ prerelease:
6
+ platform: ruby
7
+ authors:
8
+ - zzzhc
9
+ autorequire:
10
+ bindir: bin
11
+ cert_chain: []
12
+ date: 2012-09-03 00:00:00.000000000 Z
13
+ dependencies:
14
+ - !ruby/object:Gem::Dependency
15
+ name: curb
16
+ requirement: !ruby/object:Gem::Requirement
17
+ none: false
18
+ requirements:
19
+ - - ! '>='
20
+ - !ruby/object:Gem::Version
21
+ version: 0.8.1
22
+ type: :runtime
23
+ prerelease: false
24
+ version_requirements: !ruby/object:Gem::Requirement
25
+ none: false
26
+ requirements:
27
+ - - ! '>='
28
+ - !ruby/object:Gem::Version
29
+ version: 0.8.1
30
+ description: fast solr client for ruby
31
+ email:
32
+ - zzzhc.starfire@gmail.com
33
+ executables: []
34
+ extensions: []
35
+ extra_rdoc_files: []
36
+ files:
37
+ - .gitignore
38
+ - Gemfile
39
+ - LICENSE
40
+ - README.md
41
+ - Rakefile
42
+ - lib/solr-client.rb
43
+ - solr-client.gemspec
44
+ homepage: https://github.com/freewheel/solr-client
45
+ licenses: []
46
+ post_install_message:
47
+ rdoc_options: []
48
+ require_paths:
49
+ - lib
50
+ required_ruby_version: !ruby/object:Gem::Requirement
51
+ none: false
52
+ requirements:
53
+ - - ! '>='
54
+ - !ruby/object:Gem::Version
55
+ version: '0'
56
+ required_rubygems_version: !ruby/object:Gem::Requirement
57
+ none: false
58
+ requirements:
59
+ - - ! '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ requirements: []
63
+ rubyforge_project:
64
+ rubygems_version: 1.8.24
65
+ signing_key:
66
+ specification_version: 3
67
+ summary: a high performance, little memory footprint solr client for ruby
68
+ test_files: []
69
+ has_rdoc: