riemann-riak 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE +21 -0
- data/README.md +10 -0
- data/bin/riemann-riak +330 -0
- data/bin/riemann-riak-keys +12 -0
- data/bin/riemann-riak-ring +8 -0
- metadata +78 -0
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: 7358bc4125363c3f2774a6579ea6648b9d5efb1b
|
4
|
+
data.tar.gz: ed6e0d58221a1b03e8bd00ff1d2e5649b35b2cd4
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: 061832fbfbefa06354c931caea31604d41557157c07deb75b06cdaafbf3e8d9c5e82d223179dfe21e6b0e61821fb65e7a81c8e46c147216fbcf1dad3241a58fd
|
7
|
+
data.tar.gz: 6a0d5f3ded5dd8fc45132d2a8c4f351e0e78adb006737a98ae84644a7b35da47fa30509b53841555821f0203d2911289af36c577cc3e994790b37defb831a05d
|
data/LICENSE
ADDED
@@ -0,0 +1,21 @@
|
|
1
|
+
The MIT License
|
2
|
+
|
3
|
+
Copyright (c) 2011 Kyle Kingsbury
|
4
|
+
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
7
|
+
in the Software without restriction, including without limitation the rights
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
10
|
+
furnished to do so, subject to the following conditions:
|
11
|
+
|
12
|
+
The above copyright notice and this permission notice shall be included in
|
13
|
+
all copies or substantial portions of the Software.
|
14
|
+
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
21
|
+
THE SOFTWARE.
|
data/README.md
ADDED
data/bin/riemann-riak
ADDED
@@ -0,0 +1,330 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
|
3
|
+
# Forwards information on a Riak node to Riemann.
|
4
|
+
|
5
|
+
require 'riemann/tools'
|
6
|
+
|
7
|
+
class Riemann::Tools::Riak
|
8
|
+
include Riemann::Tools
|
9
|
+
require 'net/http'
|
10
|
+
require 'net/https'
|
11
|
+
require 'yajl/json_gem'
|
12
|
+
|
13
|
+
opt :riak_host, "Riak host for stats <IP> or SSL http(s)://<IP>", :default => Socket.gethostname
|
14
|
+
opt :data_dir, "Riak data directory", :default => '/var/lib/riak'
|
15
|
+
opt :stats_port, "Riak HTTP port for stats", :default => 8098
|
16
|
+
opt :stats_path, "Riak HTTP stats path", :default => '/stats'
|
17
|
+
opt :node_name, "Riak erlang node name", :default => "riak@#{Socket.gethostname}"
|
18
|
+
opt :cookie, "Riak cookie to use", :default => "riak"
|
19
|
+
|
20
|
+
opt :get_50_warning, "FSM 50% get time warning threshold (ms)", :default => 1000
|
21
|
+
opt :put_50_warning, "FSM 50% put time warning threshold (ms)", :default => 1000
|
22
|
+
opt :get_95_warning, "FSM 95% get time warning threshold (ms)", :default => 2000
|
23
|
+
opt :put_95_warning, "FSM 95% put time warning threshold (ms)", :default => 2000
|
24
|
+
opt :get_99_warning, "FSM 99% get time warning threshold (ms)", :default => 10000
|
25
|
+
opt :put_99_warning, "FSM 99% put time warning threshold (ms)", :default => 10000
|
26
|
+
|
27
|
+
# Sets up the checker: detects the locally available tools, probes the Riak
# HTTP stats endpoint once, and exports the Erlang cookie.
#
# @httpstatus ends up true when the probe request completes without raising
# and false otherwise. The HTTP status code of the probe response is not
# inspected here.
def initialize
  detect_features

  @httpstatus =
    begin
      uri = URI.parse(opts[:riak_host])
      # When the option has no URI host component (presumably a bare host or
      # IP), use the option value itself as the host.
      uri.host = opts[:riak_host] if uri.host.nil?

      http = Net::HTTP.new(uri.host, opts[:stats_port])
      http.use_ssl = uri.scheme == 'https'
      # Certificate verification is switched off for https endpoints.
      http.verify_mode = OpenSSL::SSL::VERIFY_NONE if http.use_ssl?

      http.start { |conn| conn.get opts[:stats_path] }
      true
    rescue => _e
      false
    end

  # Override the emulator flags so the cookie can be supplied as an option.
  # This is done only once - hopefully nothing else overrides it later.
  ENV['ERL_AFLAGS'] = "-setcookie #{opts[:cookie]}"
end
|
54
|
+
|
55
|
+
# Records which helper executables `which` can find on this machine.
#
# Sets @escript and @riakadmin to true, then flips each to false when the
# corresponding `which` call prints nothing but whitespace.
def detect_features
  blank = /^\s*$/

  @escript = true   # Whether escript is present on this machine
  @riakadmin = true # Whether riak-admin is present

  @escript = false if `which escript` =~ blank
  @riakadmin = false if `which riak-admin` =~ blank
end
|
68
|
+
|
69
|
+
# Reports the ring status as the 'riak ring' service.
#
# The status text comes from the riemann-riak-ring script located next to
# this file when escript was detected, otherwise from `riak-admin ringready`.
# When neither tool was detected nothing is reported. Output containing a
# line that starts with "TRUE" is reported as 'ok', anything else as
# 'warning'; the raw output is used as the description.
def check_ring
  output =
    if @escript
      bin_dir = File.expand_path(File.dirname(__FILE__))
      `#{bin_dir}/riemann-riak-ring #{opts[:node_name]}`.chomp
    elsif @riakadmin
      `riak-admin ringready`
    end
  return if output.nil?

  report(
    :host => opts[:riak_host],
    :service => 'riak ring',
    :state => (output =~ /^TRUE/ ? 'ok' : 'warning'),
    :description => output
  )
end
|
96
|
+
|
97
|
+
# Reports the key count as the 'riak keys' service.
#
# Runs the riemann-riak-keys script located next to this file against
# opts[:node_name]. Purely numeric output is reported as 'ok' with the count
# as the metric; any other output is reported as 'unknown' with no metric.
# The raw output is the description in both cases.
def check_keys
  bin_dir = File.expand_path(File.dirname(__FILE__))
  count = `#{bin_dir}/riemann-riak-keys #{opts[:node_name]}`.chomp

  event = { :host => opts[:riak_host], :service => 'riak keys' }
  if count =~ /^\d+$/
    event[:state] = 'ok'
    event[:metric] = count.to_i
  else
    event[:state] = 'unknown'
  end
  event[:description] = count

  report(event)
end
|
116
|
+
|
117
|
+
# Reports pending handoffs for this node as the 'riak transfers' service.
#
# Does nothing when riak-admin was not detected. Otherwise runs
# `riak-admin transfers` and looks for a line saying that opts[:node_name]
# is waiting to hand off partitions: if found, reports 'critical' with the
# partition count as the metric, else reports 'ok' with metric 0.
def check_transfers
  return unless @riakadmin

  output = `riak-admin transfers`

  # Escape the node name: it normally contains dots (riak@10.0.0.1), which
  # would otherwise match any character and could pick up another node's line.
  node = Regexp.escape(opts[:node_name])
  pending = output.match(/'#{node}' waiting to handoff (\d+) partitions/)

  if pending
    report(
      :host => opts[:riak_host],
      :service => 'riak transfers',
      :state => 'critical',
      :metric => pending[1].to_i,
      :description => "waiting to handoff #{pending[1]} partitions"
    )
  else
    report(
      :host => opts[:riak_host],
      :service => 'riak transfers',
      :state => 'ok',
      :metric => 0,
      :description => "No pending transfers"
    )
  end
end
|
144
|
+
|
145
|
+
# Reports the size of opts[:data_dir] as the 'riak disk' service.
#
# Takes the first field of `du -Ls` output and divides it by 1024**2 to get
# the reported "GB" figure (this assumes du counts in 1 KiB blocks - confirm
# on the target platform). The state is always 'ok'; empty du output yields
# a metric of 0.0.
def check_disk
  data_dir = opts[:data_dir]
  blocks = `du -Ls #{data_dir}`.split(/\s+/).first.to_i
  gb = blocks / (1024.0**2)

  report(
    :host => opts[:riak_host],
    :service => 'riak disk',
    :state => 'ok',
    :metric => gb,
    :description => "#{gb} GB in #{data_dir}"
  )
end
|
155
|
+
|
156
|
+
# Builds the name of the Riak stat for an FSM type, property and percentile.
# The 50th percentile is spelled 'median'; any other percentile is used as is.
def fsm_stat(type, property, percentile)
  suffix = percentile == 50 ? 'median' : percentile
  "node_#{type}_fsm_#{property}_#{suffix}"
end
|
160
|
+
|
161
|
+
# Maps an FSM value onto an alert state using the configured
# "<type>_<percentile>_warning" threshold.
#
# Returns 'ok' for values from 0 up to the threshold, 'warning' for values
# from the threshold up to twice the threshold, and 'critical' for anything
# else (including negative values).
def fsm_state(type, percentile, val)
  limit = opts[:"#{type}_#{percentile}_warning"]

  return 'ok' if (0..limit).include?(val)
  return 'warning' if (limit..limit * 2).include?(val)

  'critical'
end
|
173
|
+
|
174
|
+
# Get current stats via HTTP
#
# Requests opts[:stats_path] from opts[:riak_host] on opts[:stats_port] and
# returns the parsed JSON body when the response status is 200.
#
# Any error raised while making the request is reported as a critical 'riak'
# event and re-raised. A non-200 response is also reported as critical and
# then raised as a RuntimeError carrying the status code and body.
def stats_http
  begin
    uri = URI.parse(opts[:riak_host])
    # When the option has no URI host component (presumably a bare host or
    # IP), use the option value itself as the host.
    uri.host = opts[:riak_host] if uri.host.nil?

    http = Net::HTTP.new(uri.host, opts[:stats_port])
    http.use_ssl = uri.scheme == 'https'
    # Certificate verification is switched off for https endpoints.
    http.verify_mode = OpenSSL::SSL::VERIFY_NONE if http.use_ssl?

    res = http.start { |h| h.get opts[:stats_path] }
  rescue => e
    report(
      :host => opts[:riak_host],
      :service => 'riak',
      :state => 'critical',
      :description => "error fetching #{opts[:riak_host]}:#{opts[:stats_port]} #{e.class}, #{e.message}"
    )
    raise
  end

  return JSON.parse(res.body) if res.code.to_i == 200

  report(
    :host => opts[:riak_host],
    :service => 'riak',
    :state => 'critical',
    :description => "stats returned HTTP #{res.code}:\n\n#{res.body}"
  )
  # Use res.code here; a misspelled accessor would raise NoMethodError and
  # hide the real status from the caller.
  raise "Can't fetch stats via HTTP: #{res.code}:\n\n#{res.body}"
end
|
211
|
+
|
212
|
+
# Get current stats via riak-admin
#
# Runs `riak-admin status` and returns its "name : value" lines as a hash of
# strings. Raises RuntimeError when the command exits unsuccessfully.
def stats_riak_admin
  output = `riak-admin status`
  raise "riak-admin failed" unless $?.success?

  parse_riak_admin_status(output)
end

# Internal helper: turns `riak-admin status` text into a name => value hash.
#
# Each line is split on the first " : " only, so values that themselves
# contain " : " stay intact. Lines without a separator (headers, rules,
# blank lines) are skipped, because Hash[] rejects one-element pairs.
def parse_riak_admin_status(output)
  pairs = output.split(/\n/).map { |line| line.split(/ : /, 2) }
  Hash[pairs.select { |pair| pair.size == 2 }]
end
|
218
|
+
|
219
|
+
# Get current stats as a hash
#
# Uses the HTTP endpoint when the startup probe succeeded (@httpstatus),
# otherwise riak-admin when it was detected. With neither available, reports
# a critical 'riak' event and raises a RuntimeError with the same message.
def stats
  return stats_http if @httpstatus
  return stats_riak_admin if @riakadmin

  report(
    :host => opts[:riak_host],
    :service => 'riak',
    :state => 'critical',
    :description => "No mechanism for fetching Riak stats: neither HTTP nor riak-admin available."
  )
  raise "No mechanism for fetching Riak stats: neither HTTP nor riak-admin available."
end
|
235
|
+
|
236
|
+
# Names of the Riak stats that check_stats reports as per-second rates,
# each under a "riak <name>" service.
def core_services
  %w[
    vnode_gets
    vnode_puts
    node_gets
    node_puts
    node_gets_set
    node_puts_set
    read_repairs
  ]
end
|
245
|
+
|
246
|
+
# FSM type/property combinations to report, as an array of single-pair
# hashes ({ type => property }). Each pair is combined with every entry of
# fsm_percentiles by check_stats.
def fsm_types
  [%w[get time], %w[put time], %w[get set_objsize]].map do |type, property|
    { type => property }
  end
end
|
250
|
+
|
251
|
+
# Percentiles reported for every FSM type/property pair; 50 is reported
# through the 'median' stat (see fsm_stat).
def fsm_percentiles
  [50, 95, 99]
end
|
254
|
+
|
255
|
+
# Reports current stats to Riemann
#
# Fetches the stats hash and reports:
#   * 'riak' itself as 'ok';
#   * every core service as a per-second rate (the stat value divided by 60);
#   * every FSM type/property/percentile, with 'time' values converted from
#     microseconds to milliseconds and graded by fsm_state.
#
# When fetching the stats raises, every one of those services is reported as
# 'critical' with the error message as the description, and nothing else is
# sent.
def check_stats
  begin
    current = stats
  rescue => e
    failure = {
      :state => 'critical',
      :description => e.message,
      :host => opts[:riak_host]
    }
    report(failure.merge(:service => 'riak'))
    core_services.each do |s|
      report(failure.merge(:service => "riak #{s}"))
    end
    each_fsm_metric do |type, prop, percentile|
      report(failure.merge(:service => "riak #{type} #{prop} #{percentile}"))
    end
    return
  end

  # Riak itself
  report(
    :host => opts[:riak_host],
    :service => 'riak',
    :state => 'ok'
  )

  # Gets/puts/rr
  core_services.each do |s|
    rate = current[s].to_i / 60.0
    report(
      :host => opts[:riak_host],
      :service => "riak #{s}",
      :state => 'ok',
      :metric => rate,
      :description => "#{rate}/sec"
    )
  end

  # FSMs
  each_fsm_metric do |type, prop, percentile|
    timing = prop == 'time'

    # to_i already maps a missing stat (nil) and the string 'undefined' to 0,
    # so no separate fallback is needed.
    val = current[fsm_stat(type, prop, percentile)].to_i
    val /= 1000.0 if timing # Convert us to ms

    report(
      :host => opts[:riak_host],
      :service => "riak #{type} #{prop} #{percentile}",
      :state => timing ? fsm_state(type, percentile, val) : 'ok',
      :metric => val,
      # Only time values are milliseconds; other properties get no unit.
      :description => timing ? "#{val} ms" : val.to_s
    )
  end
end

# Internal helper: yields type, property and percentile for every FSM
# combination built from fsm_types and fsm_percentiles.
def each_fsm_metric
  fsm_types.each do |typespec|
    typespec.each do |type, prop|
      fsm_percentiles.each do |percentile|
        yield type, prop, percentile
      end
    end
  end
end
|
319
|
+
|
320
|
+
# Runs one round of checks: stats, ring, disk, then transfers.
#
# check_keys is deliberately left out of the round because counting keys
# can utterly destroy a cluster.
def tick
  check_stats
  check_ring
  check_disk
  check_transfers
end
|
328
|
+
end
|
329
|
+
|
330
|
+
Riemann::Tools::Riak.run
|
@@ -0,0 +1,12 @@
|
|
1
|
+
#!/usr/bin/env escript
|
2
|
+
%%! -name riakstatuscheck@127.0.0.1 -hidden
|
3
|
+
|
4
|
+
%% Prints the sum of the per-vnode key counts returned by
%% riak_kv_bitcask_backend:key_counts() on the given node.
%% With no argument the node defaults to riak@127.0.0.1.
%%
%% When the remote call fails, rpc:call returns {badrpc, Reason}; that is
%% printed instead of a number so the caller sees why no count is available
%% rather than getting empty output from a crashed fold.
main([]) -> main(["riak@127.0.0.1"]);
main([Node]) ->
    case rpc:call(list_to_atom(Node), riak_kv_bitcask_backend, key_counts, []) of
        {badrpc, Reason} ->
            io:format("badrpc: ~p\n", [Reason]);
        Counts ->
            Total = lists:foldl(
                fun({_VNode, Count}, Sum) -> Sum + Count end,
                0,
                Counts
            ),
            io:format("~w\n", [Total])
    end.
|
metadata
ADDED
@@ -0,0 +1,78 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: riemann-riak
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.1.0
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Kyle Kingsbury
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2016-01-21 00:00:00.000000000 Z
|
12
|
+
dependencies:
|
13
|
+
- !ruby/object:Gem::Dependency
|
14
|
+
name: riemann-tools
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
16
|
+
requirements:
|
17
|
+
- - ">="
|
18
|
+
- !ruby/object:Gem::Version
|
19
|
+
version: 0.2.7
|
20
|
+
type: :runtime
|
21
|
+
prerelease: false
|
22
|
+
version_requirements: !ruby/object:Gem::Requirement
|
23
|
+
requirements:
|
24
|
+
- - ">="
|
25
|
+
- !ruby/object:Gem::Version
|
26
|
+
version: 0.2.7
|
27
|
+
- !ruby/object:Gem::Dependency
|
28
|
+
name: yajl-ruby
|
29
|
+
requirement: !ruby/object:Gem::Requirement
|
30
|
+
requirements:
|
31
|
+
- - ">="
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 1.1.0
|
34
|
+
type: :runtime
|
35
|
+
prerelease: false
|
36
|
+
version_requirements: !ruby/object:Gem::Requirement
|
37
|
+
requirements:
|
38
|
+
- - ">="
|
39
|
+
- !ruby/object:Gem::Version
|
40
|
+
version: 1.1.0
|
41
|
+
description:
|
42
|
+
email: aphyr@aphyr.com
|
43
|
+
executables:
|
44
|
+
- riemann-riak
|
45
|
+
- riemann-riak-keys
|
46
|
+
- riemann-riak-ring
|
47
|
+
extensions: []
|
48
|
+
extra_rdoc_files: []
|
49
|
+
files:
|
50
|
+
- LICENSE
|
51
|
+
- README.md
|
52
|
+
- bin/riemann-riak
|
53
|
+
- bin/riemann-riak-keys
|
54
|
+
- bin/riemann-riak-ring
|
55
|
+
homepage: https://github.com/riemann/riemann-riak
|
56
|
+
licenses: []
|
57
|
+
metadata: {}
|
58
|
+
post_install_message:
|
59
|
+
rdoc_options: []
|
60
|
+
require_paths:
|
61
|
+
- lib
|
62
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
63
|
+
requirements:
|
64
|
+
- - ">="
|
65
|
+
- !ruby/object:Gem::Version
|
66
|
+
version: 1.8.7
|
67
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
68
|
+
requirements:
|
69
|
+
- - ">="
|
70
|
+
- !ruby/object:Gem::Version
|
71
|
+
version: '0'
|
72
|
+
requirements: []
|
73
|
+
rubyforge_project: riemann-riak
|
74
|
+
rubygems_version: 2.4.5
|
75
|
+
signing_key:
|
76
|
+
specification_version: 4
|
77
|
+
summary: Submits riak stats to riemann.
|
78
|
+
test_files: []
|