logstash-input-generator 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml ADDED
@@ -0,0 +1,15 @@
1
+ ---
2
+ !binary "U0hBMQ==":
3
+ metadata.gz: !binary |-
4
+ OTU0ZTJkYzI2MDgxMDhjZWZjMThmM2MxNTQ0OGQ2M2QzZTlmNjFjNQ==
5
+ data.tar.gz: !binary |-
6
+ ZWQzYTQ2NmEwODhkYzkxZjlkNGE1MDg5YmRiYzVlMDMzYjFlOTFjYw==
7
+ SHA512:
8
+ metadata.gz: !binary |-
9
+ OWE1NjliOTZhNDgxNmU4N2ZhOTFhYTI1OGQ1MzVmMWE2YjQwYjJlZmZhMDc3
10
+ NmYwODc1M2IzNTQ2ZDUzMjRkYThmYzA1YzJkYTY5ZTE5NWJlMDI1ODEwODdk
11
+ NmQ1MGRhMDM0OGQ1MTg0NTE3ZjVmNWQxYjBkYjg2NGFmNGE0ZDk=
12
+ data.tar.gz: !binary |-
13
+ ZmIxZDliNmRjZGU4NDQzYTUxMzViODZhZjljY2E1MWMyZGNlYWRmZTUyOGQx
14
+ MjM2NzM3YmQzYTE3MTRmZDAzYTAwZmEyNTM2ZjczMmJkYTlmYmJhY2UwZjA0
15
+ MjE3ODdjZjY2N2RjZjExNmFlMDRkM2ZkZDQzMWJlOWExMzE2OGI=
data/.gitignore ADDED
@@ -0,0 +1,4 @@
1
+ *.gem
2
+ Gemfile.lock
3
+ .bundle
4
+ vendor
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
# Fetch gems over TLS so they cannot be tampered with in transit.
source 'https://rubygems.org'

# Build and release tooling used by the Rakefile and rakelib tasks.
gem 'rake'
gem 'gem_publisher'
gem 'archive-tar-minitar'
data/Rakefile ADDED
@@ -0,0 +1,6 @@
1
# Descriptors of third-party files to vendor; this plugin declares none.
@files = []

# Running rake without a task name lists the available tasks.
task(:default) { system("rake -T") }
6
+
@@ -0,0 +1,96 @@
1
+ # encoding: utf-8
2
+ require "logstash/inputs/threadable"
3
+ require "logstash/namespace"
4
+ require "socket" # for Socket.gethostname
5
+
6
# Generate random log events.
#
# The general intention of this is to test performance of plugins.
#
# Every generated event carries the local hostname in "host" and the number
# of the current pass over the configured lines in "sequence".
class LogStash::Inputs::Generator < LogStash::Inputs::Threadable
  config_name "generator"
  milestone 3

  default :codec, "plain"

  # The message string to use in the event.
  #
  # If you set this to 'stdin' then this plugin will read a single line from
  # stdin and use that as the message string for every event.
  #
  # Otherwise, this value will be used verbatim as the event message.
  config :message, :validate => :string, :default => "Hello world!"

  # The lines to emit, in order. When this option is set, the 'message'
  # setting is ignored.
  #
  # Example:
  #
  #     input {
  #       generator {
  #         lines => [
  #           "line 1",
  #           "line 2",
  #           "line 3"
  #         ]
  #         # Emit all lines 3 times.
  #         count => 3
  #       }
  #     }
  #
  # The above will emit "line 1" then "line 2" then "line 3", then "line 1", etc...
  config :lines, :validate => :array

  # Set how many times the message (or the full list of lines) should be
  # generated.
  #
  # The default, 0, means generate an unlimited number of events.
  config :count, :validate => :number, :default => 0

  public
  # Resolve the hostname once and normalise 'count' to a single number.
  def register
    @host = Socket.gethostname
    @count = @count.first if @count.is_a?(Array)
  end # def register

  # Push generated events onto +queue+ until the plugin is finished or
  # 'count' passes over the lines have been emitted.
  def run(queue)
    # Remember the queue so teardown can flush pending codec events into it.
    @queue = queue
    number = 0

    if @message == "stdin"
      @logger.info("Generator plugin reading a line from stdin")
      @message = $stdin.readline
      @logger.debug("Generator line read complete", :message => @message)
    end
    @lines = [@message] if @lines.nil?

    while !finished? && (@count <= 0 || number < @count)
      @lines.each do |line|
        # The codec receives a copy so the configured line is never mutated.
        @codec.decode(line.clone) do |event|
          decorate(event)
          event["host"] = @host
          # All lines emitted during one pass share the same sequence number.
          event["sequence"] = number
          queue << event
        end
      end
      number += 1
    end # loop

    flush_codec(queue)
  end # def run

  public
  # Flush whatever the codec still buffers, then mark the plugin finished.
  def teardown
    # Without a prior run there is no queue to flush into.
    flush_codec(@queue) if @queue
    finished
  end # def teardown

  private
  # Emit any events still buffered in the codec onto +queue+.
  # Codecs that do not implement #flush are skipped.
  def flush_codec(queue)
    return unless @codec.respond_to?(:flush)

    @codec.flush do |event|
      decorate(event)
      event["host"] = @host
      queue << event
    end
  end # def flush_codec
end # class LogStash::Inputs::Generator
@@ -0,0 +1,27 @@
1
# Gem specification for the logstash generator input plugin.
Gem::Specification.new do |s|

  s.name            = 'logstash-input-generator'
  s.version         = '0.1.0'
  s.licenses        = ['Apache License (2.0)']
  s.summary         = "Generate random log events."
  s.description     = "Generate random log events."
  s.authors         = ["Elasticsearch"]
  s.email           = 'richard.pijnenburg@elasticsearch.com'
  s.homepage        = "http://logstash.net/"
  s.require_paths   = ["lib"]

  # Files
  # Split on newlines only: `git ls-files` prints one path per line, and
  # splitting on arbitrary whitespace would break paths that contain spaces.
  s.files = `git ls-files`.split("\n") + ::Dir.glob('vendor/*')

  # Tests
  s.test_files = s.files.grep(%r{^(test|spec|features)/})

  # Special flag to let us know this is actually a logstash plugin
  s.metadata = { "logstash_plugin" => "true", "group" => "input" }

  # Gem dependencies
  s.add_runtime_dependency 'logstash', '>= 1.4.0', '< 2.0.0'

  s.add_runtime_dependency 'logstash-codec-plain'
end
27
+
@@ -0,0 +1,9 @@
1
+ require "gem_publisher"
2
+
3
desc "Publish gem to RubyGems.org"
task :publish_gem do |_task|
  # Look for the gemspec one directory above the directory holding this file.
  project_root = File.expand_path('..', File.dirname(__FILE__))
  gemspec_path = Dir.glob(File.join(project_root, '*.gemspec')).first

  published = GemPublisher.publish_if_updated(gemspec_path, :rubygems)
  puts "Published #{published}" if published
end
9
+
@@ -0,0 +1,169 @@
1
+ require "net/http"
2
+ require "uri"
3
+ require "digest/sha1"
4
+
5
# Build a path below the "vendor" directory from the given path components.
def vendor(*args)
  File.join("vendor", *args)
end
8
+
9
# Directory task for "vendor/"; it lists the "vendor" task as a prerequisite
# and creates the directory named by the task itself.
directory "vendor/" => ["vendor"] do |dir_task, _args|
  mkdir dir_task.name
end
12
+
13
# Download +url+ to +output+ and verify the SHA1 of the downloaded content.
#
# url    - address of the file to download
# sha1   - expected hex SHA1 digest of the content
# output - path the content is written to
#
# Fails (RuntimeError) when the digest reported by the download differs
# from +sha1+.
def fetch(url, sha1, output)
  puts "Downloading #{url}"
  downloaded_sha1 = download(url, output)
  return if downloaded_sha1 == sha1

  fail "SHA1 does not match (expected '#{sha1}' but got '#{downloaded_sha1}')"
end # def fetch
22
+
23
# Ensure the file behind +url+ is present in vendor/ with the expected SHA1,
# downloading it when it is missing or its digest differs.
#
# url  - address of the file; its basename becomes the local file name
# sha1 - expected hex SHA1 digest of the file
#
# Defines a rake task named after the output path, invokes it immediately and
# returns the output path ("vendor/<basename>").
def file_fetch(url, sha1)
  filename = File.basename( URI(url).path )
  output = "vendor/#{filename}"
  task output => [ "vendor/" ] do
    # Only a missing local file is treated as "no digest". The rescue is kept
    # away from the fetch call so an ENOENT raised while downloading is
    # reported instead of silently triggering a second download.
    existing_sha1 = begin
      file_sha1(output)
    rescue Errno::ENOENT
      nil
    end
    fetch(url, sha1, output) if existing_sha1 != sha1
  end.invoke

  return output
end
39
+
40
# Compute the hex SHA1 digest of the file at +path+.
#
# The file is read in binary mode so the digest reflects the exact bytes on
# disk on every platform.
#
# Raises Errno::ENOENT when the file does not exist.
def file_sha1(path)
  Digest::SHA1.file(path).hexdigest
end
54
+
55
# Download +url+ into +output+ and return the hex SHA1 of the received bytes.
#
# The body is streamed into "<output>.tmp" and renamed to +output+ only after
# the transfer completes, so a failed download never leaves a partial file at
# +output+. A percentage progress indicator is printed when stdout is a tty
# and the server reports a content length.
#
# Fails (RuntimeError) when the server does not answer with a 2xx status.
# A SocketError is reported on stdout and re-raised.
def download(url, output)
  uri = URI(url)
  digest = Digest::SHA1.new
  tmp = "#{output}.tmp"
  Net::HTTP.start(uri.host, uri.port, :use_ssl => (uri.scheme == "https")) do |http|
    # request_uri keeps the query string, which uri.path would drop.
    request = Net::HTTP::Get.new(uri.request_uri)
    http.request(request) do |response|
      # response.code is a String, so test the response class rather than
      # comparing against Integer status codes.
      fail "HTTP fetch failed for #{url}. #{response}" unless response.is_a?(Net::HTTPSuccess)
      # A missing content-length header yields 0.0, which disables progress output.
      size = response["content-length"].to_i.to_f
      count = 0
      # Binary mode: the payload must be written byte-for-byte.
      File.open(tmp, "wb") do |fd|
        response.read_body do |chunk|
          fd.write(chunk)
          digest << chunk
          if size > 0 && $stdout.tty?
            count += chunk.bytesize
            $stdout.write(sprintf("\r%0.2f%%", count/size * 100))
          end
        end
      end
      $stdout.write("\r      \r") if $stdout.tty?
    end
  end

  File.rename(tmp, output)

  return digest.hexdigest
rescue SocketError => e
  puts "Failure while downloading #{url}: #{e}"
  raise
ensure
  # Remove the partial download if the rename above never happened.
  File.unlink(tmp) if File.exist?(tmp)
end # def download
88
+
89
# Extract entries from the gzipped tarball at +tarball+.
#
# The block is called with every archive entry and returns the destination
# path for that entry, or nil to skip it. Files that already exist with the
# same size and permission bits are left untouched. The tarball is deleted
# after a successful extraction.
def untar(tarball, &block)
  require "zlib"
  require "archive/tar/minitar"
  tgz = Zlib::GzipReader.new(File.open(tarball, "rb"))
  tar = Archive::Tar::Minitar::Input.open(tgz)
  begin
    tar.each do |entry|
      path = block.call(entry)
      next if path.nil?
      parent = File.dirname(path)

      mkdir_p parent unless File.directory?(parent)

      if entry.directory?
        mkdir path unless File.directory?(path)
        next
      end

      # TODO(sissel): Submit a patch to archive-tar-minitar upstream to
      # expose headers in the entry.
      entry_mode = entry.instance_eval { @mode } & 0777
      if File.exist?(path)
        stat = File.stat(path)
        entry_size = entry.instance_eval { @size }
        # If size and permissions are the same, skip writing.
        next if stat.size == entry_size && (stat.mode & 0777) == entry_mode
      end

      puts "Extracting #{entry.full_name} from #{tarball} #{entry_mode.to_s(8)}"
      # Binary mode: archive members must be written byte-for-byte.
      File.open(path, "wb") do |fd|
        # eof? check lets us skip empty files. Necessary because the API provided by
        # Archive::Tar::Minitar::Reader::EntryStream only mostly acts like an
        # IO object. Something about empty files in this EntryStream causes
        # IO.copy_stream to throw "can't convert nil into String" on JRuby
        # TODO(sissel): File a bug about this.
        fd.write(entry.read(16384)) until entry.eof?
      end
      File.chmod(entry_mode, path)
    end
  ensure
    # Release the archive handles even when extraction fails part-way.
    tar.close
    tgz.close unless tgz.closed?
  end
  File.unlink(tarball) if File.file?(tarball)
end # def untar
133
+
134
# Decompress the gzip file +file+ next to itself and delete the original.
#
# The output path is +file+ with its trailing ".gz" removed. When
# decompression fails, the partially written output is removed and the error
# is re-raised; the compressed file is kept in that case.
#
# Raises ArgumentError when +file+ does not end in ".gz", because the output
# would otherwise overwrite the input.
def ungz(file)
  require "zlib"

  # Strip only the suffix; a ".gz" elsewhere in the path must be preserved.
  outpath = file.sub(/\.gz\z/, '')
  fail ArgumentError, "not a .gz file: #{file}" if outpath == file

  # The block form closes the reader and its file even when an error occurs.
  Zlib::GzipReader.open(file) do |gz|
    begin
      File.open(outpath, "wb") do |out|
        IO::copy_stream(gz, out)
      end
    rescue
      File.unlink(outpath) if File.file?(outpath)
      raise
    end
  end
  File.unlink(file)
end
149
+
150
desc "Process any vendor files required for this plugin"
# For every descriptor in @files: fetch file['url'] (verified against
# file['sha1']) into vendor/, then unpack ".tar.gz" archives or decompress
# plain ".gz" files. Other downloads are left as fetched.
task "vendor" do |task, args|

  (@files || []).each do |file|
    archive = file_fetch(file['url'], file['sha1'])
    if archive.end_with?('.tar.gz')
      # Archive name without directory and extension, e.g. "foo-1.0".
      prefix = File.basename(archive, '.tar.gz')
      wanted = file['files']
      untar(archive) do |entry|
        if wanted.nil?
          # No filter given: extract every entry, keeping its archive path.
          File.join('vendor', entry.full_name)
        elsif wanted.include?(entry.full_name.gsub(prefix, ''))
          # Listed entries are placed directly in vendor/ under their basename.
          File.join('vendor', entry.full_name.split("/").last)
        end
        # Falling through yields nil, which makes untar skip the entry.
      end
    elsif archive.end_with?('.gz')
      ungz(archive)
    end
  end

end
@@ -0,0 +1,86 @@
1
+ require "spec_helper"
2
+
3
require "stringio" # StringIO stands in for $stdin below

# Specs for the generator input: throughput, a configured message, and a
# message read from stdin.
describe "inputs/generator" do

  context "performance", :performance => true do
    event_count = 100000 + rand(50000)

    config <<-CONFIG
      input {
        generator {
          type => "blah"
          count => #{event_count}
        }
      }
    CONFIG

    input do |pipeline, queue|
      start = Time.now
      Thread.new { pipeline.run }
      event_count.times do |i|
        event = queue.pop
        insist { event["sequence"] } == i
      end
      duration = Time.now - start
      puts "inputs/generator rate: #{"%02.0f/sec" % (event_count / duration)}, elapsed: #{duration}s"
      pipeline.shutdown
    end # input
  end

  context "generate configured message" do
    config <<-CONFIG
      input {
        generator {
          count => 2
          message => "foo"
        }
      }
    CONFIG

    input do |pipeline, queue|
      Thread.new { pipeline.run }
      event = queue.pop
      insist { event["sequence"] } == 0
      insist { event["message"] } == "foo"

      event = queue.pop
      insist { event["sequence"] } == 1
      insist { event["message"] } == "foo"

      insist { queue.size } == 0
      pipeline.shutdown
    end # input
  end

  context "generate message from stdin" do
    config <<-CONFIG
      input {
        generator {
          count => 2
          message => "stdin"
        }
      }
    CONFIG

    input do |pipeline, queue|
      saved_stdin = $stdin
      stdin_mock = StringIO.new
      $stdin = stdin_mock
      begin
        stdin_mock.should_receive(:readline).once.and_return("bar")

        Thread.new { pipeline.run }
        event = queue.pop
        insist { event["sequence"] } == 0
        insist { event["message"] } == "bar"

        event = queue.pop
        insist { event["sequence"] } == 1
        insist { event["message"] } == "bar"

        insist { queue.size } == 0
        pipeline.shutdown
      ensure
        # Always restore the real stdin, even when an expectation fails.
        $stdin = saved_stdin
      end
    end # input
  end
end
metadata ADDED
@@ -0,0 +1,88 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: logstash-input-generator
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - Elasticsearch
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2014-10-30 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: logstash
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ! '>='
18
+ - !ruby/object:Gem::Version
19
+ version: 1.4.0
20
+ - - <
21
+ - !ruby/object:Gem::Version
22
+ version: 2.0.0
23
+ type: :runtime
24
+ prerelease: false
25
+ version_requirements: !ruby/object:Gem::Requirement
26
+ requirements:
27
+ - - ! '>='
28
+ - !ruby/object:Gem::Version
29
+ version: 1.4.0
30
+ - - <
31
+ - !ruby/object:Gem::Version
32
+ version: 2.0.0
33
+ - !ruby/object:Gem::Dependency
34
+ name: logstash-codec-plain
35
+ requirement: !ruby/object:Gem::Requirement
36
+ requirements:
37
+ - - ! '>='
38
+ - !ruby/object:Gem::Version
39
+ version: '0'
40
+ type: :runtime
41
+ prerelease: false
42
+ version_requirements: !ruby/object:Gem::Requirement
43
+ requirements:
44
+ - - ! '>='
45
+ - !ruby/object:Gem::Version
46
+ version: '0'
47
+ description: Generate random log events.
48
+ email: richard.pijnenburg@elasticsearch.com
49
+ executables: []
50
+ extensions: []
51
+ extra_rdoc_files: []
52
+ files:
53
+ - .gitignore
54
+ - Gemfile
55
+ - Rakefile
56
+ - lib/logstash/inputs/generator.rb
57
+ - logstash-input-generator.gemspec
58
+ - rakelib/publish.rake
59
+ - rakelib/vendor.rake
60
+ - spec/inputs/generator_spec.rb
61
+ homepage: http://logstash.net/
62
+ licenses:
63
+ - Apache License (2.0)
64
+ metadata:
65
+ logstash_plugin: 'true'
66
+ group: input
67
+ post_install_message:
68
+ rdoc_options: []
69
+ require_paths:
70
+ - lib
71
+ required_ruby_version: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - ! '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ required_rubygems_version: !ruby/object:Gem::Requirement
77
+ requirements:
78
+ - - ! '>='
79
+ - !ruby/object:Gem::Version
80
+ version: '0'
81
+ requirements: []
82
+ rubyforge_project:
83
+ rubygems_version: 2.4.1
84
+ signing_key:
85
+ specification_version: 4
86
+ summary: Generate random log events.
87
+ test_files:
88
+ - spec/inputs/generator_spec.rb