logstash-codec-plain 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +15 -0
- data/.gitignore +3 -0
- data/Gemfile +4 -0
- data/Rakefile +6 -0
- data/lib/logstash/codecs/plain.rb +48 -0
- data/logstash-codec-plain.gemspec +26 -0
- data/rakelib/publish.rake +9 -0
- data/rakelib/vendor.rake +169 -0
- data/spec/codecs/plain_spec.rb +106 -0
- metadata +74 -0
checksums.yaml
ADDED
@@ -0,0 +1,15 @@
|
|
1
|
+
---
|
2
|
+
!binary "U0hBMQ==":
|
3
|
+
metadata.gz: !binary |-
|
4
|
+
YjVkNDEyYjgxNzQ3OTcxNzI1MDU2N2UzNTUyNmI1YTE2MjZmNDU0OA==
|
5
|
+
data.tar.gz: !binary |-
|
6
|
+
ZDRkNTEwMzdhZWQ5NjYyMTZjZjI0ZTE5MTBhZmRlOTgxNWYwNzM2MQ==
|
7
|
+
SHA512:
|
8
|
+
metadata.gz: !binary |-
|
9
|
+
NTMzNzc2OTM1NzBhNGUzYTIxNDQ4OWU2ZGZkZjMzYzUyMTMzNTVhOWQyMWFj
|
10
|
+
YTY0OGFiMzJhODMzNTIzOGM1NWRiZmM1ZmVjNDJlNzJkNTBhYzY4MGUzNTk3
|
11
|
+
MTAyN2ViYzYxYmIzZjA0YjE5ZmY5MTEzODg5NzhmOGM4N2E5YTk=
|
12
|
+
data.tar.gz: !binary |-
|
13
|
+
ZWU4NTIxMGRjYTkwYWZhYTBiMTk3OWE1MjgxNmU5OWM4MWNhM2MwMGNmNzk3
|
14
|
+
Nzk3ZTk2YTM0MmRkNDBmM2JjZTMwMTNlNjZkZjEwNzNlZTQ4NjgwNWI1Zjcz
|
15
|
+
ZjBhNThmNDlkYjE0MjU0YTY0NmJjYmJlM2IyNTkyMmFmMzhhN2I=
|
data/.gitignore
ADDED
data/Gemfile
ADDED
data/Rakefile
ADDED
@@ -0,0 +1,48 @@
|
|
1
|
+
# encoding: utf-8
|
2
|
+
require "logstash/codecs/base"
|
3
|
+
require "logstash/util/charset"
|
4
|
+
|
5
|
+
# The "plain" codec is for plain text with no delimiting between events.
|
6
|
+
#
|
7
|
+
# This is mainly useful on inputs and outputs that already have a defined
|
8
|
+
# framing in their transport protocol (such as zeromq, rabbitmq, redis, etc)
|
9
|
+
class LogStash::Codecs::Plain < LogStash::Codecs::Base
  config_name "plain"
  milestone 3

  # Set the message you wish to emit for each event. This supports sprintf
  # strings.
  #
  # This setting only affects outputs (encoding of events).
  config :format, :validate => :string

  # The character encoding used in this input. Examples include "UTF-8"
  # and "cp1252"
  #
  # This setting is useful if your log files are in Latin-1 (aka cp1252)
  # or in another character set other than UTF-8.
  #
  # This only affects "plain" format logs since json is UTF-8 already.
  config :charset, :validate => ::Encoding.name_list, :default => "UTF-8"

  # Build the charset converter for the configured `charset` and hand it this
  # codec's logger.
  public
  def register
    @converter = LogStash::Util::Charset.new(@charset)
    @converter.logger = @logger
  end

  # Wrap `data` in a single event and yield it to the caller's block.
  #
  # The event's "message" field is whatever the charset converter returns
  # for `data`.
  public
  def decode(data)
    yield LogStash::Event.new("message" => @converter.convert(data))
  end # def decode

  # Hand the textual form of `event` to the `@on_event` callback.
  #
  # When a `format` is configured and `event` is a LogStash::Event, the
  # format string is expanded with `event.sprintf`; in every other case the
  # callback receives `event.to_s`.
  public
  def encode(event)
    # `&&` rather than `and`: same result here, without the low-precedence trap.
    if event.is_a?(LogStash::Event) && @format
      @on_event.call(event.sprintf(@format))
    else
      @on_event.call(event.to_s)
    end
  end # def encode

end # class LogStash::Codecs::Plain
|
@@ -0,0 +1,26 @@
|
|
1
|
+
# Gem specification for the logstash "plain" codec plugin.
Gem::Specification.new do |s|

  s.name            = 'logstash-codec-plain'
  s.version         = '0.1.0'
  s.licenses        = ['Apache License (2.0)']
  s.summary         = "The plain codec is for plain text with no delimiting between events."
  s.description     = "The plain codec is for plain text with no delimiting between events."
  s.authors         = ["Elasticsearch"]
  s.email           = 'richard.pijnenburg@elasticsearch.com'
  s.homepage        = "http://logstash.net/"
  s.require_paths = ["lib"]

  # Files
  # `git ls-files` prints one path per line, so split on the newline
  # explicitly. The previous separator, `$\`, is nil unless it has been
  # assigned, and String#split with a nil pattern splits on any whitespace,
  # which breaks paths that contain spaces.
  s.files = `git ls-files`.split("\n")

  # Tests
  s.test_files = s.files.grep(%r{^(test|spec|features)/})

  # Special flag to let us know this is actually a logstash plugin
  s.metadata = { "logstash_plugin" => "true", "group" => "codec" }

  # Gem dependencies
  s.add_runtime_dependency 'logstash', '>= 1.4.0', '< 2.0.0'

end
|
26
|
+
|
@@ -0,0 +1,9 @@
|
|
1
|
+
require "gem_publisher"
|
2
|
+
|
3
|
+
desc "Publish gem to RubyGems.org"
task :publish_gem do
  # Look for the gemspec in the parent of the directory holding this rake file.
  gemspec_pattern = File.expand_path('../*.gemspec', File.dirname(__FILE__))
  gemspec = Dir.glob(gemspec_pattern).first

  # Dir.glob returns an empty list when nothing matches; stop with a clear
  # message instead of handing nil to the publisher.
  fail "No gemspec found matching #{gemspec_pattern}" if gemspec.nil?

  gem = GemPublisher.publish_if_updated(gemspec, :rubygems)
  # Only report when the publisher returned something truthy.
  puts "Published #{gem}" if gem
end
|
9
|
+
|
data/rakelib/vendor.rake
ADDED
@@ -0,0 +1,169 @@
|
|
1
|
+
require "net/http"
|
2
|
+
require "uri"
|
3
|
+
require "digest/sha1"
|
4
|
+
|
5
|
+
# Join the given path components underneath the "vendor" directory.
#
# Returns the joined path as a String; with no components it is "vendor".
def vendor(*args)
  File.join("vendor", *args)
end
|
8
|
+
|
9
|
+
# Rake directory task for "vendor/". It lists the "vendor" task as a
# prerequisite and runs mkdir on its own task name.
directory "vendor/" => ["vendor"] do |dir_task, _args|
  mkdir dir_task.name
end
|
12
|
+
|
13
|
+
# Download `url` to `output` and check the digest reported by the download.
#
# Prints a progress line first, then fails with a message naming both digests
# when the downloaded content's SHA1 differs from `sha1`.
def fetch(url, sha1, output)
  puts "Downloading #{url}"
  digest = download(url, output)
  return if digest == sha1

  fail "SHA1 does not match (expected '#{sha1}' but got '#{digest}')"
end # def fetch
|
22
|
+
|
23
|
+
# Make sure the file named by `url` exists under vendor/ with the expected
# SHA1, downloading it when it is missing or its digest differs.
#
# The work is wrapped in a rake task named after the output path (with
# "vendor/" as prerequisite) and that task is invoked immediately.
#
# url  - location of the file; the basename of its path becomes the file name
# sha1 - expected SHA1 hex digest of the file
#
# Returns the output path ("vendor/<basename>").
def file_fetch(url, sha1)
  filename = File.basename(URI(url).path)
  output = "vendor/#{filename}"
  task output => ["vendor/"] do
    # Only the digest check is guarded by the rescue: a missing file simply
    # means "not downloaded yet". Keeping the fetch outside of it ensures an
    # Errno::ENOENT raised while fetching is reported instead of silently
    # starting a second download.
    up_to_date = begin
      file_sha1(output) == sha1
    rescue Errno::ENOENT
      false
    end
    fetch(url, sha1, output) unless up_to_date
  end.invoke

  return output
end
|
39
|
+
|
40
|
+
# Compute the SHA1 hex digest of the file at `path`.
#
# Digest::SHA1.file reads the file in binary mode and in chunks, so the
# digest covers the exact bytes on disk and the handle is always closed.
#
# Raises Errno::ENOENT when the file does not exist.
def file_sha1(path)
  Digest::SHA1.file(path).hexdigest
end
|
54
|
+
|
55
|
+
# Download `url` over HTTP(S) into `output` and return the SHA1 hex digest of
# the bytes received.
#
# The body is streamed into "<output>.tmp" and renamed to `output` only after
# the transfer finished; the temporary file is removed on every exit path.
# When $stdout is a terminal and the server sent a content-length, a
# percentage is printed while downloading.
#
# Raises RuntimeError when the response status is not in the accepted list,
# and re-raises SocketError after printing a message.
def download(url, output)
  # Assigned first so the ensure clause always has a usable value.
  tmp = "#{output}.tmp"
  uri = URI(url)
  digest = Digest::SHA1.new
  Net::HTTP.start(uri.host, uri.port, :use_ssl => (uri.scheme == "https")) do |http|
    # request_uri keeps the query string (and yields "/" for an empty path).
    request = Net::HTTP::Get.new(uri.request_uri)
    http.request(request) do |response|
      # response.code is a String, and the request must fail when the status
      # is NOT one of the accepted codes. Redirects are not followed here.
      unless ["200", "301"].include?(response.code)
        fail "HTTP fetch failed for #{url}. #{response}"
      end
      # A missing content-length header becomes 0.0, which disables the
      # progress output below.
      size = response["content-length"].to_i.to_f
      count = 0
      # Binary mode: the payload must reach the disk byte for byte.
      File.open(tmp, "wb") do |fd|
        response.read_body do |chunk|
          fd.write(chunk)
          digest << chunk
          if size > 0 && $stdout.tty?
            count += chunk.bytesize
            $stdout.write(sprintf("\r%0.2f%%", count/size * 100))
          end
        end
      end
      $stdout.write("\r \r") if $stdout.tty?
    end
  end

  File.rename(tmp, output)

  return digest.hexdigest
rescue SocketError => e
  puts "Failure while downloading #{url}: #{e}"
  raise
ensure
  File.unlink(tmp) if tmp && File.exist?(tmp)
end # def download
|
88
|
+
|
89
|
+
# Extract entries from the gzip-compressed tar archive `tarball`.
#
# The block is called with every archive entry and returns the destination
# path for it, or nil to skip the entry. Parent directories are created as
# needed. A regular file is left untouched when a file of the same size and
# permission bits already exists at the destination. After a successful run
# the tarball itself is deleted.
def untar(tarball, &block)
  require "zlib"
  require "archive/tar/minitar"
  # Binary mode: the archive must be read byte for byte.
  tgz = Zlib::GzipReader.new(File.open(tarball, "rb"))
  tar = Archive::Tar::Minitar::Input.open(tgz)
  begin
    tar.each do |entry|
      path = block.call(entry)
      next if path.nil?
      parent = File.dirname(path)

      mkdir_p parent unless File.directory?(parent)

      if entry.directory?
        mkdir path unless File.directory?(path)
      else
        # Keep only the permission bits of the mode recorded in the archive.
        entry_mode = entry.instance_eval { @mode } & 0777
        # File.exist? instead of File.exists?, which was removed in Ruby 3.2.
        if File.exist?(path)
          stat = File.stat(path)
          # TODO(sissel): Submit a patch to archive-tar-minitar upstream to
          # expose headers in the entry.
          entry_size = entry.instance_eval { @size }
          # If file size and permissions are the same, skip writing.
          next if stat.size == entry_size && (stat.mode & 0777) == entry_mode
        end
        puts "Extracting #{entry.full_name} from #{tarball} #{entry_mode.to_s(8)}"
        File.open(path, "wb") do |fd|
          # eof? check lets us skip empty files. Necessary because the API provided by
          # Archive::Tar::Minitar::Reader::EntryStream only mostly acts like an
          # IO object. Something about empty files in this EntryStream causes
          # IO.copy_stream to throw "can't convert nil into String" on JRuby
          # TODO(sissel): File a bug about this.
          while !entry.eof?
            chunk = entry.read(16384)
            fd.write(chunk)
          end
          #IO.copy_stream(entry, fd)
        end
        File.chmod(entry_mode, path)
      end
    end
  ensure
    # Close the reader even when extraction fails part-way.
    tar.close
  end
  File.unlink(tarball) if File.file?(tarball)
end # def untar
|
133
|
+
|
134
|
+
# Decompress the gzip file `file` next to itself and delete the original.
#
# The output path is `file` without its trailing ".gz". If decompression
# fails, the partially written output is removed and the error re-raised.
#
# Raises ArgumentError when `file` does not end in ".gz"; the output path
# would then equal the input and opening it for writing would destroy it.
def ungz(file)
  require "zlib"

  # Strip only the trailing suffix; a ".gz" elsewhere in the path stays.
  outpath = file.sub(/\.gz\z/, '')
  if outpath == file
    fail ArgumentError, "Cannot gunzip #{file}: name does not end in .gz"
  end

  tgz = Zlib::GzipReader.new(File.open(file, "rb"))
  begin
    begin
      File.open(outpath, "wb") do |out|
        IO::copy_stream(tgz, out)
      end
    ensure
      # Always release the reader, also when copying fails.
      tgz.close
    end
    File.unlink(file)
  rescue
    File.unlink(outpath) if File.file?(outpath)
    raise
  end
end
|
149
|
+
|
150
|
+
desc "Process any vendor files required for this plugin"
task "vendor" do
  # Each entry of @files is read as a hash with 'url', 'sha1' and an optional
  # 'files' list. NOTE(review): @files is presumably assigned by the including
  # Rakefile - confirm. An unset @files is treated as "nothing to vendor".
  (@files || []).each do |file|
    fetched = file_fetch(file['url'], file['sha1'])
    # Dots are escaped and the match is anchored at the end so that only real
    # ".tar.gz" / ".gz" suffixes select a branch.
    if fetched =~ /\.tar\.gz\z/
      prefix = fetched.gsub('.tar.gz', '').gsub('vendor/', '')
      untar(fetched) do |entry|
        # With a 'files' list, only the listed entries (named relative to the
        # archive prefix) are extracted; returning nil skips the entry.
        unless file['files'].nil?
          next unless file['files'].include?(entry.full_name.gsub(prefix, ''))
        end
        # The destination is computed for every entry. It used to be set only
        # when a 'files' list was present, so File.join received nil and
        # raised TypeError without one.
        # NOTE(review): unfiltered archives are flattened into vendor/ like
        # filtered ones - confirm this is the intended layout.
        File.join('vendor', entry.full_name.split("/").last)
      end
    elsif fetched =~ /\.gz\z/
      ungz(fetched)
    end
  end
end
|
@@ -0,0 +1,106 @@
|
|
1
|
+
# encoding: utf-8
|
2
|
+
|
3
|
+
require "logstash/codecs/plain"
|
4
|
+
require "logstash/event"
|
5
|
+
require "insist"
|
6
|
+
|
7
|
+
# Specs for the plain codec: decoding with the default and with explicit
# charsets, and encoding with and without a format string.
describe LogStash::Codecs::Plain do
  context "#decode" do
    it "should return a valid event" do
      subject.decode("Testing decoding.") do |event|
        # insist needs a comparator to assert anything; a bare
        # `insist { ... }` builds the expectation and never checks it.
        insist { event.is_a?(LogStash::Event) } == true
      end
    end

    context "using default UTF-8 charset" do

      it "should decode valid UTF-8 input" do
        ["foobar", "κόσμε"].each do |data|
          insist { data.encoding.name } == "UTF-8"
          insist { data.valid_encoding? } == true
          subject.decode(data) do |event|
            insist { event["message"] } == data
            insist { event["message"].encoding.name } == "UTF-8"
          end
        end
      end

      it "should escape invalid sequences" do
        ["foo \xED\xB9\x81\xC3", "bar \xAD"].each do |data|
          insist { data.encoding.name } == "UTF-8"
          insist { data.valid_encoding? } == false
          subject.decode(data) do |event|
            # The expected message is the inspected string without its quotes.
            insist { event["message"] } == data.inspect[1..-2]
            insist { event["message"].encoding.name } == "UTF-8"
          end
        end
      end
    end


    context "with valid non UTF-8 source encoding" do

      subject{LogStash::Codecs::Plain.new("charset" => "ISO-8859-1")}

      it "should encode to UTF-8" do
        samples = [
          ["foobar", "foobar"],
          ["\xE0 Montr\xE9al", "à Montréal"],
        ]
        samples.map{|(a, b)| [a.force_encoding("ISO-8859-1"), b]}.each do |(a, b)|
          insist { a.encoding.name } == "ISO-8859-1"
          insist { b.encoding.name } == "UTF-8"
          insist { a.valid_encoding? } == true

          subject.decode(a) do |event|
            insist { event["message"] } == b
            insist { event["message"].encoding.name } == "UTF-8"
          end
        end
      end
    end

    context "with invalid non UTF-8 source encoding" do

      subject{LogStash::Codecs::Plain.new("charset" => "ASCII-8BIT")}

      it "should encode to UTF-8" do
        samples = [
          ["\xE0 Montr\xE9al", "� Montr�al"],
          ["\xCE\xBA\xCF\x8C\xCF\x83\xCE\xBC\xCE\xB5", "����������"],
        ]
        samples.map{|(a, b)| [a.force_encoding("ASCII-8BIT"), b]}.each do |(a, b)|
          insist { a.encoding.name } == "ASCII-8BIT"
          insist { b.encoding.name } == "UTF-8"
          insist { a.valid_encoding? } == true

          subject.decode(a) do |event|
            insist { event["message"] } == b
            insist { event["message"].encoding.name } == "UTF-8"
          end
        end
      end
    end
  end

  context "#encode" do
    it "should return a plain text encoding" do
      event = LogStash::Event.new
      event["message"] = "Hello World."
      subject.on_event do |data|
        insist { data } == event.to_s
      end
      subject.encode(event)
    end

    it "should respect the format setting" do
      format = "%{[hello]} %{[something][fancy]}"
      codec = LogStash::Codecs::Plain.new("format" => format)
      event = LogStash::Event.new("hello" => "world", "something" => { "fancy" => 123 })
      codec.on_event do |data|
        insist { data } == event.sprintf(format)
      end
      codec.encode(event)
    end
  end
end
|
metadata
ADDED
@@ -0,0 +1,74 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: logstash-codec-plain
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.1.0
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Elasticsearch
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2014-10-30 00:00:00.000000000 Z
|
12
|
+
dependencies:
|
13
|
+
- !ruby/object:Gem::Dependency
|
14
|
+
name: logstash
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
16
|
+
requirements:
|
17
|
+
- - ! '>='
|
18
|
+
- !ruby/object:Gem::Version
|
19
|
+
version: 1.4.0
|
20
|
+
- - <
|
21
|
+
- !ruby/object:Gem::Version
|
22
|
+
version: 2.0.0
|
23
|
+
type: :runtime
|
24
|
+
prerelease: false
|
25
|
+
version_requirements: !ruby/object:Gem::Requirement
|
26
|
+
requirements:
|
27
|
+
- - ! '>='
|
28
|
+
- !ruby/object:Gem::Version
|
29
|
+
version: 1.4.0
|
30
|
+
- - <
|
31
|
+
- !ruby/object:Gem::Version
|
32
|
+
version: 2.0.0
|
33
|
+
description: The plain codec is for plain text with no delimiting between events.
|
34
|
+
email: richard.pijnenburg@elasticsearch.com
|
35
|
+
executables: []
|
36
|
+
extensions: []
|
37
|
+
extra_rdoc_files: []
|
38
|
+
files:
|
39
|
+
- .gitignore
|
40
|
+
- Gemfile
|
41
|
+
- Rakefile
|
42
|
+
- lib/logstash/codecs/plain.rb
|
43
|
+
- logstash-codec-plain.gemspec
|
44
|
+
- rakelib/publish.rake
|
45
|
+
- rakelib/vendor.rake
|
46
|
+
- spec/codecs/plain_spec.rb
|
47
|
+
homepage: http://logstash.net/
|
48
|
+
licenses:
|
49
|
+
- Apache License (2.0)
|
50
|
+
metadata:
|
51
|
+
logstash_plugin: 'true'
|
52
|
+
group: codec
|
53
|
+
post_install_message:
|
54
|
+
rdoc_options: []
|
55
|
+
require_paths:
|
56
|
+
- lib
|
57
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
58
|
+
requirements:
|
59
|
+
- - ! '>='
|
60
|
+
- !ruby/object:Gem::Version
|
61
|
+
version: '0'
|
62
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
63
|
+
requirements:
|
64
|
+
- - ! '>='
|
65
|
+
- !ruby/object:Gem::Version
|
66
|
+
version: '0'
|
67
|
+
requirements: []
|
68
|
+
rubyforge_project:
|
69
|
+
rubygems_version: 2.4.1
|
70
|
+
signing_key:
|
71
|
+
specification_version: 4
|
72
|
+
summary: The plain codec is for plain text with no delimiting between events.
|
73
|
+
test_files:
|
74
|
+
- spec/codecs/plain_spec.rb
|