logstash-input-s3 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +5 -13
- data/Gemfile +3 -4
- data/Rakefile +1 -0
- data/lib/logstash/inputs/s3.rb +6 -5
- data/logstash-input-s3.gemspec +7 -6
- data/spec/inputs/s3_spec.rb +1 -1
- metadata +54 -28
- data/rakelib/publish.rake +0 -9
- data/rakelib/vendor.rake +0 -169
checksums.yaml
CHANGED
|
@@ -1,15 +1,7 @@
|
|
|
1
1
|
---
|
|
2
|
-
|
|
3
|
-
metadata.gz:
|
|
4
|
-
|
|
5
|
-
data.tar.gz: !binary |-
|
|
6
|
-
YzlhZWI4NGMyZTY1N2E0Njk5M2Y3NjI1YTIwNzYyNWJhM2QzZDI2ZQ==
|
|
2
|
+
SHA1:
|
|
3
|
+
metadata.gz: 18491f4d5a8850a30b8bd5b25c33cc2a0dd9c247
|
|
4
|
+
data.tar.gz: c3017df48dd6ea484f8afb81e77d5b1e085d9d11
|
|
7
5
|
SHA512:
|
|
8
|
-
metadata.gz:
|
|
9
|
-
|
|
10
|
-
NmFhMzMyZmY2MTkwZWM3Y2ZlZDhiYzQ1NThhNzQ2ODgyYThjNzFiNDhkMmE3
|
|
11
|
-
Zjc5N2U2ODlkYmYwM2RiZmQ4Y2I0OGVmZTc0YTdhN2IzMGI3YmU=
|
|
12
|
-
data.tar.gz: !binary |-
|
|
13
|
-
NjI1NmFiOTY1ZWNiNGZiZTQ4YjE4ZjFiNGY3ZjU3MGU1NDgwYTQyODI0YTEx
|
|
14
|
-
MGNkMjA5MGNmNTdmNTJlNDAyNjlhODc4ZDkzYWFkNWM4MzU3ZTJmZjZlZDdk
|
|
15
|
-
Y2I5ODIxM2RiYmEwNTA4ZmU5ZGQyN2YxZjMzNjc4NzEyYWM3NmM=
|
|
6
|
+
metadata.gz: 8d112c0f09cbfe563eebce342812e8082b125b660560a250971b81a16d12584cad7303cc2b8b37fd2c6dfb2d64a0b44b44b843e133a22cde89971b1568bc38f8
|
|
7
|
+
data.tar.gz: ecec7bab79976f09f84f72b516ebe95dfbc6e07998f23ff581e17e275ab994259707e311aed5441bb38be5557bbed8ca377abfeb41f701fdcd8e79716954a51e
|
data/Gemfile
CHANGED
|
@@ -1,4 +1,3 @@
|
|
|
1
|
-
source '
|
|
2
|
-
|
|
3
|
-
gem
|
|
4
|
-
gem 'archive-tar-minitar'
|
|
1
|
+
source 'https://rubygems.org'
|
|
2
|
+
gemspec
|
|
3
|
+
gem "logstash", :github => "elasticsearch/logstash", :branch => "1.5"
|
data/Rakefile
CHANGED
data/lib/logstash/inputs/s3.rb
CHANGED
|
@@ -8,20 +8,20 @@ require "tmpdir"
|
|
|
8
8
|
# Stream events from files from a S3 bucket.
|
|
9
9
|
#
|
|
10
10
|
# Each line from each file generates an event.
|
|
11
|
-
# Files ending in
|
|
11
|
+
# Files ending in `.gz` are handled as gzip'ed files.
|
|
12
12
|
class LogStash::Inputs::S3 < LogStash::Inputs::Base
|
|
13
13
|
config_name "s3"
|
|
14
14
|
milestone 1
|
|
15
15
|
|
|
16
|
-
# TODO(sissel): refactor to use
|
|
16
|
+
# TODO(sissel): refactor to use `line` codec (requires removing both gzip
|
|
17
17
|
# support and readline usage). Support gzip through a gzip codec! ;)
|
|
18
18
|
default :codec, "plain"
|
|
19
19
|
|
|
20
20
|
# The credentials of the AWS account used to access the bucket.
|
|
21
21
|
# Credentials can be specified:
|
|
22
|
-
# - As an ["id","secret"] array
|
|
23
|
-
# - As a path to a file containing AWS_ACCESS_KEY_ID
|
|
24
|
-
# - In the environment, if not set (using variables AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY)
|
|
22
|
+
# - As an `["id","secret"]` array
|
|
23
|
+
# - As a path to a file containing `AWS_ACCESS_KEY_ID=...` and `AWS_SECRET_ACCESS_KEY=...`
|
|
24
|
+
# - In the environment, if not set (using variables `AWS_ACCESS_KEY_ID` and `AWS_SECRET_ACCESS_KEY`)
|
|
25
25
|
config :credentials, :validate => :array, :default => []
|
|
26
26
|
|
|
27
27
|
# The name of the S3 bucket.
|
|
@@ -44,6 +44,7 @@ class LogStash::Inputs::S3 < LogStash::Inputs::Base
|
|
|
44
44
|
# Where to write the since database (keeps track of the date
|
|
45
45
|
# the last handled file was added to S3). The default will write
|
|
46
46
|
# sincedb files to some path matching "$HOME/.sincedb*"
|
|
47
|
+
# Should be a path with filename not just a directory.
|
|
47
48
|
config :sincedb_path, :validate => :string, :default => nil
|
|
48
49
|
|
|
49
50
|
# Name of a S3 bucket to backup processed files to.
|
data/logstash-input-s3.gemspec
CHANGED
|
@@ -1,13 +1,13 @@
|
|
|
1
1
|
Gem::Specification.new do |s|
|
|
2
2
|
|
|
3
3
|
s.name = 'logstash-input-s3'
|
|
4
|
-
s.version = '0.1.
|
|
4
|
+
s.version = '0.1.1'
|
|
5
5
|
s.licenses = ['Apache License (2.0)']
|
|
6
6
|
s.summary = "Stream events from files from a S3 bucket."
|
|
7
|
-
s.description = "
|
|
7
|
+
s.description = "This gem is a logstash plugin required to be installed on top of the Logstash core pipeline using $LS_HOME/bin/plugin install gemname. This gem is not a stand-alone program"
|
|
8
8
|
s.authors = ["Elasticsearch"]
|
|
9
|
-
s.email = '
|
|
10
|
-
s.homepage = "http://logstash.
|
|
9
|
+
s.email = 'info@elasticsearch.com'
|
|
10
|
+
s.homepage = "http://www.elasticsearch.org/guide/en/logstash/current/index.html"
|
|
11
11
|
s.require_paths = ["lib"]
|
|
12
12
|
|
|
13
13
|
# Files
|
|
@@ -17,13 +17,14 @@ Gem::Specification.new do |s|
|
|
|
17
17
|
s.test_files = s.files.grep(%r{^(test|spec|features)/})
|
|
18
18
|
|
|
19
19
|
# Special flag to let us know this is actually a logstash plugin
|
|
20
|
-
s.metadata = { "logstash_plugin" => "true", "
|
|
20
|
+
s.metadata = { "logstash_plugin" => "true", "logstash_group" => "input" }
|
|
21
21
|
|
|
22
22
|
# Gem dependencies
|
|
23
23
|
s.add_runtime_dependency 'logstash', '>= 1.4.0', '< 2.0.0'
|
|
24
|
-
|
|
24
|
+
s.add_runtime_dependency 'logstash-mixin-aws'
|
|
25
25
|
s.add_runtime_dependency 'logstash-codec-plain'
|
|
26
26
|
s.add_runtime_dependency 'aws-sdk'
|
|
27
27
|
|
|
28
|
+
s.add_development_dependency 'logstash-devutils'
|
|
28
29
|
end
|
|
29
30
|
|
data/spec/inputs/s3_spec.rb
CHANGED
metadata
CHANGED
|
@@ -1,65 +1,93 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: logstash-input-s3
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.1.
|
|
4
|
+
version: 0.1.1
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Elasticsearch
|
|
8
|
-
autorequire:
|
|
8
|
+
autorequire:
|
|
9
9
|
bindir: bin
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2014-11-
|
|
11
|
+
date: 2014-11-19 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: logstash
|
|
15
|
-
|
|
15
|
+
version_requirements: !ruby/object:Gem::Requirement
|
|
16
16
|
requirements:
|
|
17
|
-
- -
|
|
17
|
+
- - '>='
|
|
18
18
|
- !ruby/object:Gem::Version
|
|
19
19
|
version: 1.4.0
|
|
20
20
|
- - <
|
|
21
21
|
- !ruby/object:Gem::Version
|
|
22
22
|
version: 2.0.0
|
|
23
|
-
|
|
24
|
-
prerelease: false
|
|
25
|
-
version_requirements: !ruby/object:Gem::Requirement
|
|
23
|
+
requirement: !ruby/object:Gem::Requirement
|
|
26
24
|
requirements:
|
|
27
|
-
- -
|
|
25
|
+
- - '>='
|
|
28
26
|
- !ruby/object:Gem::Version
|
|
29
27
|
version: 1.4.0
|
|
30
28
|
- - <
|
|
31
29
|
- !ruby/object:Gem::Version
|
|
32
30
|
version: 2.0.0
|
|
31
|
+
prerelease: false
|
|
32
|
+
type: :runtime
|
|
33
33
|
- !ruby/object:Gem::Dependency
|
|
34
|
-
name: logstash-
|
|
34
|
+
name: logstash-mixin-aws
|
|
35
|
+
version_requirements: !ruby/object:Gem::Requirement
|
|
36
|
+
requirements:
|
|
37
|
+
- - '>='
|
|
38
|
+
- !ruby/object:Gem::Version
|
|
39
|
+
version: '0'
|
|
35
40
|
requirement: !ruby/object:Gem::Requirement
|
|
36
41
|
requirements:
|
|
37
|
-
- -
|
|
42
|
+
- - '>='
|
|
38
43
|
- !ruby/object:Gem::Version
|
|
39
44
|
version: '0'
|
|
40
|
-
type: :runtime
|
|
41
45
|
prerelease: false
|
|
46
|
+
type: :runtime
|
|
47
|
+
- !ruby/object:Gem::Dependency
|
|
48
|
+
name: logstash-codec-plain
|
|
42
49
|
version_requirements: !ruby/object:Gem::Requirement
|
|
43
50
|
requirements:
|
|
44
|
-
- -
|
|
51
|
+
- - '>='
|
|
45
52
|
- !ruby/object:Gem::Version
|
|
46
53
|
version: '0'
|
|
54
|
+
requirement: !ruby/object:Gem::Requirement
|
|
55
|
+
requirements:
|
|
56
|
+
- - '>='
|
|
57
|
+
- !ruby/object:Gem::Version
|
|
58
|
+
version: '0'
|
|
59
|
+
prerelease: false
|
|
60
|
+
type: :runtime
|
|
47
61
|
- !ruby/object:Gem::Dependency
|
|
48
62
|
name: aws-sdk
|
|
63
|
+
version_requirements: !ruby/object:Gem::Requirement
|
|
64
|
+
requirements:
|
|
65
|
+
- - '>='
|
|
66
|
+
- !ruby/object:Gem::Version
|
|
67
|
+
version: '0'
|
|
49
68
|
requirement: !ruby/object:Gem::Requirement
|
|
50
69
|
requirements:
|
|
51
|
-
- -
|
|
70
|
+
- - '>='
|
|
52
71
|
- !ruby/object:Gem::Version
|
|
53
72
|
version: '0'
|
|
54
|
-
type: :runtime
|
|
55
73
|
prerelease: false
|
|
74
|
+
type: :runtime
|
|
75
|
+
- !ruby/object:Gem::Dependency
|
|
76
|
+
name: logstash-devutils
|
|
56
77
|
version_requirements: !ruby/object:Gem::Requirement
|
|
57
78
|
requirements:
|
|
58
|
-
- -
|
|
79
|
+
- - '>='
|
|
80
|
+
- !ruby/object:Gem::Version
|
|
81
|
+
version: '0'
|
|
82
|
+
requirement: !ruby/object:Gem::Requirement
|
|
83
|
+
requirements:
|
|
84
|
+
- - '>='
|
|
59
85
|
- !ruby/object:Gem::Version
|
|
60
86
|
version: '0'
|
|
61
|
-
|
|
62
|
-
|
|
87
|
+
prerelease: false
|
|
88
|
+
type: :development
|
|
89
|
+
description: This gem is a logstash plugin required to be installed on top of the Logstash core pipeline using $LS_HOME/bin/plugin install gemname. This gem is not a stand-alone program
|
|
90
|
+
email: info@elasticsearch.com
|
|
63
91
|
executables: []
|
|
64
92
|
extensions: []
|
|
65
93
|
extra_rdoc_files: []
|
|
@@ -70,33 +98,31 @@ files:
|
|
|
70
98
|
- Rakefile
|
|
71
99
|
- lib/logstash/inputs/s3.rb
|
|
72
100
|
- logstash-input-s3.gemspec
|
|
73
|
-
- rakelib/publish.rake
|
|
74
|
-
- rakelib/vendor.rake
|
|
75
101
|
- spec/inputs/s3_spec.rb
|
|
76
|
-
homepage: http://logstash.
|
|
102
|
+
homepage: http://www.elasticsearch.org/guide/en/logstash/current/index.html
|
|
77
103
|
licenses:
|
|
78
104
|
- Apache License (2.0)
|
|
79
105
|
metadata:
|
|
80
106
|
logstash_plugin: 'true'
|
|
81
|
-
|
|
82
|
-
post_install_message:
|
|
107
|
+
logstash_group: input
|
|
108
|
+
post_install_message:
|
|
83
109
|
rdoc_options: []
|
|
84
110
|
require_paths:
|
|
85
111
|
- lib
|
|
86
112
|
required_ruby_version: !ruby/object:Gem::Requirement
|
|
87
113
|
requirements:
|
|
88
|
-
- -
|
|
114
|
+
- - '>='
|
|
89
115
|
- !ruby/object:Gem::Version
|
|
90
116
|
version: '0'
|
|
91
117
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
92
118
|
requirements:
|
|
93
|
-
- -
|
|
119
|
+
- - '>='
|
|
94
120
|
- !ruby/object:Gem::Version
|
|
95
121
|
version: '0'
|
|
96
122
|
requirements: []
|
|
97
|
-
rubyforge_project:
|
|
98
|
-
rubygems_version: 2.
|
|
99
|
-
signing_key:
|
|
123
|
+
rubyforge_project:
|
|
124
|
+
rubygems_version: 2.2.2
|
|
125
|
+
signing_key:
|
|
100
126
|
specification_version: 4
|
|
101
127
|
summary: Stream events from files from a S3 bucket.
|
|
102
128
|
test_files:
|
data/rakelib/publish.rake
DELETED
|
@@ -1,9 +0,0 @@
|
|
|
1
|
-
require "gem_publisher"
|
|
2
|
-
|
|
3
|
-
desc "Publish gem to RubyGems.org"
|
|
4
|
-
task :publish_gem do |t|
|
|
5
|
-
gem_file = Dir.glob(File.expand_path('../*.gemspec',File.dirname(__FILE__))).first
|
|
6
|
-
gem = GemPublisher.publish_if_updated(gem_file, :rubygems)
|
|
7
|
-
puts "Published #{gem}" if gem
|
|
8
|
-
end
|
|
9
|
-
|
data/rakelib/vendor.rake
DELETED
|
@@ -1,169 +0,0 @@
|
|
|
1
|
-
require "net/http"
|
|
2
|
-
require "uri"
|
|
3
|
-
require "digest/sha1"
|
|
4
|
-
|
|
5
|
-
def vendor(*args)
|
|
6
|
-
return File.join("vendor", *args)
|
|
7
|
-
end
|
|
8
|
-
|
|
9
|
-
directory "vendor/" => ["vendor"] do |task, args|
|
|
10
|
-
mkdir task.name
|
|
11
|
-
end
|
|
12
|
-
|
|
13
|
-
def fetch(url, sha1, output)
|
|
14
|
-
|
|
15
|
-
puts "Downloading #{url}"
|
|
16
|
-
actual_sha1 = download(url, output)
|
|
17
|
-
|
|
18
|
-
if actual_sha1 != sha1
|
|
19
|
-
fail "SHA1 does not match (expected '#{sha1}' but got '#{actual_sha1}')"
|
|
20
|
-
end
|
|
21
|
-
end # def fetch
|
|
22
|
-
|
|
23
|
-
def file_fetch(url, sha1)
|
|
24
|
-
filename = File.basename( URI(url).path )
|
|
25
|
-
output = "vendor/#{filename}"
|
|
26
|
-
task output => [ "vendor/" ] do
|
|
27
|
-
begin
|
|
28
|
-
actual_sha1 = file_sha1(output)
|
|
29
|
-
if actual_sha1 != sha1
|
|
30
|
-
fetch(url, sha1, output)
|
|
31
|
-
end
|
|
32
|
-
rescue Errno::ENOENT
|
|
33
|
-
fetch(url, sha1, output)
|
|
34
|
-
end
|
|
35
|
-
end.invoke
|
|
36
|
-
|
|
37
|
-
return output
|
|
38
|
-
end
|
|
39
|
-
|
|
40
|
-
def file_sha1(path)
|
|
41
|
-
digest = Digest::SHA1.new
|
|
42
|
-
fd = File.new(path, "r")
|
|
43
|
-
while true
|
|
44
|
-
begin
|
|
45
|
-
digest << fd.sysread(16384)
|
|
46
|
-
rescue EOFError
|
|
47
|
-
break
|
|
48
|
-
end
|
|
49
|
-
end
|
|
50
|
-
return digest.hexdigest
|
|
51
|
-
ensure
|
|
52
|
-
fd.close if fd
|
|
53
|
-
end
|
|
54
|
-
|
|
55
|
-
def download(url, output)
|
|
56
|
-
uri = URI(url)
|
|
57
|
-
digest = Digest::SHA1.new
|
|
58
|
-
tmp = "#{output}.tmp"
|
|
59
|
-
Net::HTTP.start(uri.host, uri.port, :use_ssl => (uri.scheme == "https")) do |http|
|
|
60
|
-
request = Net::HTTP::Get.new(uri.path)
|
|
61
|
-
http.request(request) do |response|
|
|
62
|
-
fail "HTTP fetch failed for #{url}. #{response}" if [200, 301].include?(response.code)
|
|
63
|
-
size = (response["content-length"].to_i || -1).to_f
|
|
64
|
-
count = 0
|
|
65
|
-
File.open(tmp, "w") do |fd|
|
|
66
|
-
response.read_body do |chunk|
|
|
67
|
-
fd.write(chunk)
|
|
68
|
-
digest << chunk
|
|
69
|
-
if size > 0 && $stdout.tty?
|
|
70
|
-
count += chunk.bytesize
|
|
71
|
-
$stdout.write(sprintf("\r%0.2f%%", count/size * 100))
|
|
72
|
-
end
|
|
73
|
-
end
|
|
74
|
-
end
|
|
75
|
-
$stdout.write("\r \r") if $stdout.tty?
|
|
76
|
-
end
|
|
77
|
-
end
|
|
78
|
-
|
|
79
|
-
File.rename(tmp, output)
|
|
80
|
-
|
|
81
|
-
return digest.hexdigest
|
|
82
|
-
rescue SocketError => e
|
|
83
|
-
puts "Failure while downloading #{url}: #{e}"
|
|
84
|
-
raise
|
|
85
|
-
ensure
|
|
86
|
-
File.unlink(tmp) if File.exist?(tmp)
|
|
87
|
-
end # def download
|
|
88
|
-
|
|
89
|
-
def untar(tarball, &block)
|
|
90
|
-
require "archive/tar/minitar"
|
|
91
|
-
tgz = Zlib::GzipReader.new(File.open(tarball))
|
|
92
|
-
# Pull out typesdb
|
|
93
|
-
tar = Archive::Tar::Minitar::Input.open(tgz)
|
|
94
|
-
tar.each do |entry|
|
|
95
|
-
path = block.call(entry)
|
|
96
|
-
next if path.nil?
|
|
97
|
-
parent = File.dirname(path)
|
|
98
|
-
|
|
99
|
-
mkdir_p parent unless File.directory?(parent)
|
|
100
|
-
|
|
101
|
-
# Skip this file if the output file is the same size
|
|
102
|
-
if entry.directory?
|
|
103
|
-
mkdir path unless File.directory?(path)
|
|
104
|
-
else
|
|
105
|
-
entry_mode = entry.instance_eval { @mode } & 0777
|
|
106
|
-
if File.exists?(path)
|
|
107
|
-
stat = File.stat(path)
|
|
108
|
-
# TODO(sissel): Submit a patch to archive-tar-minitar upstream to
|
|
109
|
-
# expose headers in the entry.
|
|
110
|
-
entry_size = entry.instance_eval { @size }
|
|
111
|
-
# If file sizes are same, skip writing.
|
|
112
|
-
next if stat.size == entry_size && (stat.mode & 0777) == entry_mode
|
|
113
|
-
end
|
|
114
|
-
puts "Extracting #{entry.full_name} from #{tarball} #{entry_mode.to_s(8)}"
|
|
115
|
-
File.open(path, "w") do |fd|
|
|
116
|
-
# eof? check lets us skip empty files. Necessary because the API provided by
|
|
117
|
-
# Archive::Tar::Minitar::Reader::EntryStream only mostly acts like an
|
|
118
|
-
# IO object. Something about empty files in this EntryStream causes
|
|
119
|
-
# IO.copy_stream to throw "can't convert nil into String" on JRuby
|
|
120
|
-
# TODO(sissel): File a bug about this.
|
|
121
|
-
while !entry.eof?
|
|
122
|
-
chunk = entry.read(16384)
|
|
123
|
-
fd.write(chunk)
|
|
124
|
-
end
|
|
125
|
-
#IO.copy_stream(entry, fd)
|
|
126
|
-
end
|
|
127
|
-
File.chmod(entry_mode, path)
|
|
128
|
-
end
|
|
129
|
-
end
|
|
130
|
-
tar.close
|
|
131
|
-
File.unlink(tarball) if File.file?(tarball)
|
|
132
|
-
end # def untar
|
|
133
|
-
|
|
134
|
-
def ungz(file)
|
|
135
|
-
|
|
136
|
-
outpath = file.gsub('.gz', '')
|
|
137
|
-
tgz = Zlib::GzipReader.new(File.open(file))
|
|
138
|
-
begin
|
|
139
|
-
File.open(outpath, "w") do |out|
|
|
140
|
-
IO::copy_stream(tgz, out)
|
|
141
|
-
end
|
|
142
|
-
File.unlink(file)
|
|
143
|
-
rescue
|
|
144
|
-
File.unlink(outpath) if File.file?(outpath)
|
|
145
|
-
raise
|
|
146
|
-
end
|
|
147
|
-
tgz.close
|
|
148
|
-
end
|
|
149
|
-
|
|
150
|
-
desc "Process any vendor files required for this plugin"
|
|
151
|
-
task "vendor" do |task, args|
|
|
152
|
-
|
|
153
|
-
@files.each do |file|
|
|
154
|
-
download = file_fetch(file['url'], file['sha1'])
|
|
155
|
-
if download =~ /.tar.gz/
|
|
156
|
-
prefix = download.gsub('.tar.gz', '').gsub('vendor/', '')
|
|
157
|
-
untar(download) do |entry|
|
|
158
|
-
if !file['files'].nil?
|
|
159
|
-
next unless file['files'].include?(entry.full_name.gsub(prefix, ''))
|
|
160
|
-
out = entry.full_name.split("/").last
|
|
161
|
-
end
|
|
162
|
-
File.join('vendor', out)
|
|
163
|
-
end
|
|
164
|
-
elsif download =~ /.gz/
|
|
165
|
-
ungz(download)
|
|
166
|
-
end
|
|
167
|
-
end
|
|
168
|
-
|
|
169
|
-
end
|