kinesis-stream-reader 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 6bb89a21a392fcfa49caca6f223d2a039961f130
4
+ data.tar.gz: f0a08dcbecf7208002b7524652211dbdfba2ff10
5
+ SHA512:
6
+ metadata.gz: 9e679f5ec4da78c12a134fd6ca5eb4737df76e2a35c3e35277bfe8d27e3ab8fe022296873adea599e894af0098a6f7a2da4e2641f2b898f9c23be28550e68f66
7
+ data.tar.gz: 9e256e5f5f83308284fa4c4886d39d3fa62228052767c580c9bd6cf70ef5275ce044d7b19f8f0515f9a3380a3810d3610e53141506b03aed2fa6bc45a5c527b6
data/.gitignore ADDED
@@ -0,0 +1,5 @@
1
+ /.bundle
2
+ /Gemfile.lock
3
+ pkg
4
+ vendor
5
+ /projectFilesBackup
data/.travis.yml ADDED
@@ -0,0 +1,7 @@
1
+ language: ruby
2
+ rvm:
3
+ - 2.2.2
4
+ notifications:
5
+ email: false
6
+ slack:
7
+ secure: GZdf4YAEI9uEly5FBAeYGl6grQi9YgtXImTCWBsrtSyqcVu19paorOe0zVIaXuQttv+8wNHcRx67U9Af/Mu3xWhLcNII4ukE9mKIvJm2TvQBbGpfv1slQ8K9QTTDrQZ4iH8X2ixt3FRseRywb/R4ANsqLbJn4hp/W81i8RG92kTREmR0oTT5Uya5eD2sb0iPOs9qy7gIxAdxIffUTmFiTlEo0R/BAiQFfpjGefbzYaMgi0fpTKvda8PN09itFuV2qNcFHClQHnFpuk3vpKO0WqQz0mfk453xPDihQXS0gneVvtIoqUJYuFy7RGep2fqlIccQV8U61HsVKSuEC3HIRXCdwJDpypOuxNXFuTmT0H6mfL05akUPGseG3S3Q4uTYeqYMjLOR+cDbNFJzsILDmJ0xCDvMnicoghFkB/eBpE9T5+VWiukI2KYo7comf+NTBKLAijxI8jrgZH5PjBcaotD4WQCqBZyEUs2wqWr8Xbup3hRsRzD3pG5PIlhy6LK/l7iXcJ/A2U2yI2ciKnU6Xqb/LjSAxOHwUimloKxwCvluRzVBbLHC21rKOIGT0wokXszpmhlRw2MDx1+9zssKMSS+REct1Ow+pFqCpVvPhV5mLdOjILcA3qeucFqH484SH8/GdfYTGYqSKmgLbTZezmEsnkDe9PmIxh3O7DKDIUY=
data/Gemfile ADDED
@@ -0,0 +1,3 @@
1
+ source 'https://rubygems.org'
2
+
3
+ gemspec
data/LICENSE.txt ADDED
@@ -0,0 +1,21 @@
1
+ The MIT License (MIT)
2
+
3
+ Copyright (c) 2016 Ello PBC
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
data/README.md ADDED
@@ -0,0 +1 @@
1
+ Readme
data/Rakefile ADDED
@@ -0,0 +1,6 @@
1
+ require 'bundler/gem_tasks'
2
+ require 'rspec/core/rake_task'
3
+
4
+ RSpec::Core::RakeTask.new(:spec)
5
+
6
+ task :default => :spec
@@ -0,0 +1,6 @@
1
+ require 'logger'
2
+ require 'aws-sdk-core'
3
+ require 'active_support/notifications'
4
+ require './lib/stream_reader/sequence_number_tracker'
5
+ require './lib/stream_reader/avro_parser'
6
+ require './lib/stream_reader/version'
@@ -0,0 +1,76 @@
1
+ require 'stream_helper'
2
+
3
+ module StreamReader
4
+ class << self
5
+ def logger
6
+ @logger ||= Logger.new(STDOUT)
7
+ end
8
+ end
9
+
10
+ # Assume only one shard for now
11
+ BATCH_SIZE = 10
12
+
13
+ def initialize(stream_name:, prefix: '')
14
+ @stream_name = stream_name
15
+ @prefix = prefix
16
+ @tracker = SequenceNumberTracker.new(key_prefix: [ stream_name, prefix ].compact.join('-'))
17
+ @logger = StreamReader.logger
18
+ end
19
+
20
+ def run!(&block)
21
+ # Locate a shard id to iterate through - we only have one for now
22
+ loop do
23
+ begin
24
+ iterator_opts = { stream_name: @stream_name, shard_id: shard_id }
25
+ if seq = @tracker.last_sequence_number
26
+ iterator_opts[:shard_iterator_type] = 'AFTER_SEQUENCE_NUMBER'
27
+ iterator_opts[:starting_sequence_number] = seq
28
+ else
29
+ iterator_opts[:shard_iterator_type] = 'TRIM_HORIZON'
30
+ end
31
+ @logger.debug "Getting shard iterator for #{@stream_name} / #{seq}"
32
+ resp = client.get_shard_iterator(iterator_opts)
33
+ shard_iterator = resp.shard_iterator
34
+
35
+ # Iterate!
36
+ loop do
37
+ sleep 1
38
+ @logger.debug "Getting records for #{shard_iterator}"
39
+ resp = client.get_records({
40
+ shard_iterator: shard_iterator,
41
+ limit: BATCH_SIZE,
42
+ })
43
+
44
+ resp.records.each do |record|
45
+ ActiveSupport::Notifications.instrument('stream_reader.process_record',
46
+ stream_name: @stream_name,
47
+ prefix: @prefix,
48
+ shard_id: shard_id,
49
+ ms_behind: resp.millis_behind_latest) do
50
+ AvroParser.new(record.data).each_with_schema_name(&block)
51
+ @tracker.last_sequence_number = record.sequence_number
52
+ end
53
+ end
54
+
55
+ shard_iterator = resp.next_shard_iterator
56
+ end
57
+
58
+ rescue Aws::Kinesis::Errors::ExpiredIteratorException
59
+ @logger.debug "Iterator expired! Fetching a new one."
60
+ end
61
+ end
62
+ end
63
+
64
+ private
65
+
66
+ def client
67
+ @client ||= Aws::Kinesis::Client.new
68
+ end
69
+
70
+ def shard_id
71
+ @shard_id ||= begin
72
+ resp = client.describe_stream(stream_name: @stream_name, limit: 1)
73
+ resp.stream_description.shards[0].shard_id
74
+ end
75
+ end
76
+ end
@@ -0,0 +1,17 @@
1
+ require 'avro'
2
+
3
+ class AvroParser
4
+ def initialize(data)
5
+ @data = data
6
+ end
7
+
8
+ def each_with_schema_name
9
+ buffer = StringIO.new(@data)
10
+ reader = Avro::DataFile::Reader.new(buffer, Avro::IO::DatumReader.new)
11
+ reader.each do |record|
12
+ schema_name = reader.datum_reader.readers_schema.name
13
+ yield record, schema_name
14
+ end
15
+ end
16
+ end
17
+
@@ -0,0 +1,17 @@
1
+ require 'redis'
2
+
3
+ class SequenceNumberTracker
4
+ def initialize(key_prefix:, redis_url: ENV['REDIS_URL'], key: 'kinesis-last-seq')
5
+ uri = URI.parse(redis_url || 'redis://localhost:6379')
6
+ @redis = Redis.new(url: uri)
7
+ @key = "#{key_prefix}-#{key}"
8
+ end
9
+
10
+ def last_sequence_number
11
+ @redis.get(@key)
12
+ end
13
+
14
+ def last_sequence_number=(value)
15
+ @redis.set(@key, value)
16
+ end
17
+ end
@@ -0,0 +1,3 @@
1
+ module StreamReader
2
+ VERSION = '0.1.0'
3
+ end
@@ -0,0 +1,9 @@
1
+ ENV['RAILS_ENV'] ||= 'test'
2
+ $LOAD_PATH.unshift File.expand_path('../../lib', __FILE__)
3
+ require 'stream_reader'
4
+ require 'pry'
5
+ require 'fakeredis/rspec'
6
+
7
+ RSpec.configure do |config|
8
+ config.color = true
9
+ end
@@ -0,0 +1,19 @@
1
+ require 'spec_helper'
2
+
3
+ describe AvroParser do
4
+ let(:data) { File.read(File.join(File.dirname(__FILE__), '..', 'support', 'user_was_created.avro')) }
5
+ let(:parser) { described_class.new(data) }
6
+
7
+ it 'parses an Avro message' do
8
+ parser.each_with_schema_name do |record, schema_name|
9
+ expect(schema_name).to eq('UserWasCreated')
10
+ expect(record).to eq({
11
+ "id"=>"1",
12
+ "username"=>"hello",
13
+ "created_at"=>"2015-08-17T13:57:09-06:00",
14
+ "email"=>"hello@example.com",
15
+ "analytics_id"=>"123123"
16
+ })
17
+ end
18
+ end
19
+ end
@@ -0,0 +1,26 @@
1
+ require 'spec_helper'
2
+
3
+ describe SequenceNumberTracker do
4
+ let(:tracker) { described_class.new(key_prefix: 'test-key')}
5
+ let(:tracker2) { described_class.new(key_prefix: 'test-key')}
6
+ let(:other_tracker) { described_class.new(key_prefix: 'other-test-key')}
7
+
8
+ it 'initially has a nil sequence number' do
9
+ expect(tracker.last_sequence_number).to be_nil
10
+ end
11
+
12
+ it 'stores the last saved value for the sequence number' do
13
+ tracker.last_sequence_number = '1000'
14
+ expect(tracker.last_sequence_number).to eq('1000')
15
+ end
16
+
17
+ it 'tracks the same value across individual tracker instances with the same key/prefix' do
18
+ tracker.last_sequence_number = '1000'
19
+ expect(tracker2.last_sequence_number).to eq('1000')
20
+ end
21
+
22
+ it 'does not track the same value across individual tracker instances with different keys/prefixes' do
23
+ tracker.last_sequence_number = '1000'
24
+ expect(other_tracker.last_sequence_number).to be_nil
25
+ end
26
+ end
@@ -0,0 +1,7 @@
1
+ require 'spec_helper'
2
+
3
+ describe StreamReader do
4
+ it 'has a logger' do
5
+ expect(described_class.logger).to be_a(Logger)
6
+ end
7
+ end
Binary file
@@ -0,0 +1,32 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require './lib/stream_reader/version'
5
+
6
+ Gem::Specification.new do |spec|
7
+ spec.name = 'kinesis-stream-reader'
8
+ spec.version = StreamReader::VERSION
9
+ spec.authors = ['Justin-Holmes']
10
+ spec.email = ['justin.ryan.holmes@icloud.com']
11
+
12
+ spec.summary = %q{Ruby interface for reading AWS Kinesis streams}
13
+ spec.homepage = 'https://github.com/ello/kinesis-stream-reader'
14
+ spec.license = 'MIT'
15
+
16
+ spec.files = `git ls-files`.split($/)
17
+ spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
18
+ spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
19
+ spec.require_paths = ['lib']
20
+
21
+ spec.add_dependency 'avro'
22
+ spec.add_dependency 'aws-sdk-core'
23
+ spec.add_dependency 'redis'
24
+ spec.add_dependency 'activesupport'
25
+
26
+ spec.add_development_dependency 'bundler', '~> 1.10'
27
+ spec.add_development_dependency 'rake', '~> 10.0'
28
+ spec.add_development_dependency 'rspec'
29
+ spec.add_development_dependency 'fakeredis'
30
+ spec.add_development_dependency 'pry'
31
+ end
32
+
metadata ADDED
@@ -0,0 +1,192 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: kinesis-stream-reader
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - Justin-Holmes
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2016-03-09 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: avro
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ">="
18
+ - !ruby/object:Gem::Version
19
+ version: '0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ">="
25
+ - !ruby/object:Gem::Version
26
+ version: '0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: aws-sdk-core
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ">="
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :runtime
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - ">="
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: redis
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - ">="
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :runtime
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - ">="
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: activesupport
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :runtime
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - ">="
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: bundler
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - "~>"
74
+ - !ruby/object:Gem::Version
75
+ version: '1.10'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - "~>"
81
+ - !ruby/object:Gem::Version
82
+ version: '1.10'
83
+ - !ruby/object:Gem::Dependency
84
+ name: rake
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - "~>"
88
+ - !ruby/object:Gem::Version
89
+ version: '10.0'
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - "~>"
95
+ - !ruby/object:Gem::Version
96
+ version: '10.0'
97
+ - !ruby/object:Gem::Dependency
98
+ name: rspec
99
+ requirement: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - ">="
102
+ - !ruby/object:Gem::Version
103
+ version: '0'
104
+ type: :development
105
+ prerelease: false
106
+ version_requirements: !ruby/object:Gem::Requirement
107
+ requirements:
108
+ - - ">="
109
+ - !ruby/object:Gem::Version
110
+ version: '0'
111
+ - !ruby/object:Gem::Dependency
112
+ name: fakeredis
113
+ requirement: !ruby/object:Gem::Requirement
114
+ requirements:
115
+ - - ">="
116
+ - !ruby/object:Gem::Version
117
+ version: '0'
118
+ type: :development
119
+ prerelease: false
120
+ version_requirements: !ruby/object:Gem::Requirement
121
+ requirements:
122
+ - - ">="
123
+ - !ruby/object:Gem::Version
124
+ version: '0'
125
+ - !ruby/object:Gem::Dependency
126
+ name: pry
127
+ requirement: !ruby/object:Gem::Requirement
128
+ requirements:
129
+ - - ">="
130
+ - !ruby/object:Gem::Version
131
+ version: '0'
132
+ type: :development
133
+ prerelease: false
134
+ version_requirements: !ruby/object:Gem::Requirement
135
+ requirements:
136
+ - - ">="
137
+ - !ruby/object:Gem::Version
138
+ version: '0'
139
+ description:
140
+ email:
141
+ - justin.ryan.holmes@icloud.com
142
+ executables: []
143
+ extensions: []
144
+ extra_rdoc_files: []
145
+ files:
146
+ - ".gitignore"
147
+ - ".travis.yml"
148
+ - Gemfile
149
+ - LICENSE.txt
150
+ - README.md
151
+ - Rakefile
152
+ - lib/stream_helper.rb
153
+ - lib/stream_reader.rb
154
+ - lib/stream_reader/avro_parser.rb
155
+ - lib/stream_reader/sequence_number_tracker.rb
156
+ - lib/stream_reader/version.rb
157
+ - spec/spec_helper.rb
158
+ - spec/stream_reader/avro_parser_spec.rb
159
+ - spec/stream_reader/sequence_number_track_spec.rb
160
+ - spec/stream_reader_spec.rb
161
+ - spec/support/user_was_created.avro
162
+ - stream_reader.gemspec
163
+ homepage: https://github.com/ello/kinesis-stream-reader
164
+ licenses:
165
+ - MIT
166
+ metadata: {}
167
+ post_install_message:
168
+ rdoc_options: []
169
+ require_paths:
170
+ - lib
171
+ required_ruby_version: !ruby/object:Gem::Requirement
172
+ requirements:
173
+ - - ">="
174
+ - !ruby/object:Gem::Version
175
+ version: '0'
176
+ required_rubygems_version: !ruby/object:Gem::Requirement
177
+ requirements:
178
+ - - ">="
179
+ - !ruby/object:Gem::Version
180
+ version: '0'
181
+ requirements: []
182
+ rubyforge_project:
183
+ rubygems_version: 2.4.5.1
184
+ signing_key:
185
+ specification_version: 4
186
+ summary: Ruby interface for reading AWS Kinesis streams
187
+ test_files:
188
+ - spec/spec_helper.rb
189
+ - spec/stream_reader/avro_parser_spec.rb
190
+ - spec/stream_reader/sequence_number_track_spec.rb
191
+ - spec/stream_reader_spec.rb
192
+ - spec/support/user_was_created.avro