karafka 1.4.10 → 2.0.0.alpha2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- checksums.yaml.gz.sig +0 -0
- data/.github/FUNDING.yml +3 -0
- data/.github/workflows/ci.yml +79 -26
- data/.ruby-version +1 -1
- data/CHANGELOG.md +46 -0
- data/CONTRIBUTING.md +6 -6
- data/Gemfile +6 -0
- data/Gemfile.lock +45 -53
- data/LICENSE +17 -0
- data/LICENSE-COMM +89 -0
- data/LICENSE-LGPL +165 -0
- data/README.md +16 -48
- data/bin/benchmarks +85 -0
- data/bin/create_token +28 -0
- data/bin/integrations +160 -0
- data/bin/karafka +4 -0
- data/bin/stress +13 -0
- data/certs/karafka-pro.pem +11 -0
- data/config/errors.yml +5 -38
- data/docker-compose.yml +12 -3
- data/karafka.gemspec +14 -14
- data/lib/active_job/karafka.rb +20 -0
- data/lib/active_job/queue_adapters/karafka_adapter.rb +26 -0
- data/lib/karafka/active_job/consumer.rb +24 -0
- data/lib/karafka/active_job/dispatcher.rb +38 -0
- data/lib/karafka/active_job/job_extensions.rb +34 -0
- data/lib/karafka/active_job/job_options_contract.rb +15 -0
- data/lib/karafka/active_job/routing_extensions.rb +18 -0
- data/lib/karafka/app.rb +14 -20
- data/lib/karafka/base_consumer.rb +103 -34
- data/lib/karafka/cli/base.rb +4 -4
- data/lib/karafka/cli/info.rb +44 -9
- data/lib/karafka/cli/install.rb +3 -8
- data/lib/karafka/cli/server.rb +16 -43
- data/lib/karafka/cli.rb +4 -11
- data/lib/karafka/connection/client.rb +279 -93
- data/lib/karafka/connection/listener.rb +137 -38
- data/lib/karafka/connection/messages_buffer.rb +57 -0
- data/lib/karafka/connection/pauses_manager.rb +46 -0
- data/lib/karafka/connection/rebalance_manager.rb +62 -0
- data/lib/karafka/contracts/base.rb +23 -0
- data/lib/karafka/contracts/config.rb +44 -8
- data/lib/karafka/contracts/consumer_group.rb +1 -176
- data/lib/karafka/contracts/consumer_group_topic.rb +16 -8
- data/lib/karafka/contracts/server_cli_options.rb +2 -12
- data/lib/karafka/contracts.rb +1 -1
- data/lib/karafka/env.rb +46 -0
- data/lib/karafka/errors.rb +18 -18
- data/lib/karafka/helpers/multi_delegator.rb +2 -2
- data/lib/karafka/instrumentation/callbacks/error.rb +40 -0
- data/lib/karafka/instrumentation/callbacks/statistics.rb +42 -0
- data/lib/karafka/instrumentation/monitor.rb +14 -21
- data/lib/karafka/instrumentation/stdout_listener.rb +67 -91
- data/lib/karafka/instrumentation.rb +21 -0
- data/lib/karafka/licenser.rb +76 -0
- data/lib/karafka/{params → messages}/batch_metadata.rb +9 -13
- data/lib/karafka/messages/builders/batch_metadata.rb +52 -0
- data/lib/karafka/messages/builders/message.rb +38 -0
- data/lib/karafka/messages/builders/messages.rb +40 -0
- data/lib/karafka/{params/params.rb → messages/message.rb} +7 -12
- data/lib/karafka/messages/messages.rb +64 -0
- data/lib/karafka/{params → messages}/metadata.rb +4 -6
- data/lib/karafka/messages/seek.rb +9 -0
- data/lib/karafka/patches/rdkafka/consumer.rb +22 -0
- data/lib/karafka/pro/active_job/dispatcher.rb +58 -0
- data/lib/karafka/pro/active_job/job_options_contract.rb +27 -0
- data/lib/karafka/pro/loader.rb +29 -0
- data/lib/karafka/pro.rb +13 -0
- data/lib/karafka/processing/executor.rb +96 -0
- data/lib/karafka/processing/executors_buffer.rb +49 -0
- data/lib/karafka/processing/jobs/base.rb +18 -0
- data/lib/karafka/processing/jobs/consume.rb +28 -0
- data/lib/karafka/processing/jobs/revoked.rb +22 -0
- data/lib/karafka/processing/jobs/shutdown.rb +23 -0
- data/lib/karafka/processing/jobs_queue.rb +121 -0
- data/lib/karafka/processing/worker.rb +57 -0
- data/lib/karafka/processing/workers_batch.rb +22 -0
- data/lib/karafka/railtie.rb +75 -0
- data/lib/karafka/routing/builder.rb +15 -24
- data/lib/karafka/routing/consumer_group.rb +10 -18
- data/lib/karafka/routing/consumer_mapper.rb +1 -2
- data/lib/karafka/routing/router.rb +1 -1
- data/lib/karafka/routing/subscription_group.rb +53 -0
- data/lib/karafka/routing/subscription_groups_builder.rb +51 -0
- data/lib/karafka/routing/topic.rb +47 -25
- data/lib/karafka/runner.rb +59 -0
- data/lib/karafka/serialization/json/deserializer.rb +6 -15
- data/lib/karafka/server.rb +62 -25
- data/lib/karafka/setup/config.rb +98 -171
- data/lib/karafka/status.rb +13 -3
- data/lib/karafka/templates/example_consumer.rb.erb +16 -0
- data/lib/karafka/templates/karafka.rb.erb +14 -50
- data/lib/karafka/time_trackers/base.rb +19 -0
- data/lib/karafka/time_trackers/pause.rb +84 -0
- data/lib/karafka/time_trackers/poll.rb +65 -0
- data/lib/karafka/version.rb +1 -1
- data/lib/karafka.rb +35 -13
- data.tar.gz.sig +0 -0
- metadata +82 -104
- metadata.gz.sig +0 -0
- data/MIT-LICENCE +0 -18
- data/lib/karafka/assignment_strategies/round_robin.rb +0 -13
- data/lib/karafka/attributes_map.rb +0 -63
- data/lib/karafka/backends/inline.rb +0 -16
- data/lib/karafka/base_responder.rb +0 -226
- data/lib/karafka/cli/flow.rb +0 -48
- data/lib/karafka/cli/missingno.rb +0 -19
- data/lib/karafka/code_reloader.rb +0 -67
- data/lib/karafka/connection/api_adapter.rb +0 -158
- data/lib/karafka/connection/batch_delegator.rb +0 -55
- data/lib/karafka/connection/builder.rb +0 -23
- data/lib/karafka/connection/message_delegator.rb +0 -36
- data/lib/karafka/consumers/batch_metadata.rb +0 -10
- data/lib/karafka/consumers/callbacks.rb +0 -71
- data/lib/karafka/consumers/includer.rb +0 -64
- data/lib/karafka/consumers/responders.rb +0 -24
- data/lib/karafka/consumers/single_params.rb +0 -15
- data/lib/karafka/contracts/responder_usage.rb +0 -54
- data/lib/karafka/fetcher.rb +0 -42
- data/lib/karafka/helpers/class_matcher.rb +0 -88
- data/lib/karafka/helpers/config_retriever.rb +0 -46
- data/lib/karafka/helpers/inflector.rb +0 -26
- data/lib/karafka/params/builders/batch_metadata.rb +0 -30
- data/lib/karafka/params/builders/params.rb +0 -38
- data/lib/karafka/params/builders/params_batch.rb +0 -25
- data/lib/karafka/params/params_batch.rb +0 -60
- data/lib/karafka/patches/ruby_kafka.rb +0 -47
- data/lib/karafka/persistence/client.rb +0 -29
- data/lib/karafka/persistence/consumers.rb +0 -45
- data/lib/karafka/persistence/topics.rb +0 -48
- data/lib/karafka/responders/builder.rb +0 -36
- data/lib/karafka/responders/topic.rb +0 -55
- data/lib/karafka/routing/topic_mapper.rb +0 -53
- data/lib/karafka/serialization/json/serializer.rb +0 -31
- data/lib/karafka/setup/configurators/water_drop.rb +0 -36
- data/lib/karafka/templates/application_responder.rb.erb +0 -11
@@ -0,0 +1,75 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
# This file contains Railtie for auto-configuration
|
4
|
+
|
5
|
+
rails = false
|
6
|
+
|
7
|
+
begin
|
8
|
+
require 'rails'
|
9
|
+
|
10
|
+
rails = true
|
11
|
+
rescue LoadError
|
12
|
+
# Without defining this in any way, Zeitwerk ain't happy so we do it that way
|
13
|
+
module Karafka
|
14
|
+
class Railtie
|
15
|
+
end
|
16
|
+
end
|
17
|
+
end
|
18
|
+
|
19
|
+
if rails
|
20
|
+
# Load Karafka
|
21
|
+
require 'karafka'
|
22
|
+
|
23
|
+
# Load ActiveJob adapter
|
24
|
+
require 'active_job/karafka'
|
25
|
+
|
26
|
+
# Setup env if configured (may be configured later by .net, etc)
|
27
|
+
ENV['KARAFKA_ENV'] ||= ENV['RAILS_ENV'] if ENV.key?('RAILS_ENV')
|
28
|
+
|
29
|
+
module Karafka
|
30
|
+
# Railtie for setting up Rails integration
|
31
|
+
class Railtie < Rails::Railtie
|
32
|
+
railtie_name :karafka
|
33
|
+
|
34
|
+
initializer 'karafka.active_job_integration' do
|
35
|
+
ActiveSupport.on_load(:active_job) do
|
36
|
+
# Extend ActiveJob with some Karafka specific ActiveJob magic
|
37
|
+
extend ::Karafka::ActiveJob::JobExtensions
|
38
|
+
end
|
39
|
+
end
|
40
|
+
|
41
|
+
initializer 'karafka.configure_rails_initialization' do |app|
|
42
|
+
# Consumers should autoload by default in the Rails app so they are visible
|
43
|
+
app.config.autoload_paths += %w[app/consumers]
|
44
|
+
|
45
|
+
# Make Karafka use Rails logger
|
46
|
+
::Karafka::App.config.logger = Rails.logger
|
47
|
+
|
48
|
+
# This lines will make Karafka print to stdout like puma or unicorn when we run karafka
|
49
|
+
# server + will support code reloading with each fetched loop. We do it only for karafka
|
50
|
+
# based commands as Rails processes and console will have it enabled already
|
51
|
+
if Rails.env.development? && ENV.key?('KARAFKA_CLI')
|
52
|
+
Rails.logger.extend(
|
53
|
+
ActiveSupport::Logger.broadcast(
|
54
|
+
ActiveSupport::Logger.new($stdout)
|
55
|
+
)
|
56
|
+
)
|
57
|
+
|
58
|
+
# We can have many listeners, but it does not matter in which we will reload the code as
|
59
|
+
# long as all the consumers will be re-created as Rails reload is thread-safe
|
60
|
+
::Karafka::App.monitor.subscribe('connection.listener.fetch_loop') do
|
61
|
+
# Reload code each time there is a change in the code
|
62
|
+
next unless Rails.application.reloaders.any?(&:updated?)
|
63
|
+
|
64
|
+
Rails.application.reloader.reload!
|
65
|
+
end
|
66
|
+
end
|
67
|
+
|
68
|
+
app.reloader.to_prepare do
|
69
|
+
# Load Karafka bot file, so it can be used in Rails server context
|
70
|
+
require Rails.root.join(Karafka.boot_file.to_s).to_s
|
71
|
+
end
|
72
|
+
end
|
73
|
+
end
|
74
|
+
end
|
75
|
+
end
|
@@ -10,14 +10,9 @@ module Karafka
|
|
10
10
|
# end
|
11
11
|
# end
|
12
12
|
class Builder < Concurrent::Array
|
13
|
-
# Consumer group consistency checking contract
|
14
|
-
CONTRACT = Karafka::Contracts::ConsumerGroup.new.freeze
|
15
|
-
|
16
|
-
private_constant :CONTRACT
|
17
|
-
|
18
13
|
def initialize
|
19
|
-
super
|
20
14
|
@draws = Concurrent::Array.new
|
15
|
+
super
|
21
16
|
end
|
22
17
|
|
23
18
|
# Used to draw routes for Karafka
|
@@ -38,11 +33,7 @@ module Karafka
|
|
38
33
|
instance_eval(&block)
|
39
34
|
|
40
35
|
each do |consumer_group|
|
41
|
-
|
42
|
-
validation_result = CONTRACT.call(hashed_group)
|
43
|
-
next if validation_result.success?
|
44
|
-
|
45
|
-
raise Errors::InvalidConfigurationError, validation_result.errors.to_h
|
36
|
+
Contracts::ConsumerGroup.new.validate!(consumer_group.to_h)
|
46
37
|
end
|
47
38
|
end
|
48
39
|
|
@@ -59,30 +50,30 @@ module Karafka
|
|
59
50
|
super
|
60
51
|
end
|
61
52
|
|
62
|
-
# Redraws all the routes for the in-process code reloading.
|
63
|
-
# @note This won't allow registration of new topics without process restart but will trigger
|
64
|
-
# cache invalidation so all the classes, etc are re-fetched after code reload
|
65
|
-
def reload
|
66
|
-
draws = @draws.dup
|
67
|
-
clear
|
68
|
-
draws.each { |block| draw(&block) }
|
69
|
-
end
|
70
|
-
|
71
53
|
private
|
72
54
|
|
73
55
|
# Builds and saves given consumer group
|
74
56
|
# @param group_id [String, Symbol] name for consumer group
|
75
57
|
# @param block [Proc] proc that should be executed in the proxy context
|
76
58
|
def consumer_group(group_id, &block)
|
77
|
-
consumer_group =
|
78
|
-
|
59
|
+
consumer_group = find { |cg| cg.name == group_id.to_s }
|
60
|
+
|
61
|
+
if consumer_group
|
62
|
+
Proxy.new(consumer_group, &block).target
|
63
|
+
else
|
64
|
+
consumer_group = ConsumerGroup.new(group_id.to_s)
|
65
|
+
self << Proxy.new(consumer_group, &block).target
|
66
|
+
end
|
79
67
|
end
|
80
68
|
|
69
|
+
# In case we use simple style of routing, all topics will be assigned to the same consumer
|
70
|
+
# group that will be based on the client_id
|
71
|
+
#
|
81
72
|
# @param topic_name [String, Symbol] name of a topic from which we want to consumer
|
82
73
|
# @param block [Proc] proc we want to evaluate in the topic context
|
83
74
|
def topic(topic_name, &block)
|
84
|
-
consumer_group(
|
85
|
-
topic(topic_name, &block)
|
75
|
+
consumer_group('app') do
|
76
|
+
topic(topic_name, &block)
|
86
77
|
end
|
87
78
|
end
|
88
79
|
end
|
@@ -5,14 +5,10 @@ module Karafka
|
|
5
5
|
# Object used to describe a single consumer group that is going to subscribe to
|
6
6
|
# given topics
|
7
7
|
# It is a part of Karafka's DSL
|
8
|
+
# @note A single consumer group represents Kafka consumer group, but it may not match 1:1 with
|
9
|
+
# subscription groups. There can be more subscription groups than consumer groups
|
8
10
|
class ConsumerGroup
|
9
|
-
|
10
|
-
|
11
|
-
attr_reader(
|
12
|
-
:topics,
|
13
|
-
:id,
|
14
|
-
:name
|
15
|
-
)
|
11
|
+
attr_reader :id, :topics, :name
|
16
12
|
|
17
13
|
# @param name [String, Symbol] raw name of this consumer group. Raw means, that it does not
|
18
14
|
# yet have an application client_id namespace, this will be added here by default.
|
@@ -35,28 +31,24 @@ module Karafka
|
|
35
31
|
# @return [Karafka::Routing::Topic] newly built topic instance
|
36
32
|
def topic=(name, &block)
|
37
33
|
topic = Topic.new(name, self)
|
38
|
-
@topics << Proxy.new(topic, &block).target
|
34
|
+
@topics << Proxy.new(topic, &block).target
|
39
35
|
@topics.last
|
40
36
|
end
|
41
37
|
|
42
|
-
|
43
|
-
|
38
|
+
# @return [Array<Routing::SubscriptionGroup>] all the subscription groups build based on
|
39
|
+
# the consumer group topics
|
40
|
+
def subscription_groups
|
41
|
+
App.config.internal.subscription_groups_builder.call(topics)
|
44
42
|
end
|
45
43
|
|
46
44
|
# Hashed version of consumer group that can be used for validation purposes
|
47
45
|
# @return [Hash] hash with consumer group attributes including serialized to hash
|
48
46
|
# topics inside of it.
|
49
47
|
def to_h
|
50
|
-
|
48
|
+
{
|
51
49
|
topics: topics.map(&:to_h),
|
52
50
|
id: id
|
53
|
-
}
|
54
|
-
|
55
|
-
Karafka::AttributesMap.consumer_group.each do |attribute|
|
56
|
-
result[attribute] = public_send(attribute)
|
57
|
-
end
|
58
|
-
|
59
|
-
result
|
51
|
+
}.freeze
|
60
52
|
end
|
61
53
|
end
|
62
54
|
end
|
@@ -26,8 +26,7 @@ module Karafka
|
|
26
26
|
# @param raw_consumer_group_name [String, Symbol] string or symbolized consumer group name
|
27
27
|
# @return [String] remapped final consumer group name
|
28
28
|
def call(raw_consumer_group_name)
|
29
|
-
|
30
|
-
"#{client_name}_#{raw_consumer_group_name}"
|
29
|
+
"#{Karafka::App.config.client_id}_#{raw_consumer_group_name}"
|
31
30
|
end
|
32
31
|
end
|
33
32
|
end
|
@@ -10,7 +10,7 @@ module Karafka
|
|
10
10
|
# Find a proper topic based on full topic id
|
11
11
|
# @param topic_id [String] proper topic id (already mapped, etc) for which we want to find
|
12
12
|
# routing topic
|
13
|
-
# @return [Karafka::Routing::
|
13
|
+
# @return [Karafka::Routing::Topic] proper route details
|
14
14
|
# @raise [Karafka::Topic::NonMatchingTopicError] raised if topic name does not match
|
15
15
|
# any route defined by user using routes.draw
|
16
16
|
def find(topic_id)
|
@@ -0,0 +1,53 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Karafka
|
4
|
+
module Routing
|
5
|
+
# Object representing a set of single consumer group topics that can be subscribed together
|
6
|
+
# with one connection.
|
7
|
+
#
|
8
|
+
# @note One subscription group will always belong to one consumer group, but one consumer
|
9
|
+
# group can have multiple subscription groups.
|
10
|
+
class SubscriptionGroup
|
11
|
+
attr_reader :id, :topics
|
12
|
+
|
13
|
+
# @param topics [Array<Topic>] all the topics that share the same key settings
|
14
|
+
# @return [SubscriptionGroup] built subscription group
|
15
|
+
def initialize(topics)
|
16
|
+
@id = SecureRandom.uuid
|
17
|
+
@topics = topics
|
18
|
+
freeze
|
19
|
+
end
|
20
|
+
|
21
|
+
# @return [String] consumer group id
|
22
|
+
def consumer_group_id
|
23
|
+
kafka[:'group.id']
|
24
|
+
end
|
25
|
+
|
26
|
+
# @return [Integer] max messages fetched in a single go
|
27
|
+
def max_messages
|
28
|
+
@topics.first.max_messages
|
29
|
+
end
|
30
|
+
|
31
|
+
# @return [Integer] max milliseconds we can wait for incoming messages
|
32
|
+
def max_wait_time
|
33
|
+
@topics.first.max_wait_time
|
34
|
+
end
|
35
|
+
|
36
|
+
# @return [Hash] kafka settings are a bit special. They are exactly the same for all of the
|
37
|
+
# topics but they lack the group.id (unless explicitly) provided. To make it compatible
|
38
|
+
# with our routing engine, we inject it before it will go to the consumer
|
39
|
+
def kafka
|
40
|
+
kafka = @topics.first.kafka.dup
|
41
|
+
|
42
|
+
kafka[:'client.id'] ||= Karafka::App.config.client_id
|
43
|
+
kafka[:'group.id'] ||= @topics.first.consumer_group.id
|
44
|
+
kafka[:'auto.offset.reset'] ||= 'earliest'
|
45
|
+
# Karafka manages the offsets based on the processing state, thus we do not rely on the
|
46
|
+
# rdkafka offset auto-storing
|
47
|
+
kafka[:'enable.auto.offset.store'] = 'false'
|
48
|
+
kafka.freeze
|
49
|
+
kafka
|
50
|
+
end
|
51
|
+
end
|
52
|
+
end
|
53
|
+
end
|
@@ -0,0 +1,51 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Karafka
|
4
|
+
module Routing
|
5
|
+
# rdkafka allows us to group topics subscriptions when they have same settings.
|
6
|
+
# This builder groups topics from a single consumer group into subscription groups that can be
|
7
|
+
# subscribed with one rdkafka connection.
|
8
|
+
# This way we save resources as having several rdkafka consumers under the hood is not the
|
9
|
+
# cheapest thing in a bigger system.
|
10
|
+
#
|
11
|
+
# In general, if we can, we try to subscribe to as many topics with one rdkafka connection as
|
12
|
+
# possible, but if not possible, we divide.
|
13
|
+
class SubscriptionGroupsBuilder
|
14
|
+
# Keys used to build up a hash for subscription groups distribution.
|
15
|
+
# In order to be able to use the same rdkafka connection for several topics, those keys need
|
16
|
+
# to have same values.
|
17
|
+
DISTRIBUTION_KEYS = %i[
|
18
|
+
kafka
|
19
|
+
max_messages
|
20
|
+
max_wait_time
|
21
|
+
].freeze
|
22
|
+
|
23
|
+
private_constant :DISTRIBUTION_KEYS
|
24
|
+
|
25
|
+
# @param topics [Array<Topic>] array with topics based on which we want to build subscription
|
26
|
+
# groups
|
27
|
+
# @return [Array<SubscriptionGroup>] all subscription groups we need in separate threads
|
28
|
+
def call(topics)
|
29
|
+
topics
|
30
|
+
.map { |topic| [checksum(topic), topic] }
|
31
|
+
.group_by(&:first)
|
32
|
+
.values
|
33
|
+
.map { |value| value.map(&:last) }
|
34
|
+
.map { |grouped_topics| SubscriptionGroup.new(grouped_topics) }
|
35
|
+
end
|
36
|
+
|
37
|
+
private
|
38
|
+
|
39
|
+
# @param topic [Karafka::Routing::Topic] topic for which we compute the grouping checksum
|
40
|
+
# @return [Integer] checksum that we can use to check if topics have the same set of
|
41
|
+
# settings based on which we group
|
42
|
+
def checksum(topic)
|
43
|
+
accu = {}
|
44
|
+
|
45
|
+
DISTRIBUTION_KEYS.each { |key| accu[key] = topic.public_send(key) }
|
46
|
+
|
47
|
+
accu.hash
|
48
|
+
end
|
49
|
+
end
|
50
|
+
end
|
51
|
+
end
|
@@ -2,17 +2,23 @@
|
|
2
2
|
|
3
3
|
module Karafka
|
4
4
|
module Routing
|
5
|
-
# Topic stores all the details on how we should interact with Kafka given topic
|
5
|
+
# Topic stores all the details on how we should interact with Kafka given topic.
|
6
6
|
# It belongs to a consumer group as from 0.6 all the topics can work in the same consumer group
|
7
|
-
# It is a part of Karafka's DSL
|
7
|
+
# It is a part of Karafka's DSL.
|
8
8
|
class Topic
|
9
|
-
|
10
|
-
|
9
|
+
attr_reader :id, :name, :consumer_group
|
10
|
+
attr_writer :consumer
|
11
11
|
|
12
|
-
|
13
|
-
|
12
|
+
# Attributes we can inherit from the root unless they were defined on this level
|
13
|
+
INHERITABLE_ATTRIBUTES = %i[
|
14
|
+
kafka
|
15
|
+
deserializer
|
16
|
+
manual_offset_management
|
17
|
+
max_messages
|
18
|
+
max_wait_time
|
19
|
+
].freeze
|
14
20
|
|
15
|
-
|
21
|
+
private_constant :INHERITABLE_ATTRIBUTES
|
16
22
|
|
17
23
|
# @param [String, Symbol] name of a topic on which we want to listen
|
18
24
|
# @param consumer_group [Karafka::Routing::ConsumerGroup] owning consumer group of this topic
|
@@ -22,40 +28,56 @@ module Karafka
|
|
22
28
|
@attributes = {}
|
23
29
|
# @note We use identifier related to the consumer group that owns a topic, because from
|
24
30
|
# Karafka 0.6 we can handle multiple Kafka instances with the same process and we can
|
25
|
-
# have same topic name across multiple
|
31
|
+
# have same topic name across multiple consumer groups
|
26
32
|
@id = "#{consumer_group.id}_#{@name}"
|
27
33
|
end
|
28
34
|
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
end
|
35
|
+
INHERITABLE_ATTRIBUTES.each do |attribute|
|
36
|
+
attr_writer attribute
|
37
|
+
|
38
|
+
define_method attribute do
|
39
|
+
current_value = instance_variable_get(:"@#{attribute}")
|
40
|
+
|
41
|
+
return current_value unless current_value.nil?
|
37
42
|
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
43
|
+
value = Karafka::App.config.send(attribute)
|
44
|
+
|
45
|
+
instance_variable_set(:"@#{attribute}", value)
|
46
|
+
end
|
42
47
|
end
|
43
48
|
|
44
|
-
|
45
|
-
|
49
|
+
# @return [Class] consumer class that we should use
|
50
|
+
def consumer
|
51
|
+
if Karafka::App.config.consumer_persistence
|
52
|
+
# When persistence of consumers is on, no need to reload them
|
53
|
+
@consumer
|
54
|
+
else
|
55
|
+
# In order to support code reload without having to change the topic api, we re-fetch the
|
56
|
+
# class of a consumer based on its class name. This will support all the cases where the
|
57
|
+
# consumer class is defined with a name. It won't support code reload for anonymous
|
58
|
+
# consumer classes, but this is an edge case
|
59
|
+
begin
|
60
|
+
::Object.const_get(@consumer.to_s)
|
61
|
+
rescue NameError
|
62
|
+
# It will only fail if the in case of anonymous classes
|
63
|
+
@consumer
|
64
|
+
end
|
65
|
+
end
|
46
66
|
end
|
47
67
|
|
48
68
|
# @return [Hash] hash with all the topic attributes
|
49
69
|
# @note This is being used when we validate the consumer_group and its topics
|
50
70
|
def to_h
|
51
|
-
map =
|
71
|
+
map = INHERITABLE_ATTRIBUTES.map do |attribute|
|
52
72
|
[attribute, public_send(attribute)]
|
53
73
|
end
|
54
74
|
|
55
75
|
Hash[map].merge!(
|
56
76
|
id: id,
|
57
|
-
|
58
|
-
|
77
|
+
name: name,
|
78
|
+
consumer: consumer,
|
79
|
+
consumer_group_id: consumer_group.id
|
80
|
+
).freeze
|
59
81
|
end
|
60
82
|
end
|
61
83
|
end
|
@@ -0,0 +1,59 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Karafka
|
4
|
+
# Class used to run the Karafka listeners in separate threads
|
5
|
+
class Runner
|
6
|
+
# Starts listening on all the listeners asynchronously
|
7
|
+
# Fetch loop should never end. If they do, it is a critical error
|
8
|
+
def call
|
9
|
+
# Despite possibility of having several independent listeners, we aim to have one queue for
|
10
|
+
# jobs across and one workers poll for that
|
11
|
+
jobs_queue = Processing::JobsQueue.new
|
12
|
+
|
13
|
+
workers = Processing::WorkersBatch.new(jobs_queue)
|
14
|
+
Karafka::Server.workers = workers
|
15
|
+
|
16
|
+
threads = listeners(jobs_queue).map do |listener|
|
17
|
+
# We abort on exception because there should be an exception handling developed for
|
18
|
+
# each listener running in separate threads, so the exceptions should never leak
|
19
|
+
# and if that happens, it means that something really bad happened and we should stop
|
20
|
+
# the whole process
|
21
|
+
Thread
|
22
|
+
.new { listener.call }
|
23
|
+
.tap { |thread| thread.abort_on_exception = true }
|
24
|
+
end
|
25
|
+
|
26
|
+
# We aggregate threads here for a supervised shutdown process
|
27
|
+
Karafka::Server.consumer_threads = threads
|
28
|
+
|
29
|
+
# All the listener threads need to finish
|
30
|
+
threads.each(&:join)
|
31
|
+
# All the workers need to stop processing anything before we can stop the runner completely
|
32
|
+
workers.each(&:join)
|
33
|
+
# If anything crashes here, we need to raise the error and crush the runner because it means
|
34
|
+
# that something terrible happened
|
35
|
+
rescue StandardError => e
|
36
|
+
Karafka.monitor.instrument(
|
37
|
+
'error.occurred',
|
38
|
+
caller: self,
|
39
|
+
error: e,
|
40
|
+
type: 'runner.call.error'
|
41
|
+
)
|
42
|
+
Karafka::App.stop!
|
43
|
+
raise e
|
44
|
+
end
|
45
|
+
|
46
|
+
private
|
47
|
+
|
48
|
+
# @param jobs_queue [Processing::JobsQueue] the main processing queue
|
49
|
+
# @return [Array<Karafka::Connection::Listener>] listeners that will consume messages for each
|
50
|
+
# of the subscription groups
|
51
|
+
def listeners(jobs_queue)
|
52
|
+
App
|
53
|
+
.subscription_groups
|
54
|
+
.map do |subscription_group|
|
55
|
+
Karafka::Connection::Listener.new(subscription_group, jobs_queue)
|
56
|
+
end
|
57
|
+
end
|
58
|
+
end
|
59
|
+
end
|
@@ -1,25 +1,16 @@
|
|
1
1
|
# frozen_string_literal: true
|
2
2
|
|
3
3
|
module Karafka
|
4
|
-
# Module for all supported by default serialization and deserialization ways
|
4
|
+
# Module for all supported by default serialization and deserialization ways.
|
5
5
|
module Serialization
|
6
|
-
# Namespace for json
|
6
|
+
# Namespace for json serializers and deserializers.
|
7
7
|
module Json
|
8
|
-
# Default Karafka Json deserializer for loading JSON data
|
8
|
+
# Default Karafka Json deserializer for loading JSON data.
|
9
9
|
class Deserializer
|
10
|
-
# @param
|
10
|
+
# @param message [Karafka::Messages::Message] Message object that we want to deserialize
|
11
11
|
# @return [Hash] hash with deserialized JSON data
|
12
|
-
|
13
|
-
|
14
|
-
# 'payload' => "{\"a\":1}",
|
15
|
-
# 'topic' => 'my-topic',
|
16
|
-
# 'headers' => { 'message_type' => :test }
|
17
|
-
# }
|
18
|
-
# Deserializer.call(params) #=> { 'a' => 1 }
|
19
|
-
def call(params)
|
20
|
-
params.raw_payload.nil? ? nil : ::JSON.parse(params.raw_payload)
|
21
|
-
rescue ::JSON::ParserError => e
|
22
|
-
raise ::Karafka::Errors::DeserializationError, e
|
12
|
+
def call(message)
|
13
|
+
message.raw_payload.nil? ? nil : ::JSON.parse(message.raw_payload)
|
23
14
|
end
|
24
15
|
end
|
25
16
|
end
|
data/lib/karafka/server.rb
CHANGED
@@ -3,8 +3,6 @@
|
|
3
3
|
module Karafka
|
4
4
|
# Karafka consuming server class
|
5
5
|
class Server
|
6
|
-
@consumer_threads = Concurrent::Array.new
|
7
|
-
|
8
6
|
# How long should we sleep between checks on shutting down consumers
|
9
7
|
SUPERVISION_SLEEP = 0.1
|
10
8
|
# What system exit code should we use when we terminated forcefully
|
@@ -19,53 +17,70 @@ module Karafka
|
|
19
17
|
# Set of consuming threads. Each consumer thread contains a single consumer
|
20
18
|
attr_accessor :consumer_threads
|
21
19
|
|
20
|
+
# Set of workers
|
21
|
+
attr_accessor :workers
|
22
|
+
|
22
23
|
# Writer for list of consumer groups that we want to consume in our current process context
|
23
24
|
attr_writer :consumer_groups
|
24
25
|
|
25
26
|
# Method which runs app
|
26
27
|
def run
|
27
|
-
process.on_sigint {
|
28
|
-
process.on_sigquit {
|
29
|
-
process.on_sigterm {
|
30
|
-
|
28
|
+
process.on_sigint { stop }
|
29
|
+
process.on_sigquit { stop }
|
30
|
+
process.on_sigterm { stop }
|
31
|
+
|
32
|
+
# Start is blocking until stop is called and when we stop, it will wait until
|
33
|
+
# all of the things are ready to stop
|
34
|
+
start
|
35
|
+
|
36
|
+
# We always need to wait for Karafka to stop here since we should wait for the stop running
|
37
|
+
# in a separate thread (or trap context) to indicate everything is closed
|
38
|
+
Thread.pass until Karafka::App.stopped?
|
39
|
+
# Try its best to shutdown underlying components before re-raising
|
40
|
+
# rubocop:disable Lint/RescueException
|
41
|
+
rescue Exception => e
|
42
|
+
# rubocop:enable Lint/RescueException
|
43
|
+
stop
|
44
|
+
|
45
|
+
raise e
|
31
46
|
end
|
32
47
|
|
33
48
|
# @return [Array<String>] array with names of consumer groups that should be consumed in a
|
34
49
|
# current server context
|
35
50
|
def consumer_groups
|
36
|
-
# If not specified, a server will
|
51
|
+
# If not specified, a server will listen on all the topics
|
37
52
|
@consumer_groups ||= Karafka::App.consumer_groups.map(&:name).freeze
|
38
53
|
end
|
39
54
|
|
40
|
-
private
|
41
|
-
|
42
|
-
# @return [Karafka::Process] process wrapper instance used to catch system signal calls
|
43
|
-
def process
|
44
|
-
Karafka::App.config.internal.process
|
45
|
-
end
|
46
|
-
|
47
55
|
# Starts Karafka with a supervision
|
48
56
|
# @note We don't need to sleep because Karafka::Fetcher is locking and waiting to
|
49
57
|
# finish loop (and it won't happen until we explicitly want to stop)
|
50
|
-
def
|
58
|
+
def start
|
51
59
|
process.supervise
|
52
60
|
Karafka::App.run!
|
53
|
-
Karafka::
|
61
|
+
Karafka::Runner.new.call
|
54
62
|
end
|
55
63
|
|
56
64
|
# Stops Karafka with a supervision (as long as there is a shutdown timeout)
|
57
|
-
# If consumers won't stop in a given time frame, it will force them to exit
|
58
|
-
|
65
|
+
# If consumers or workers won't stop in a given time frame, it will force them to exit
|
66
|
+
#
|
67
|
+
# @note This method is not async. It should not be executed from the workers as it will
|
68
|
+
# lock them forever. If you need to run Karafka shutdown from within workers threads,
|
69
|
+
# please start a separate thread to do so.
|
70
|
+
def stop
|
59
71
|
Karafka::App.stop!
|
60
72
|
|
61
|
-
# See https://github.com/dry-rb/dry-configurable/issues/93
|
62
73
|
timeout = Thread.new { Karafka::App.config.shutdown_timeout }.join.value
|
63
74
|
|
64
75
|
# We check from time to time (for the timeout period) if all the threads finished
|
65
76
|
# their work and if so, we can just return and normal shutdown process will take place
|
66
|
-
|
67
|
-
|
68
|
-
|
77
|
+
# We divide it by 1000 because we use time in ms.
|
78
|
+
((timeout / 1_000) * SUPERVISION_CHECK_FACTOR).to_i.times do
|
79
|
+
if consumer_threads.count(&:alive?).zero? &&
|
80
|
+
workers.count(&:alive?).zero?
|
81
|
+
|
82
|
+
Thread.new { Karafka::App.producer.close }.join
|
83
|
+
|
69
84
|
return
|
70
85
|
end
|
71
86
|
|
@@ -74,12 +89,34 @@ module Karafka
|
|
74
89
|
|
75
90
|
raise Errors::ForcefulShutdownError
|
76
91
|
rescue Errors::ForcefulShutdownError => e
|
77
|
-
Thread.new
|
78
|
-
|
79
|
-
|
92
|
+
thread = Thread.new do
|
93
|
+
Karafka.monitor.instrument(
|
94
|
+
'error.occurred',
|
95
|
+
caller: self,
|
96
|
+
error: e,
|
97
|
+
type: 'app.stopping.error'
|
98
|
+
)
|
99
|
+
|
100
|
+
# We're done waiting, lets kill them!
|
101
|
+
workers.each(&:terminate)
|
102
|
+
consumer_threads.each(&:terminate)
|
103
|
+
|
104
|
+
Karafka::App.producer.close
|
105
|
+
end
|
106
|
+
|
107
|
+
thread.join
|
80
108
|
|
81
109
|
# exit! is not within the instrumentation as it would not trigger due to exit
|
82
110
|
Kernel.exit! FORCEFUL_EXIT_CODE
|
111
|
+
ensure
|
112
|
+
Karafka::App.stopped!
|
113
|
+
end
|
114
|
+
|
115
|
+
private
|
116
|
+
|
117
|
+
# @return [Karafka::Process] process wrapper instance used to catch system signal calls
|
118
|
+
def process
|
119
|
+
Karafka::App.config.internal.process
|
83
120
|
end
|
84
121
|
end
|
85
122
|
end
|