karafka 2.0.41 → 2.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- checksums.yaml.gz.sig +0 -0
- data/.github/workflows/ci.yml +2 -2
- data/CHANGELOG.md +23 -1
- data/Gemfile.lock +12 -12
- data/config/locales/errors.yml +10 -0
- data/config/locales/pro_errors.yml +0 -2
- data/lib/karafka/active_job/consumer.rb +16 -11
- data/lib/karafka/active_job/current_attributes/loading.rb +36 -0
- data/lib/karafka/active_job/current_attributes/persistence.rb +28 -0
- data/lib/karafka/active_job/current_attributes.rb +42 -0
- data/lib/karafka/active_job/dispatcher.rb +8 -2
- data/lib/karafka/connection/client.rb +1 -1
- data/lib/karafka/errors.rb +3 -0
- data/lib/karafka/instrumentation/vendors/kubernetes/liveness_listener.rb +176 -0
- data/lib/karafka/pro/active_job/consumer.rb +1 -10
- data/lib/karafka/pro/active_job/dispatcher.rb +2 -2
- data/lib/karafka/pro/processing/coordinator.rb +20 -1
- data/lib/karafka/pro/processing/filters/virtual_limiter.rb +52 -0
- data/lib/karafka/pro/processing/filters_applier.rb +4 -0
- data/lib/karafka/pro/processing/strategies/aj/dlq_ftr_mom_vp.rb +1 -1
- data/lib/karafka/pro/processing/strategies/aj/dlq_lrj_mom.rb +3 -1
- data/lib/karafka/pro/processing/strategies/aj/dlq_mom_vp.rb +2 -2
- data/lib/karafka/pro/processing/strategies/aj/lrj_mom_vp.rb +2 -0
- data/lib/karafka/pro/processing/strategies/aj/mom_vp.rb +1 -1
- data/lib/karafka/pro/processing/strategies/dlq/ftr.rb +1 -1
- data/lib/karafka/pro/processing/strategies/dlq/ftr_lrj_mom.rb +3 -6
- data/lib/karafka/pro/processing/strategies/dlq/ftr_lrj_mom_vp.rb +43 -0
- data/lib/karafka/pro/processing/strategies/dlq/ftr_lrj_vp.rb +1 -0
- data/lib/karafka/pro/processing/strategies/dlq/ftr_mom.rb +3 -7
- data/lib/karafka/pro/processing/strategies/dlq/ftr_mom_vp.rb +41 -0
- data/lib/karafka/pro/processing/strategies/dlq/ftr_vp.rb +1 -0
- data/lib/karafka/pro/processing/strategies/dlq/lrj_mom.rb +3 -6
- data/lib/karafka/pro/processing/strategies/dlq/lrj_mom_vp.rb +36 -0
- data/lib/karafka/pro/processing/strategies/dlq/lrj_vp.rb +1 -0
- data/lib/karafka/pro/processing/strategies/dlq/mom.rb +8 -7
- data/lib/karafka/pro/processing/strategies/dlq/mom_vp.rb +37 -0
- data/lib/karafka/pro/processing/strategies/lrj/default.rb +2 -0
- data/lib/karafka/pro/processing/strategies/lrj/ftr_mom_vp.rb +40 -0
- data/lib/karafka/pro/processing/strategies/lrj/mom.rb +2 -0
- data/lib/karafka/pro/processing/strategies/lrj/mom_vp.rb +38 -0
- data/lib/karafka/pro/processing/strategies/mom/ftr_vp.rb +37 -0
- data/lib/karafka/pro/{base_consumer.rb → processing/strategies/mom/vp.rb} +17 -7
- data/lib/karafka/pro/processing/strategies/vp/default.rb +51 -0
- data/lib/karafka/pro/processing/virtual_offset_manager.rb +147 -0
- data/lib/karafka/pro/routing/features/virtual_partitions/contract.rb +0 -17
- data/lib/karafka/processing/strategies/default.rb +2 -0
- data/lib/karafka/processing/strategies/dlq_mom.rb +9 -7
- data/lib/karafka/version.rb +1 -1
- data/lib/karafka.rb +5 -0
- data.tar.gz.sig +0 -0
- metadata +16 -4
- metadata.gz.sig +0 -0
- data/lib/karafka/instrumentation/vendors/datadog/listener.rb +0 -16
@@ -0,0 +1,147 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
# This Karafka component is a Pro component under a commercial license.
|
4
|
+
# This Karafka component is NOT licensed under LGPL.
|
5
|
+
#
|
6
|
+
# All of the commercial components are present in the lib/karafka/pro directory of this
|
7
|
+
# repository and their usage requires commercial license agreement.
|
8
|
+
#
|
9
|
+
# Karafka has also commercial-friendly license, commercial support and commercial components.
|
10
|
+
#
|
11
|
+
# By sending a pull request to the pro components, you are agreeing to transfer the copyright of
|
12
|
+
# your code to Maciej Mensfeld.
|
13
|
+
|
14
|
+
module Karafka
|
15
|
+
module Pro
|
16
|
+
module Processing
|
17
|
+
# Manager that keeps track of our offsets with the virtualization layer that are local
|
18
|
+
# to given partition assignment. It allows for easier offset management for virtual
|
19
|
+
# virtual partition cases as it provides us ability to mark as consumed and move the
|
20
|
+
# real offset behind as expected.
|
21
|
+
#
|
22
|
+
# @note We still use the regular coordinator "real" offset management as we want to have
|
23
|
+
# them as separated as possible because the real seek offset management is also used for
|
24
|
+
# pausing, filtering and others and should not be impacted by the virtual one
|
25
|
+
#
|
26
|
+
# @note This manager is **not** thread-safe by itself. It should operate from coordinator
|
27
|
+
# locked locations.
|
28
|
+
class VirtualOffsetManager
|
29
|
+
attr_reader :groups
|
30
|
+
|
31
|
+
# @param topic [String]
|
32
|
+
# @param partition [Integer]
|
33
|
+
#
|
34
|
+
# @note We need topic and partition because we use a seek message (virtual) for real offset
|
35
|
+
# management. We could keep real message reference but this can be memory consuming
|
36
|
+
# and not worth it.
|
37
|
+
def initialize(topic, partition)
|
38
|
+
@topic = topic
|
39
|
+
@partition = partition
|
40
|
+
@groups = []
|
41
|
+
@marked = {}
|
42
|
+
@real_offset = -1
|
43
|
+
end
|
44
|
+
|
45
|
+
# Clears the manager for a next collective operation
|
46
|
+
def clear
|
47
|
+
@groups.clear
|
48
|
+
@marked = {}
|
49
|
+
@real_offset = -1
|
50
|
+
end
|
51
|
+
|
52
|
+
# Registers an offset group coming from one virtual consumer. In order to move the real
|
53
|
+
# underlying offset accordingly, we need to make sure to track the virtual consumers
|
54
|
+
# offsets groups independently and only materialize the end result.
|
55
|
+
#
|
56
|
+
# @param offsets_group [Array<Integer>] offsets from one virtual consumer
|
57
|
+
def register(offsets_group)
|
58
|
+
@groups << offsets_group
|
59
|
+
|
60
|
+
offsets_group.each { |offset| @marked[offset] = false }
|
61
|
+
end
|
62
|
+
|
63
|
+
# Marks given message as marked (virtually consumed).
|
64
|
+
# We mark given message offset and other earlier offsets from the same group as done
|
65
|
+
# and we can refresh our real offset representation based on that as it might have changed
|
66
|
+
# to a newer real offset.
|
67
|
+
# @param message [Karafka::Messages::Message] message coming from VP we want to mark
|
68
|
+
def mark(message)
|
69
|
+
offset = message.offset
|
70
|
+
|
71
|
+
group = @groups.find { |reg_group| reg_group.include?(offset) }
|
72
|
+
|
73
|
+
# This case can happen when someone uses MoM and wants to mark message from a previous
|
74
|
+
# batch as consumed. We can add it, since the real offset refresh will point to it
|
75
|
+
unless group
|
76
|
+
group = [offset]
|
77
|
+
@groups << group
|
78
|
+
end
|
79
|
+
|
80
|
+
position = group.index(offset)
|
81
|
+
|
82
|
+
# Mark all previous messages from the same group also as virtually consumed
|
83
|
+
group[0..position].each do |markable_offset|
|
84
|
+
@marked[markable_offset] = true
|
85
|
+
end
|
86
|
+
|
87
|
+
# Recompute the real offset representation
|
88
|
+
materialize_real_offset
|
89
|
+
end
|
90
|
+
|
91
|
+
# Mark all from all groups including the `message`.
|
92
|
+
# Useful when operating in a collapsed state for marking
|
93
|
+
# @param message [Karafka::Messages::Message]
|
94
|
+
def mark_until(message)
|
95
|
+
mark(message)
|
96
|
+
|
97
|
+
@groups.each do |group|
|
98
|
+
group.each do |offset|
|
99
|
+
next if offset > message.offset
|
100
|
+
|
101
|
+
@marked[offset] = true
|
102
|
+
end
|
103
|
+
end
|
104
|
+
|
105
|
+
materialize_real_offset
|
106
|
+
end
|
107
|
+
|
108
|
+
# @return [Array<Integer>] Offsets of messages already marked as consumed virtually
|
109
|
+
def marked
|
110
|
+
@marked.select { |_, status| status }.map(&:first).sort
|
111
|
+
end
|
112
|
+
|
113
|
+
# Is there a real offset we can mark as consumed
|
114
|
+
# @return [Boolean]
|
115
|
+
def markable?
|
116
|
+
!@real_offset.negative?
|
117
|
+
end
|
118
|
+
|
119
|
+
# @return [Messages::Seek] markable message for real offset marking
|
120
|
+
def markable
|
121
|
+
raise Errors::InvalidRealOffsetUsage unless markable?
|
122
|
+
|
123
|
+
Messages::Seek.new(
|
124
|
+
@topic,
|
125
|
+
@partition,
|
126
|
+
@real_offset
|
127
|
+
)
|
128
|
+
end
|
129
|
+
|
130
|
+
private
|
131
|
+
|
132
|
+
# Recomputes the biggest possible real offset we can have.
|
133
|
+
# It picks the the biggest offset that has uninterrupted stream of virtually marked as
|
134
|
+
# consumed because this will be the collective offset.
|
135
|
+
def materialize_real_offset
|
136
|
+
@marked.to_a.sort_by(&:first).each do |offset, marked|
|
137
|
+
break unless marked
|
138
|
+
|
139
|
+
@real_offset = offset
|
140
|
+
end
|
141
|
+
|
142
|
+
@real_offset = (@marked.keys.min - 1) if @real_offset.negative?
|
143
|
+
end
|
144
|
+
end
|
145
|
+
end
|
146
|
+
end
|
147
|
+
end
|
@@ -44,23 +44,6 @@ module Karafka
|
|
44
44
|
|
45
45
|
[[%i[virtual_partitions partitioner], :respond_to_call]]
|
46
46
|
end
|
47
|
-
|
48
|
-
# Make sure that manual offset management is not used together with Virtual Partitions
|
49
|
-
# This would not make any sense as there would be edge cases related to skipping
|
50
|
-
# messages even if there were errors.
|
51
|
-
virtual do |data, errors|
|
52
|
-
next unless errors.empty?
|
53
|
-
|
54
|
-
virtual_partitions = data[:virtual_partitions]
|
55
|
-
manual_offset_management = data[:manual_offset_management]
|
56
|
-
active_job = data[:active_job]
|
57
|
-
|
58
|
-
next unless virtual_partitions[:active]
|
59
|
-
next unless manual_offset_management[:active]
|
60
|
-
next if active_job[:active]
|
61
|
-
|
62
|
-
[[%i[manual_offset_management], :not_with_virtual_partitions]]
|
63
|
-
end
|
64
47
|
end
|
65
48
|
end
|
66
49
|
end
|
@@ -26,6 +26,7 @@ module Karafka
|
|
26
26
|
def mark_as_consumed(message)
|
27
27
|
# Ignore earlier offsets than the one we already committed
|
28
28
|
return true if coordinator.seek_offset > message.offset
|
29
|
+
return false if revoked?
|
29
30
|
|
30
31
|
unless client.mark_as_consumed(message)
|
31
32
|
coordinator.revoke
|
@@ -46,6 +47,7 @@ module Karafka
|
|
46
47
|
def mark_as_consumed!(message)
|
47
48
|
# Ignore earlier offsets than the one we already committed
|
48
49
|
return true if coordinator.seek_offset > message.offset
|
50
|
+
return false if revoked?
|
49
51
|
|
50
52
|
unless client.mark_as_consumed!(message)
|
51
53
|
coordinator.revoke
|
@@ -29,16 +29,18 @@ module Karafka
|
|
29
29
|
# We reset the pause to indicate we will now consider it as "ok".
|
30
30
|
coordinator.pause_tracker.reset
|
31
31
|
|
32
|
-
skippable_message,
|
32
|
+
skippable_message, = find_skippable_message
|
33
33
|
|
34
34
|
dispatch_to_dlq(skippable_message)
|
35
35
|
|
36
|
-
#
|
37
|
-
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
36
|
+
# Save the next offset we want to go with after moving given message to DLQ
|
37
|
+
# Without this, we would not be able to move forward and we would end up
|
38
|
+
# in an infinite loop trying to un-pause from the message we've already processed
|
39
|
+
# Of course, since it's a MoM a rebalance or kill, will move it back as no
|
40
|
+
# offsets are being committed
|
41
|
+
coordinator.seek_offset = skippable_message.offset + 1
|
42
|
+
|
43
|
+
pause(coordinator.seek_offset, nil, false)
|
42
44
|
end
|
43
45
|
end
|
44
46
|
end
|
data/lib/karafka/version.rb
CHANGED
data/lib/karafka.rb
CHANGED
@@ -114,6 +114,11 @@ end
|
|
114
114
|
loader = Zeitwerk::Loader.for_gem
|
115
115
|
# Do not load Rails extensions by default, this will be handled by Railtie if they are needed
|
116
116
|
loader.ignore(Karafka.gem_root.join('lib/active_job'))
|
117
|
+
# Do not load CurrentAttributes components as they will be loaded if needed
|
118
|
+
# @note We have to exclude both the .rb file as well as the whole directory so users can require
|
119
|
+
# current attributes only when needed
|
120
|
+
loader.ignore(Karafka.gem_root.join('lib/karafka/active_job/current_attributes'))
|
121
|
+
loader.ignore(Karafka.gem_root.join('lib/karafka/active_job/current_attributes.rb'))
|
117
122
|
# Do not load Railtie. It will load if after everything is ready, so we don't have to load any
|
118
123
|
# Karafka components when we require this railtie. Railtie needs to be loaded last.
|
119
124
|
loader.ignore(Karafka.gem_root.join('lib/karafka/railtie'))
|
data.tar.gz.sig
CHANGED
Binary file
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: karafka
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 2.
|
4
|
+
version: 2.1.1
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Maciej Mensfeld
|
@@ -35,7 +35,7 @@ cert_chain:
|
|
35
35
|
Qf04B9ceLUaC4fPVEz10FyobjaFoY4i32xRto3XnrzeAgfEe4swLq8bQsR3w/EF3
|
36
36
|
MGU0FeSV2Yj7Xc2x/7BzLK8xQn5l7Yy75iPF+KP3vVmDHnNl
|
37
37
|
-----END CERTIFICATE-----
|
38
|
-
date: 2023-
|
38
|
+
date: 2023-05-24 00:00:00.000000000 Z
|
39
39
|
dependencies:
|
40
40
|
- !ruby/object:Gem::Dependency
|
41
41
|
name: karafka-core
|
@@ -156,6 +156,9 @@ files:
|
|
156
156
|
- lib/active_job/queue_adapters/karafka_adapter.rb
|
157
157
|
- lib/karafka.rb
|
158
158
|
- lib/karafka/active_job/consumer.rb
|
159
|
+
- lib/karafka/active_job/current_attributes.rb
|
160
|
+
- lib/karafka/active_job/current_attributes/loading.rb
|
161
|
+
- lib/karafka/active_job/current_attributes/persistence.rb
|
159
162
|
- lib/karafka/active_job/dispatcher.rb
|
160
163
|
- lib/karafka/active_job/job_extensions.rb
|
161
164
|
- lib/karafka/active_job/job_options_contract.rb
|
@@ -197,9 +200,9 @@ files:
|
|
197
200
|
- lib/karafka/instrumentation/notifications.rb
|
198
201
|
- lib/karafka/instrumentation/proctitle_listener.rb
|
199
202
|
- lib/karafka/instrumentation/vendors/datadog/dashboard.json
|
200
|
-
- lib/karafka/instrumentation/vendors/datadog/listener.rb
|
201
203
|
- lib/karafka/instrumentation/vendors/datadog/logger_listener.rb
|
202
204
|
- lib/karafka/instrumentation/vendors/datadog/metrics_listener.rb
|
205
|
+
- lib/karafka/instrumentation/vendors/kubernetes/liveness_listener.rb
|
203
206
|
- lib/karafka/licenser.rb
|
204
207
|
- lib/karafka/messages/batch_metadata.rb
|
205
208
|
- lib/karafka/messages/builders/batch_metadata.rb
|
@@ -216,7 +219,6 @@ files:
|
|
216
219
|
- lib/karafka/pro/active_job/consumer.rb
|
217
220
|
- lib/karafka/pro/active_job/dispatcher.rb
|
218
221
|
- lib/karafka/pro/active_job/job_options_contract.rb
|
219
|
-
- lib/karafka/pro/base_consumer.rb
|
220
222
|
- lib/karafka/pro/encryption.rb
|
221
223
|
- lib/karafka/pro/encryption/cipher.rb
|
222
224
|
- lib/karafka/pro/encryption/contracts/config.rb
|
@@ -233,6 +235,7 @@ files:
|
|
233
235
|
- lib/karafka/pro/processing/filters/delayer.rb
|
234
236
|
- lib/karafka/pro/processing/filters/expirer.rb
|
235
237
|
- lib/karafka/pro/processing/filters/throttler.rb
|
238
|
+
- lib/karafka/pro/processing/filters/virtual_limiter.rb
|
236
239
|
- lib/karafka/pro/processing/filters_applier.rb
|
237
240
|
- lib/karafka/pro/processing/jobs/consume_non_blocking.rb
|
238
241
|
- lib/karafka/pro/processing/jobs/revoked_non_blocking.rb
|
@@ -262,26 +265,35 @@ files:
|
|
262
265
|
- lib/karafka/pro/processing/strategies/dlq/ftr.rb
|
263
266
|
- lib/karafka/pro/processing/strategies/dlq/ftr_lrj.rb
|
264
267
|
- lib/karafka/pro/processing/strategies/dlq/ftr_lrj_mom.rb
|
268
|
+
- lib/karafka/pro/processing/strategies/dlq/ftr_lrj_mom_vp.rb
|
265
269
|
- lib/karafka/pro/processing/strategies/dlq/ftr_lrj_vp.rb
|
266
270
|
- lib/karafka/pro/processing/strategies/dlq/ftr_mom.rb
|
271
|
+
- lib/karafka/pro/processing/strategies/dlq/ftr_mom_vp.rb
|
267
272
|
- lib/karafka/pro/processing/strategies/dlq/ftr_vp.rb
|
268
273
|
- lib/karafka/pro/processing/strategies/dlq/lrj.rb
|
269
274
|
- lib/karafka/pro/processing/strategies/dlq/lrj_mom.rb
|
275
|
+
- lib/karafka/pro/processing/strategies/dlq/lrj_mom_vp.rb
|
270
276
|
- lib/karafka/pro/processing/strategies/dlq/lrj_vp.rb
|
271
277
|
- lib/karafka/pro/processing/strategies/dlq/mom.rb
|
278
|
+
- lib/karafka/pro/processing/strategies/dlq/mom_vp.rb
|
272
279
|
- lib/karafka/pro/processing/strategies/dlq/vp.rb
|
273
280
|
- lib/karafka/pro/processing/strategies/ftr/default.rb
|
274
281
|
- lib/karafka/pro/processing/strategies/ftr/vp.rb
|
275
282
|
- lib/karafka/pro/processing/strategies/lrj/default.rb
|
276
283
|
- lib/karafka/pro/processing/strategies/lrj/ftr.rb
|
277
284
|
- lib/karafka/pro/processing/strategies/lrj/ftr_mom.rb
|
285
|
+
- lib/karafka/pro/processing/strategies/lrj/ftr_mom_vp.rb
|
278
286
|
- lib/karafka/pro/processing/strategies/lrj/ftr_vp.rb
|
279
287
|
- lib/karafka/pro/processing/strategies/lrj/mom.rb
|
288
|
+
- lib/karafka/pro/processing/strategies/lrj/mom_vp.rb
|
280
289
|
- lib/karafka/pro/processing/strategies/lrj/vp.rb
|
281
290
|
- lib/karafka/pro/processing/strategies/mom/default.rb
|
282
291
|
- lib/karafka/pro/processing/strategies/mom/ftr.rb
|
292
|
+
- lib/karafka/pro/processing/strategies/mom/ftr_vp.rb
|
293
|
+
- lib/karafka/pro/processing/strategies/mom/vp.rb
|
283
294
|
- lib/karafka/pro/processing/strategies/vp/default.rb
|
284
295
|
- lib/karafka/pro/processing/strategy_selector.rb
|
296
|
+
- lib/karafka/pro/processing/virtual_offset_manager.rb
|
285
297
|
- lib/karafka/pro/routing/features/base.rb
|
286
298
|
- lib/karafka/pro/routing/features/dead_letter_queue.rb
|
287
299
|
- lib/karafka/pro/routing/features/dead_letter_queue/contract.rb
|
metadata.gz.sig
CHANGED
Binary file
|
@@ -1,16 +0,0 @@
|
|
1
|
-
# frozen_string_literal: true
|
2
|
-
|
3
|
-
require_relative 'metrics_listener'
|
4
|
-
|
5
|
-
module Karafka
|
6
|
-
module Instrumentation
|
7
|
-
# Namespace for vendor specific instrumentation
|
8
|
-
module Vendors
|
9
|
-
# Datadog specific instrumentation
|
10
|
-
module Datadog
|
11
|
-
# Alias to keep backwards compatibility
|
12
|
-
Listener = MetricsListener
|
13
|
-
end
|
14
|
-
end
|
15
|
-
end
|
16
|
-
end
|