gitlab-sidekiq-fetcher 0.1.0 → 0.3.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +5 -5
- data/.gitignore +1 -1
- data/{RELEASE-GITLAB.md → README-GITLAB.md} +0 -0
- data/README.md +4 -15
- data/gitlab-sidekiq-fetcher.gemspec +4 -2
- data/lib/sidekiq-reliable-fetch.rb +2 -3
- data/lib/sidekiq-reliable-fetch/api.rb +56 -0
- data/lib/sidekiq-reliable-fetch/web.rb +24 -0
- data/lib/sidekiq/reliable_fetcher.rb +143 -0
- data/web/views/working_queue.erb +25 -0
- data/web/views/working_queues.erb +17 -0
- metadata +10 -21
- data/.gitlab-ci.yml +0 -53
- data/.rspec +0 -1
- data/Gemfile +0 -12
- data/Gemfile.lock +0 -50
- data/lib/sidekiq/base_reliable_fetch.rb +0 -185
- data/lib/sidekiq/reliable_fetch.rb +0 -40
- data/lib/sidekiq/semi_reliable_fetch.rb +0 -44
- data/spec/base_reliable_fetch_spec.rb +0 -73
- data/spec/fetch_shared_examples.rb +0 -118
- data/spec/reliable_fetch_spec.rb +0 -7
- data/spec/semi_reliable_fetch_spec.rb +0 -7
- data/spec/spec_helper.rb +0 -115
- data/test/README.md +0 -34
- data/test/config.rb +0 -31
- data/test/reliability_test.rb +0 -116
- data/test/worker.rb +0 -26
data/spec/reliable_fetch_spec.rb
DELETED
data/spec/spec_helper.rb
DELETED
@@ -1,115 +0,0 @@
|
|
1
|
-
require 'sidekiq'
|
2
|
-
require 'sidekiq/util'
|
3
|
-
require 'sidekiq/api'
|
4
|
-
require 'pry'
|
5
|
-
require 'simplecov'
|
6
|
-
|
7
|
-
SimpleCov.start
|
8
|
-
|
9
|
-
REDIS_URL = ENV['REDIS_URL'] || 'redis://localhost:6379/10'
|
10
|
-
|
11
|
-
Sidekiq.configure_client do |config|
|
12
|
-
config.redis = { url: REDIS_URL }
|
13
|
-
end
|
14
|
-
|
15
|
-
Sidekiq.logger.level = Logger::ERROR
|
16
|
-
# This file was generated by the `rspec --init` command. Conventionally, all
|
17
|
-
# specs live under a `spec` directory, which RSpec adds to the `$LOAD_PATH`.
|
18
|
-
# The generated `.rspec` file contains `--require spec_helper` which will cause
|
19
|
-
# this file to always be loaded, without a need to explicitly require it in any
|
20
|
-
# files.
|
21
|
-
#
|
22
|
-
# Given that it is always loaded, you are encouraged to keep this file as
|
23
|
-
# light-weight as possible. Requiring heavyweight dependencies from this file
|
24
|
-
# will add to the boot time of your test suite on EVERY test run, even for an
|
25
|
-
# individual file that may not need all of that loaded. Instead, consider making
|
26
|
-
# a separate helper file that requires the additional dependencies and performs
|
27
|
-
# the additional setup, and require it from the spec files that actually need
|
28
|
-
# it.
|
29
|
-
#
|
30
|
-
# See http://rubydoc.info/gems/rspec-core/RSpec/Core/Configuration
|
31
|
-
RSpec.configure do |config|
|
32
|
-
# rspec-expectations config goes here. You can use an alternate
|
33
|
-
# assertion/expectation library such as wrong or the stdlib/minitest
|
34
|
-
# assertions if you prefer.
|
35
|
-
config.expect_with :rspec do |expectations|
|
36
|
-
# This option will default to `true` in RSpec 4. It makes the `description`
|
37
|
-
# and `failure_message` of custom matchers include text for helper methods
|
38
|
-
# defined using `chain`, e.g.:
|
39
|
-
# be_bigger_than(2).and_smaller_than(4).description
|
40
|
-
# # => "be bigger than 2 and smaller than 4"
|
41
|
-
# ...rather than:
|
42
|
-
# # => "be bigger than 2"
|
43
|
-
expectations.include_chain_clauses_in_custom_matcher_descriptions = true
|
44
|
-
end
|
45
|
-
|
46
|
-
# rspec-mocks config goes here. You can use an alternate test double
|
47
|
-
# library (such as bogus or mocha) by changing the `mock_with` option here.
|
48
|
-
config.mock_with :rspec do |mocks|
|
49
|
-
# Prevents you from mocking or stubbing a method that does not exist on
|
50
|
-
# a real object. This is generally recommended, and will default to
|
51
|
-
# `true` in RSpec 4.
|
52
|
-
mocks.verify_partial_doubles = true
|
53
|
-
end
|
54
|
-
|
55
|
-
# This option will default to `:apply_to_host_groups` in RSpec 4 (and will
|
56
|
-
# have no way to turn it off -- the option exists only for backwards
|
57
|
-
# compatibility in RSpec 3). It causes shared context metadata to be
|
58
|
-
# inherited by the metadata hash of host groups and examples, rather than
|
59
|
-
# triggering implicit auto-inclusion in groups with matching metadata.
|
60
|
-
config.shared_context_metadata_behavior = :apply_to_host_groups
|
61
|
-
|
62
|
-
# The settings below are suggested to provide a good initial experience
|
63
|
-
# with RSpec, but feel free to customize to your heart's content.
|
64
|
-
=begin
|
65
|
-
# This allows you to limit a spec run to individual examples or groups
|
66
|
-
# you care about by tagging them with `:focus` metadata. When nothing
|
67
|
-
# is tagged with `:focus`, all examples get run. RSpec also provides
|
68
|
-
# aliases for `it`, `describe`, and `context` that include `:focus`
|
69
|
-
# metadata: `fit`, `fdescribe` and `fcontext`, respectively.
|
70
|
-
config.filter_run_when_matching :focus
|
71
|
-
|
72
|
-
# Allows RSpec to persist some state between runs in order to support
|
73
|
-
# the `--only-failures` and `--next-failure` CLI options. We recommend
|
74
|
-
# you configure your source control system to ignore this file.
|
75
|
-
config.example_status_persistence_file_path = "spec/examples.txt"
|
76
|
-
|
77
|
-
# Limits the available syntax to the non-monkey patched syntax that is
|
78
|
-
# recommended. For more details, see:
|
79
|
-
# - http://rspec.info/blog/2012/06/rspecs-new-expectation-syntax/
|
80
|
-
# - http://www.teaisaweso.me/blog/2013/05/27/rspecs-new-message-expectation-syntax/
|
81
|
-
# - http://rspec.info/blog/2014/05/notable-changes-in-rspec-3/#zero-monkey-patching-mode
|
82
|
-
config.disable_monkey_patching!
|
83
|
-
|
84
|
-
# This setting enables warnings. It's recommended, but in some cases may
|
85
|
-
# be too noisy due to issues in dependencies.
|
86
|
-
config.warnings = true
|
87
|
-
|
88
|
-
# Many RSpec users commonly either run the entire suite or an individual
|
89
|
-
# file, and it's useful to allow more verbose output when running an
|
90
|
-
# individual spec file.
|
91
|
-
if config.files_to_run.one?
|
92
|
-
# Use the documentation formatter for detailed output,
|
93
|
-
# unless a formatter has already been configured
|
94
|
-
# (e.g. via a command-line flag).
|
95
|
-
config.default_formatter = "doc"
|
96
|
-
end
|
97
|
-
|
98
|
-
# Print the 10 slowest examples and example groups at the
|
99
|
-
# end of the spec run, to help surface which specs are running
|
100
|
-
# particularly slow.
|
101
|
-
config.profile_examples = 10
|
102
|
-
|
103
|
-
# Run specs in random order to surface order dependencies. If you find an
|
104
|
-
# order dependency and want to debug it, you can fix the order by providing
|
105
|
-
# the seed, which is printed after each run.
|
106
|
-
# --seed 1234
|
107
|
-
config.order = :random
|
108
|
-
|
109
|
-
# Seed global randomization in this process using the `--seed` CLI option.
|
110
|
-
# Setting this allows you to use `--seed` to deterministically reproduce
|
111
|
-
# test failures related to randomization by passing the same `--seed` value
|
112
|
-
# as the one that triggered the failure.
|
113
|
-
Kernel.srand config.seed
|
114
|
-
=end
|
115
|
-
end
|
data/test/README.md
DELETED
@@ -1,34 +0,0 @@
|
|
1
|
-
# How to run
|
2
|
-
|
3
|
-
```
|
4
|
-
cd test
|
5
|
-
bundle exec ruby reliability_test.rb
|
6
|
-
```
|
7
|
-
|
8
|
-
You can adjust some parameters of the test in the `config.rb`
|
9
|
-
|
10
|
-
|
11
|
-
# How it works
|
12
|
-
|
13
|
-
This tool spawns the configured number of Sidekiq workers and, when the number of processed jobs is about half of the original
|
14
|
-
number, it kills half of the workers with `kill -9` and stops the other half with `TERM`, and then it spawns new workers again until all the jobs are processed. To track the progress and counters we use Redis keys/counters.
|
15
|
-
|
16
|
-
# How to run tests
|
17
|
-
|
18
|
-
To run rspec:
|
19
|
-
|
20
|
-
```
|
21
|
-
bundle exec rspec
|
22
|
-
```
|
23
|
-
|
24
|
-
To run performance tests:
|
25
|
-
|
26
|
-
```
|
27
|
-
cd test
|
28
|
-
JOB_FETCHER=semi bundle exec ruby reliability_test.rb
|
29
|
-
```
|
30
|
-
|
31
|
-
JOB_FETCHER can be set to one of these values: `semi`, `reliable`, `basic`
|
32
|
-
|
33
|
-
To run both kinds of tests you need to have a Redis server running on the default port `6379`. To use another port, you can define the
|
34
|
-
`REDIS_URL` environment variable with the port you need (example: `REDIS_URL="redis://localhost:9999"`).
|
data/test/config.rb
DELETED
@@ -1,31 +0,0 @@
|
|
1
|
-
# frozen_string_literal: true
|
2
|
-
|
3
|
-
require_relative '../lib/sidekiq/base_reliable_fetch'
|
4
|
-
require_relative '../lib/sidekiq/reliable_fetch'
|
5
|
-
require_relative '../lib/sidekiq/semi_reliable_fetch'
|
6
|
-
require_relative 'worker'
|
7
|
-
|
8
|
-
REDIS_FINISHED_LIST = 'reliable-fetcher-finished-jids'
|
9
|
-
|
10
|
-
NUMBER_OF_WORKERS = ENV['NUMBER_OF_WORKERS'] || 10
|
11
|
-
NUMBER_OF_JOBS = ENV['NUMBER_OF_JOBS'] || 1000
|
12
|
-
JOB_FETCHER = (ENV['JOB_FETCHER'] || :semi).to_sym # :basic, :semi, :reliable
|
13
|
-
TEST_CLEANUP_INTERVAL = 20
|
14
|
-
TEST_LEASE_INTERVAL = 5
|
15
|
-
WAIT_CLEANUP = TEST_CLEANUP_INTERVAL +
|
16
|
-
TEST_LEASE_INTERVAL +
|
17
|
-
Sidekiq::ReliableFetch::HEARTBEAT_LIFESPAN
|
18
|
-
|
19
|
-
Sidekiq.configure_server do |config|
|
20
|
-
if %i[semi reliable].include?(JOB_FETCHER)
|
21
|
-
config.options[:semi_reliable_fetch] = (JOB_FETCHER == :semi)
|
22
|
-
|
23
|
-
# We need to override these parameters to not wait too long
|
24
|
-
# The default values are good for production use only
|
25
|
-
# These will be ignored for :basic
|
26
|
-
config.options[:cleanup_interval] = TEST_CLEANUP_INTERVAL
|
27
|
-
config.options[:lease_interval] = TEST_LEASE_INTERVAL
|
28
|
-
|
29
|
-
Sidekiq::ReliableFetch.setup_reliable_fetch!(config)
|
30
|
-
end
|
31
|
-
end
|
data/test/reliability_test.rb
DELETED
@@ -1,116 +0,0 @@
|
|
1
|
-
# frozen_string_literal: true
|
2
|
-
|
3
|
-
require 'sidekiq'
|
4
|
-
require 'sidekiq/util'
|
5
|
-
require 'sidekiq/cli'
|
6
|
-
require_relative 'config'
|
7
|
-
|
8
|
-
def spawn_workers_and_stop_them_on_a_half_way
|
9
|
-
pids = spawn_workers
|
10
|
-
|
11
|
-
wait_until do |queue_size|
|
12
|
-
queue_size < NUMBER_OF_JOBS / 2
|
13
|
-
end
|
14
|
-
|
15
|
-
first_half_pids, second_half_pids = split_array(pids)
|
16
|
-
|
17
|
-
puts 'Killing half of the workers...'
|
18
|
-
signal_to_workers('KILL', first_half_pids)
|
19
|
-
|
20
|
-
puts 'Stopping another half of the workers...'
|
21
|
-
signal_to_workers('TERM', second_half_pids)
|
22
|
-
end
|
23
|
-
|
24
|
-
def spawn_workers_and_let_them_finish
|
25
|
-
puts 'Spawn workers and let them finish...'
|
26
|
-
|
27
|
-
pids = spawn_workers
|
28
|
-
|
29
|
-
wait_until do |queue_size|
|
30
|
-
queue_size.zero?
|
31
|
-
end
|
32
|
-
|
33
|
-
if %i[semi reliable].include? JOB_FETCHER
|
34
|
-
puts 'Waiting for clean up process that will requeue dead jobs...'
|
35
|
-
sleep WAIT_CLEANUP
|
36
|
-
end
|
37
|
-
|
38
|
-
signal_to_workers('TERM', pids)
|
39
|
-
end
|
40
|
-
|
41
|
-
def wait_until
|
42
|
-
loop do
|
43
|
-
sleep 3
|
44
|
-
|
45
|
-
queue_size = current_queue_size
|
46
|
-
puts "Jobs in the queue:#{queue_size}"
|
47
|
-
|
48
|
-
break if yield(queue_size)
|
49
|
-
end
|
50
|
-
end
|
51
|
-
|
52
|
-
def signal_to_workers(signal, pids)
|
53
|
-
pids.each { |pid| Process.kill(signal, pid) }
|
54
|
-
pids.each { |pid| Process.wait(pid) }
|
55
|
-
end
|
56
|
-
|
57
|
-
def spawn_workers
|
58
|
-
pids = []
|
59
|
-
NUMBER_OF_WORKERS.times do
|
60
|
-
pids << spawn('sidekiq -r ./config.rb')
|
61
|
-
end
|
62
|
-
|
63
|
-
pids
|
64
|
-
end
|
65
|
-
|
66
|
-
def current_queue_size
|
67
|
-
Sidekiq.redis { |c| c.llen('queue:default') }
|
68
|
-
end
|
69
|
-
|
70
|
-
def duplicates
|
71
|
-
Sidekiq.redis { |c| c.llen(REDIS_FINISHED_LIST) }
|
72
|
-
end
|
73
|
-
|
74
|
-
# Splits array into two halves
|
75
|
-
def split_array(arr)
|
76
|
-
first_arr = arr.take(arr.size / 2)
|
77
|
-
second_arr = arr - first_arr
|
78
|
-
[first_arr, second_arr]
|
79
|
-
end
|
80
|
-
|
81
|
-
##########################################################
|
82
|
-
|
83
|
-
puts '########################################'
|
84
|
-
puts "Mode: #{JOB_FETCHER}"
|
85
|
-
puts '########################################'
|
86
|
-
|
87
|
-
Sidekiq.redis(&:flushdb)
|
88
|
-
|
89
|
-
jobs = []
|
90
|
-
|
91
|
-
NUMBER_OF_JOBS.times do
|
92
|
-
jobs << TestWorker.perform_async
|
93
|
-
end
|
94
|
-
|
95
|
-
puts "Queued #{NUMBER_OF_JOBS} jobs"
|
96
|
-
|
97
|
-
spawn_workers_and_stop_them_on_a_half_way
|
98
|
-
spawn_workers_and_let_them_finish
|
99
|
-
|
100
|
-
jobs_lost = 0
|
101
|
-
|
102
|
-
Sidekiq.redis do |redis|
|
103
|
-
jobs.each do |job|
|
104
|
-
next if redis.lrem(REDIS_FINISHED_LIST, 1, job) == 1
|
105
|
-
jobs_lost += 1
|
106
|
-
end
|
107
|
-
end
|
108
|
-
|
109
|
-
puts "Remaining unprocessed: #{jobs_lost}"
|
110
|
-
puts "Duplicates found: #{duplicates}"
|
111
|
-
|
112
|
-
if jobs_lost.zero? && duplicates.zero?
|
113
|
-
exit 0
|
114
|
-
else
|
115
|
-
exit 1
|
116
|
-
end
|
data/test/worker.rb
DELETED
@@ -1,26 +0,0 @@
|
|
1
|
-
# frozen_string_literal: true
|
2
|
-
|
3
|
-
class TestWorker
|
4
|
-
include Sidekiq::Worker
|
5
|
-
|
6
|
-
def perform
|
7
|
-
# To mimic long running job and to increase the probability of losing the job
|
8
|
-
sleep 1
|
9
|
-
|
10
|
-
Sidekiq.redis do |redis|
|
11
|
-
redis.lpush(REDIS_FINISHED_LIST, get_sidekiq_job_id)
|
12
|
-
end
|
13
|
-
end
|
14
|
-
|
15
|
-
def get_sidekiq_job_id
|
16
|
-
context_data = Thread.current[:sidekiq_context]&.first
|
17
|
-
|
18
|
-
return unless context_data
|
19
|
-
|
20
|
-
index = context_data.index('JID-')
|
21
|
-
|
22
|
-
return unless index
|
23
|
-
|
24
|
-
context_data[index + 4..-1]
|
25
|
-
end
|
26
|
-
end
|