kubernetes_leader_election 0.1.1 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/MIT-LICENSE +20 -0
- data/lib/kubernetes_leader_election/version.rb +4 -0
- data/lib/kubernetes_leader_election.rb +130 -0
- metadata +5 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: ebf5e530aef5aa2090bb6722def02ea09f0727b4445f1fac80391687b4b69c81
|
4
|
+
data.tar.gz: 69a5f3e755e6c401733ab118944a155a1bc706121588359912f01b937283af53
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 86af0f3581d589358f6ccedeb9f04c4a39abb4dfc153c2b8e6ba69dd80b2153ffc8bf4183cd194e548e947eac9c12314517c8532ffb809f641f2e75dc1883002
|
7
|
+
data.tar.gz: f58367aff174456db85719244922b383c3972e796ecb5f6ed2f9295994c3ce323402650ffbd40c677ad851934b54220e129c9fed3216d7742d39e458586980a0
|
data/MIT-LICENSE
ADDED
@@ -0,0 +1,20 @@
|
|
1
|
+
Copyright (C) 2013 Michael Grosser <michael@grosser.it>
|
2
|
+
|
3
|
+
Permission is hereby granted, free of charge, to any person obtaining
|
4
|
+
a copy of this software and associated documentation files (the
|
5
|
+
"Software"), to deal in the Software without restriction, including
|
6
|
+
without limitation the rights to use, copy, modify, merge, publish,
|
7
|
+
distribute, sublicense, and/or sell copies of the Software, and to
|
8
|
+
permit persons to whom the Software is furnished to do so, subject to
|
9
|
+
the following conditions:
|
10
|
+
|
11
|
+
The above copyright notice and this permission notice shall be
|
12
|
+
included in all copies or substantial portions of the Software.
|
13
|
+
|
14
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
15
|
+
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
16
|
+
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
17
|
+
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
18
|
+
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
19
|
+
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
20
|
+
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
@@ -0,0 +1,130 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
require 'time'
|
3
|
+
require 'openssl'
|
4
|
+
require 'timeout'
|
5
|
+
require 'kubeclient'
|
6
|
+
|
7
|
+
class KubernetesLeaderElection
|
8
|
+
ALREADY_EXISTS_CODE = 409
|
9
|
+
FAILED_KUBERNETES_REQUEST =
|
10
|
+
[Timeout::Error, OpenSSL::SSL::SSLError, Kubeclient::HttpError, SystemCallError, HTTP::ConnectionError].freeze
|
11
|
+
|
12
|
+
def initialize(name, kubeclient, logger:, statsd: nil, interval: 30)
|
13
|
+
@name = name
|
14
|
+
@kubeclient = kubeclient
|
15
|
+
@statsd = statsd
|
16
|
+
@logger = logger
|
17
|
+
@interval = interval
|
18
|
+
end
|
19
|
+
|
20
|
+
# not using `call` since we never want to be restarted
|
21
|
+
def become_leader_for_life
|
22
|
+
@logger.info message: "trying to become leader ... if both pods show this, delete the #{@name} lease"
|
23
|
+
loop do
|
24
|
+
break if become_leader
|
25
|
+
sleep @interval
|
26
|
+
end
|
27
|
+
yield # signal we are leader, but keep reporting
|
28
|
+
loop do
|
29
|
+
@statsd&.increment('leader_running') # we monitor this to make sure it's always exactly 1
|
30
|
+
sleep @interval
|
31
|
+
signal_alive
|
32
|
+
end
|
33
|
+
end
|
34
|
+
|
35
|
+
private
|
36
|
+
|
37
|
+
# show that we are alive or crash because we cannot reach the api (split-brain az)
|
38
|
+
def signal_alive
|
39
|
+
with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
|
40
|
+
patch = { spec: { renewTime: microtime } }
|
41
|
+
reply = @kubeclient.patch_entity(
|
42
|
+
"leases", @name, patch, 'strategic-merge-patch', ENV.fetch("POD_NAMESPACE")
|
43
|
+
)
|
44
|
+
|
45
|
+
current_leader = reply.dig(:metadata, :ownerReferences, 0, :name)
|
46
|
+
raise "Lost leadership to #{current_leader}" if current_leader != ENV.fetch("POD_NAME")
|
47
|
+
end
|
48
|
+
end
|
49
|
+
|
50
|
+
# kubernetes needs exactly this format or it blows up
|
51
|
+
def microtime
|
52
|
+
Time.now.strftime('%FT%T.000000Z')
|
53
|
+
end
|
54
|
+
|
55
|
+
def alive?(lease)
|
56
|
+
Time.parse(lease.dig(:spec, :renewTime)) > Time.now - (2 * @interval)
|
57
|
+
end
|
58
|
+
|
59
|
+
# everyone tries to create the same leases, who succeeds is the owner,
|
60
|
+
# leases is auto-deleted by GC when owner is deleted
|
61
|
+
# same logic lives in kube-service-watcher & kube-stats
|
62
|
+
def become_leader
|
63
|
+
namespace = ENV.fetch("POD_NAMESPACE")
|
64
|
+
# retry request on regular api errors
|
65
|
+
reraise = ->(e) { e.is_a?(Kubeclient::HttpError) && e.error_code == ALREADY_EXISTS_CODE }
|
66
|
+
|
67
|
+
with_retries(*FAILED_KUBERNETES_REQUEST, reraise: reraise, times: 3) do
|
68
|
+
@kubeclient.create_entity(
|
69
|
+
"Lease",
|
70
|
+
"leases",
|
71
|
+
metadata: {
|
72
|
+
name: @name,
|
73
|
+
namespace: namespace,
|
74
|
+
ownerReferences: [{
|
75
|
+
apiVersion: "v1",
|
76
|
+
kind: "Pod",
|
77
|
+
name: ENV.fetch("POD_NAME"),
|
78
|
+
uid: ENV.fetch("POD_UID")
|
79
|
+
}]
|
80
|
+
},
|
81
|
+
spec: {
|
82
|
+
acquireTime: microtime,
|
83
|
+
holderIdentity: ENV.fetch("POD_NAME"), # shown in `kubectl get lease`
|
84
|
+
leaseDurationSeconds: @interval * 2,
|
85
|
+
leaseTransitions: 0, # will never change since we delete the lease
|
86
|
+
renewTime: microtime
|
87
|
+
}
|
88
|
+
)
|
89
|
+
end
|
90
|
+
@logger.info message: "became leader"
|
91
|
+
true # I'm the leader now
|
92
|
+
rescue Kubeclient::HttpError => e
|
93
|
+
raise e unless e.error_code == ALREADY_EXISTS_CODE # lease already exists
|
94
|
+
|
95
|
+
lease = with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
|
96
|
+
@kubeclient.get_entity("leases", @name, namespace)
|
97
|
+
rescue Kubeclient::ResourceNotFoundError
|
98
|
+
nil
|
99
|
+
end
|
100
|
+
|
101
|
+
if !lease
|
102
|
+
@logger.info message: "stale lease was deleted"
|
103
|
+
false
|
104
|
+
elsif lease.dig(:metadata, :ownerReferences, 0, :name) == ENV.fetch("POD_NAME")
|
105
|
+
@logger.info message: "still leader"
|
106
|
+
true # I restarted and am still the leader
|
107
|
+
elsif !alive?(lease)
|
108
|
+
# this is still a race-condition since we could be deleting the newly succeeded leader
|
109
|
+
# see https://github.com/kubernetes/kubernetes/issues/20572
|
110
|
+
@logger.info message: "deleting stale lease"
|
111
|
+
with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
|
112
|
+
@kubeclient.delete_entity("leases", @name, namespace)
|
113
|
+
end
|
114
|
+
false # leader is dead, do not assume leadership here to avoid race condition
|
115
|
+
else
|
116
|
+
false # leader is still alive ... not logging to avoid repetitive noise
|
117
|
+
end
|
118
|
+
end
|
119
|
+
|
120
|
+
def with_retries(*errors, times:, reraise: nil, backoff: [0.1, 0.5, 1])
|
121
|
+
yield
|
122
|
+
rescue *errors => e
|
123
|
+
retries ||= -1
|
124
|
+
retries += 1
|
125
|
+
raise if retries >= times || reraise&.call(e)
|
126
|
+
@logger.warn message: "Retryable error", type: e.class.to_s, retries: times - retries
|
127
|
+
sleep backoff[retries] || backoff.last
|
128
|
+
retry
|
129
|
+
end
|
130
|
+
end
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: kubernetes_leader_election
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.
|
4
|
+
version: 0.1.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Michael Grosser
|
@@ -29,7 +29,10 @@ email: michael@grosser.it
|
|
29
29
|
executables: []
|
30
30
|
extensions: []
|
31
31
|
extra_rdoc_files: []
|
32
|
-
files:
|
32
|
+
files:
|
33
|
+
- MIT-LICENSE
|
34
|
+
- lib/kubernetes_leader_election.rb
|
35
|
+
- lib/kubernetes_leader_election/version.rb
|
33
36
|
homepage: https://github.com/grosser/kubernetes_leader_election
|
34
37
|
licenses:
|
35
38
|
- MIT
|