kubernetes_leader_election 0.1.1 → 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 41efa4758ac05050cf98224f65987ca7928b1bb8f6f83198fabfc3b272f1026a
4
- data.tar.gz: 6d901c130466a461329dbf11caff97a7645f438e5c36e2a03d28ada0aa391147
3
+ metadata.gz: ebf5e530aef5aa2090bb6722def02ea09f0727b4445f1fac80391687b4b69c81
4
+ data.tar.gz: 69a5f3e755e6c401733ab118944a155a1bc706121588359912f01b937283af53
5
5
  SHA512:
6
- metadata.gz: 383f9b7a4135872be64db97a0f41ead019cf990cd200823633a365285ec473092e8f7227791a2535695f37830c075e579231b140a19ad4d848cfa1598c87e247
7
- data.tar.gz: c78cf533e76600728500baef08fb14628e67a4c5b26cd8789aba333d154cdd80457b71a2cfcf1f8fb64dd7b973679168200c39bdd2b2508005e6046ba874da75
6
+ metadata.gz: 86af0f3581d589358f6ccedeb9f04c4a39abb4dfc153c2b8e6ba69dd80b2153ffc8bf4183cd194e548e947eac9c12314517c8532ffb809f641f2e75dc1883002
7
+ data.tar.gz: f58367aff174456db85719244922b383c3972e796ecb5f6ed2f9295994c3ce323402650ffbd40c677ad851934b54220e129c9fed3216d7742d39e458586980a0
data/MIT-LICENSE ADDED
@@ -0,0 +1,20 @@
1
+ Copyright (C) 2013 Michael Grosser <michael@grosser.it>
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining
4
+ a copy of this software and associated documentation files (the
5
+ "Software"), to deal in the Software without restriction, including
6
+ without limitation the rights to use, copy, modify, merge, publish,
7
+ distribute, sublicense, and/or sell copies of the Software, and to
8
+ permit persons to whom the Software is furnished to do so, subject to
9
+ the following conditions:
10
+
11
+ The above copyright notice and this permission notice shall be
12
+ included in all copies or substantial portions of the Software.
13
+
14
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
16
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
18
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
19
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
20
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
@@ -0,0 +1,4 @@
1
+ # frozen_string_literal: true
2
+ class KubernetesLeaderElection
3
+ VERSION = "0.1.2"
4
+ end
@@ -0,0 +1,130 @@
1
+ # frozen_string_literal: true
2
+ require 'time'
3
+ require 'openssl'
4
+ require 'timeout'
5
+ require 'kubeclient'
6
+
7
+ class KubernetesLeaderElection
8
+ ALREADY_EXISTS_CODE = 409
9
+ FAILED_KUBERNETES_REQUEST =
10
+ [Timeout::Error, OpenSSL::SSL::SSLError, Kubeclient::HttpError, SystemCallError, HTTP::ConnectionError].freeze
11
+
12
+ def initialize(name, kubeclient, logger:, statsd: nil, interval: 30)
13
+ @name = name
14
+ @kubeclient = kubeclient
15
+ @statsd = statsd
16
+ @logger = logger
17
+ @interval = interval
18
+ end
19
+
20
+ # not using `call` since we never want to be restarted
21
+ def become_leader_for_life
22
+ @logger.info message: "trying to become leader ... if both pods show this, delete the #{@name} lease"
23
+ loop do
24
+ break if become_leader
25
+ sleep @interval
26
+ end
27
+ yield # signal we are leader, but keep reporting
28
+ loop do
29
+ @statsd&.increment('leader_running') # we monitor this to make sure it's always exactly 1
30
+ sleep @interval
31
+ signal_alive
32
+ end
33
+ end
34
+
35
+ private
36
+
37
+ # show that we are alive or crash because we cannot reach the api (split-brain az)
38
+ def signal_alive
39
+ with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
40
+ patch = { spec: { renewTime: microtime } }
41
+ reply = @kubeclient.patch_entity(
42
+ "leases", @name, patch, 'strategic-merge-patch', ENV.fetch("POD_NAMESPACE")
43
+ )
44
+
45
+ current_leader = reply.dig(:metadata, :ownerReferences, 0, :name)
46
+ raise "Lost leadership to #{current_leader}" if current_leader != ENV.fetch("POD_NAME")
47
+ end
48
+ end
49
+
50
+ # kubernetes needs exactly this format or it blows up
51
+ def microtime
52
+ Time.now.strftime('%FT%T.000000Z')
53
+ end
54
+
55
+ def alive?(lease)
56
+ Time.parse(lease.dig(:spec, :renewTime)) > Time.now - (2 * @interval)
57
+ end
58
+
59
+ # everyone tries to create the same leases, who succeeds is the owner,
60
+ # leases is auto-deleted by GC when owner is deleted
61
+ # same logic lives in kube-service-watcher & kube-stats
62
+ def become_leader
63
+ namespace = ENV.fetch("POD_NAMESPACE")
64
+ # retry request on regular api errors
65
+ reraise = ->(e) { e.is_a?(Kubeclient::HttpError) && e.error_code == ALREADY_EXISTS_CODE }
66
+
67
+ with_retries(*FAILED_KUBERNETES_REQUEST, reraise: reraise, times: 3) do
68
+ @kubeclient.create_entity(
69
+ "Lease",
70
+ "leases",
71
+ metadata: {
72
+ name: @name,
73
+ namespace: namespace,
74
+ ownerReferences: [{
75
+ apiVersion: "v1",
76
+ kind: "Pod",
77
+ name: ENV.fetch("POD_NAME"),
78
+ uid: ENV.fetch("POD_UID")
79
+ }]
80
+ },
81
+ spec: {
82
+ acquireTime: microtime,
83
+ holderIdentity: ENV.fetch("POD_NAME"), # shown in `kubectl get lease`
84
+ leaseDurationSeconds: @interval * 2,
85
+ leaseTransitions: 0, # will never change since we delete the lease
86
+ renewTime: microtime
87
+ }
88
+ )
89
+ end
90
+ @logger.info message: "became leader"
91
+ true # I'm the leader now
92
+ rescue Kubeclient::HttpError => e
93
+ raise e unless e.error_code == ALREADY_EXISTS_CODE # lease already exists
94
+
95
+ lease = with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
96
+ @kubeclient.get_entity("leases", @name, namespace)
97
+ rescue Kubeclient::ResourceNotFoundError
98
+ nil
99
+ end
100
+
101
+ if !lease
102
+ @logger.info message: "stale lease was deleted"
103
+ false
104
+ elsif lease.dig(:metadata, :ownerReferences, 0, :name) == ENV.fetch("POD_NAME")
105
+ @logger.info message: "still leader"
106
+ true # I restarted and am still the leader
107
+ elsif !alive?(lease)
108
+ # this is still a race-condition since we could be deleting the newly succeeded leader
109
+ # see https://github.com/kubernetes/kubernetes/issues/20572
110
+ @logger.info message: "deleting stale lease"
111
+ with_retries(*FAILED_KUBERNETES_REQUEST, times: 3) do
112
+ @kubeclient.delete_entity("leases", @name, namespace)
113
+ end
114
+ false # leader is dead, do not assume leadership here to avoid race condition
115
+ else
116
+ false # leader is still alive ... not logging to avoid repetitive noise
117
+ end
118
+ end
119
+
120
+ def with_retries(*errors, times:, reraise: nil, backoff: [0.1, 0.5, 1])
121
+ yield
122
+ rescue *errors => e
123
+ retries ||= -1
124
+ retries += 1
125
+ raise if retries >= times || reraise&.call(e)
126
+ @logger.warn message: "Retryable error", type: e.class.to_s, retries: times - retries
127
+ sleep backoff[retries] || backoff.last
128
+ retry
129
+ end
130
+ end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: kubernetes_leader_election
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.1
4
+ version: 0.1.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Michael Grosser
@@ -29,7 +29,10 @@ email: michael@grosser.it
29
29
  executables: []
30
30
  extensions: []
31
31
  extra_rdoc_files: []
32
- files: []
32
+ files:
33
+ - MIT-LICENSE
34
+ - lib/kubernetes_leader_election.rb
35
+ - lib/kubernetes_leader_election/version.rb
33
36
  homepage: https://github.com/grosser/kubernetes_leader_election
34
37
  licenses:
35
38
  - MIT