daemon_controller 1.2.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,16 +1,18 @@
1
+ # frozen_string_literal: true
2
+
1
3
  # daemon_controller, library for robust daemon management
2
- # Copyright (c) 2010-2014 Phusion
3
- #
4
+ # Copyright (c) 2010-2025 Asynchronous B.V.
5
+ #
4
6
  # Permission is hereby granted, free of charge, to any person obtaining a copy
5
7
  # of this software and associated documentation files (the "Software"), to deal
6
8
  # in the Software without restriction, including without limitation the rights
7
9
  # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
8
10
  # copies of the Software, and to permit persons to whom the Software is
9
11
  # furnished to do so, subject to the following conditions:
10
- #
12
+ #
11
13
  # The above copyright notice and this permission notice shall be included in
12
14
  # all copies or substantial portions of the Software.
13
- #
15
+ #
14
16
  # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15
17
  # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16
18
  # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
@@ -19,855 +21,943 @@
19
21
  # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
20
22
  # THE SOFTWARE.
21
23
 
22
- require 'tempfile'
23
- require 'fcntl'
24
- require 'socket'
25
- require 'timeout'
26
- if Process.respond_to?(:spawn)
27
- require 'rbconfig'
28
- end
24
+ require "tempfile"
25
+ require "fcntl"
26
+ require "socket"
27
+ require "pathname"
28
+ require "timeout"
29
+ require "rbconfig"
29
30
 
30
- require 'daemon_controller/lock_file'
31
+ require_relative "daemon_controller/lock_file"
31
32
 
32
33
  # Main daemon controller object. See the README for an introduction and tutorial.
33
34
  class DaemonController
34
- ALLOWED_CONNECT_EXCEPTIONS = [Errno::ECONNREFUSED, Errno::ENETUNREACH,
35
- Errno::ETIMEDOUT, Errno::ECONNRESET, Errno::EINVAL,
36
- Errno::EADDRNOTAVAIL]
37
-
38
- SPAWNER_FILE = File.expand_path(File.join(File.dirname(__FILE__),
39
- "daemon_controller", "spawn.rb"))
40
-
41
- class Error < StandardError
42
- end
43
- class TimeoutError < Error
44
- end
45
- class AlreadyStarted < Error
46
- end
47
- class StartError < Error
48
- end
49
- class StartTimeout < TimeoutError
50
- end
51
- class StopError < Error
52
- end
53
- class StopTimeout < TimeoutError
54
- end
55
- class ConnectError < Error
56
- end
57
- class DaemonizationTimeout < TimeoutError
58
- end
59
-
60
- # Create a new DaemonController object.
61
- #
62
- # === Mandatory options
63
- #
64
- # [:identifier]
65
- # A human-readable, unique name for this daemon, e.g. "Sphinx search server".
66
- # This identifier will be used in some error messages. On some platforms, it will
67
- # be used for concurrency control: on such platforms, no two DaemonController
68
- # objects will operate on the same identifier on the same time.
69
- #
70
- # [:start_command]
71
- # The command to start the daemon. This must be a a String, e.g.
72
- # "mongrel_rails start -e production", or a Proc which returns a String.
73
- #
74
- # If the value is a Proc, and the +before_start+ option is given too, then
75
- # the +start_command+ Proc is guaranteed to be called after the +before_start+
76
- # Proc is called.
77
- #
78
- # [:ping_command]
79
- # The ping command is used to check whether the daemon can be connected to.
80
- # It is also used to ensure that #start only returns when the daemon can be
81
- # connected to.
82
- #
83
- # The value may be a command string. This command must exit with an exit code of
84
- # 0 if the daemon can be successfully connected to, or exit with a non-0 exit
85
- # code on failure.
86
- #
87
- # The value may also be an Array which specifies the socket address of the daemon.
88
- # It must be in one of the following forms:
89
- # - [:tcp, host_name, port]
90
- # - [:unix, filename]
91
- #
92
- # The value may also be a Proc, which returns an expression that evaluates to
93
- # true (indicating that the daemon can be connected to) or false (failure).
94
- # If the Proc raises Errno::ECONNREFUSED, Errno::ENETUNREACH, Errno::ETIMEDOUT
95
- # Errno::ECONNRESET, Errno::EINVAL or Errno::EADDRNOTAVAIL then that also
96
- # means that the daemon cannot be connected to.
97
- # <b>NOTE:</b> if the ping command returns an object which responds to
98
- # <tt>#close</tt>, then that method will be called on it.
99
- # This makes it possible to specify a ping command such as
100
- # <tt>lambda { TCPSocket.new('localhost', 1234) }</tt>, without having to worry
101
- # about closing it afterwards.
102
- # Any exceptions raised by #close are ignored.
103
- #
104
- # [:pid_file]
105
- # The PID file that the daemon will write to. Used to check whether the daemon
106
- # is running.
107
- #
108
- # [:lock_file]
109
- # The lock file to use for serializing concurrent daemon management operations.
110
- # Defaults to "(filename of PID file).lock".
111
- #
112
- # [:log_file]
113
- # The log file that the daemon will write to. It will be consulted to see
114
- # whether the daemon has printed any error messages during startup.
115
- #
116
- # === Optional options
117
- # [:stop_command]
118
- # A command to stop the daemon with, e.g. "/etc/rc.d/nginx stop". If no stop
119
- # command is given (i.e. +nil+), then DaemonController will stop the daemon
120
- # by killing the PID written in the PID file.
121
- #
122
- # The default value is +nil+.
123
- #
124
- # [:restart_command]
125
- # A command to restart the daemon with, e.g. "/etc/rc.d/nginx restart". If
126
- # no restart command is given (i.e. +nil+), then DaemonController will
127
- # restart the daemon by calling #stop and #start.
128
- #
129
- # The default value is +nil+.
130
- #
131
- # [:before_start]
132
- # This may be a Proc. It will be called just before running the start command.
133
- # The before_start proc is not subject to the start timeout.
134
- #
135
- # [:start_timeout]
136
- # The maximum amount of time, in seconds, that #start may take to start
137
- # the daemon. Since #start also waits until the daemon can be connected to,
138
- # that wait time is counted as well. If the daemon does not start in time,
139
- # then #start will raise an exception.
140
- #
141
- # The default value is 15.
142
- #
143
- # [:stop_timeout]
144
- # The maximum amount of time, in seconds, that #stop may take to stop
145
- # the daemon. Since #stop also waits until the daemon is no longer running,
146
- # that wait time is counted as well. If the daemon does not stop in time,
147
- # then #stop will raise an exception.
148
- #
149
- # The default value is 15.
150
- #
151
- # [:log_file_activity_timeout]
152
- # Once a daemon has gone into the background, it will become difficult to
153
- # know for certain whether it is still initializing or whether it has
154
- # failed and exited, until it has written its PID file. Suppose that it
155
- # failed with an error after daemonizing but before it has written its PID file;
156
- # not many system administrators want to wait 15 seconds (the default start
157
- # timeout) to be notified of whether the daemon has terminated with an error.
158
- #
159
- # An alternative way to check whether the daemon has terminated with an error,
160
- # is by checking whether its log file has been recently updated. If, after the
161
- # daemon has started, the log file hasn't been updated for the amount of seconds
162
- # given by the :log_file_activity_timeout option, then the daemon is assumed to
163
- # have terminated with an error.
164
- #
165
- # The default value is 7.
166
- #
167
- # [:daemonize_for_me]
168
- # Normally daemon_controller will wait until the daemon has daemonized into the
169
- # background, in order to capture any errors that it may print on stdout or
170
- # stderr before daemonizing. However, if the daemon doesn't support daemonization
171
- # for some reason, then setting this option to true will cause daemon_controller
172
- # to do the daemonization for the daemon.
173
- #
174
- # The default is false.
175
- #
176
- # [:keep_ios]
177
- # Upon spawning the daemon, daemon_controller will normally close all file
178
- # descriptors except stdin, stdout and stderr. However if there are any file
179
- # descriptors you want to keep open, specify the IO objects here. This must be
180
- # an array of IO objects.
181
- #
182
- # [:env]
183
- # This must be a Hash. The hash will contain the environment variables available
184
- # to be made available to the daemon. Hash keys must be strings, not symbols.
185
- def initialize(options)
186
- [:identifier, :start_command, :ping_command, :pid_file, :log_file].each do |option|
187
- if !options.has_key?(option)
188
- raise ArgumentError, "The ':#{option}' option is mandatory."
189
- end
190
- end
191
- @identifier = options[:identifier]
192
- @start_command = options[:start_command]
193
- @stop_command = options[:stop_command]
194
- @ping_command = options[:ping_command]
195
- @restart_command = options[:restart_command]
196
- @ping_interval = options[:ping_interval] || 0.1
197
- @pid_file = options[:pid_file]
198
- @log_file = options[:log_file]
199
- @before_start = options[:before_start]
200
- @start_timeout = options[:start_timeout] || 15
201
- @stop_timeout = options[:stop_timeout] || 15
202
- @log_file_activity_timeout = options[:log_file_activity_timeout] || 7
203
- @daemonize_for_me = options[:daemonize_for_me]
204
- @keep_ios = options[:keep_ios] || []
205
- @lock_file = determine_lock_file(options, @identifier, @pid_file)
206
- @env = options[:env] || {}
207
- end
208
-
209
- # Start the daemon and wait until it can be pinged.
210
- #
211
- # Raises:
212
- # - AlreadyStarted - the daemon is already running.
213
- # - StartError - the start command failed.
214
- # - StartTimeout - the daemon did not start in time. This could also
215
- # mean that the daemon failed after it has gone into the background.
216
- def start
217
- @lock_file.exclusive_lock do
218
- start_without_locking
219
- end
220
- end
221
-
222
- # Connect to the daemon by running the given block, which contains the
223
- # connection logic. If the daemon isn't already running, then it will be
224
- # started.
225
- #
226
- # The block must return nil or raise Errno::ECONNREFUSED, Errno::ENETUNREACH,
227
- # Errno::ETIMEDOUT, Errno::ECONNRESET, Errno::EINVAL and Errno::EADDRNOTAVAIL
228
- # to indicate that the daemon cannot be
229
- # connected to. It must return non-nil if the daemon can be connected to.
230
- # Upon successful connection, the return value of the block will
231
- # be returned by #connect.
232
- #
233
- # Note that the block may be called multiple times.
234
- #
235
- # Raises:
236
- # - StartError - an attempt to start the daemon was made, but the start
237
- # command failed with an error.
238
- # - StartTimeout - an attempt to start the daemon was made, but the daemon
239
- # did not start in time, or it failed after it has gone into the background.
240
- # - ConnectError - the daemon wasn't already running, but we couldn't connect
241
- # to the daemon even after starting it.
242
- def connect
243
- connection = nil
244
- @lock_file.shared_lock do
245
- begin
246
- connection = yield
247
- rescue *ALLOWED_CONNECT_EXCEPTIONS
248
- connection = nil
249
- end
250
- end
251
- if connection.nil?
252
- @lock_file.exclusive_lock do
253
- if !daemon_is_running?
254
- start_without_locking
255
- end
256
- connect_exception = nil
257
- begin
258
- connection = yield
259
- rescue *ALLOWED_CONNECT_EXCEPTIONS => e
260
- connection = nil
261
- connect_exception = e
262
- end
263
- if connection.nil?
264
- # Daemon is running but we couldn't connect to it. Possible
265
- # reasons:
266
- # - The daemon froze.
267
- # - Bizarre security restrictions.
268
- # - There's a bug in the yielded code.
269
- if connect_exception
270
- raise ConnectError, "Cannot connect to the daemon: #{connect_exception} (#{connect_exception.class})"
271
- else
272
- raise ConnectError, "Cannot connect to the daemon"
273
- end
274
- else
275
- return connection
276
- end
277
- end
278
- else
279
- return connection
280
- end
281
- end
282
-
283
- # Stop the daemon and wait until it has exited.
284
- #
285
- # Raises:
286
- # - StopError - the stop command failed.
287
- # - StopTimeout - the daemon didn't stop in time.
288
- def stop
289
- @lock_file.exclusive_lock do
290
- begin
291
- Timeout.timeout(@stop_timeout, Timeout::Error) do
292
- kill_daemon
293
- wait_until do
294
- !daemon_is_running?
295
- end
296
- end
297
- rescue Timeout::Error
298
- raise StopTimeout, "Daemon '#{@identifier}' did not exit in time"
299
- end
300
- end
301
- end
302
-
303
- # Restarts the daemon. Uses the restart_command if provided, otherwise
304
- # calls #stop and #start.
305
- def restart
306
- if @restart_command
307
- run_command(@restart_command)
308
- else
309
- stop
310
- start
311
- end
312
- end
313
-
314
- # Returns the daemon's PID, as reported by its PID file. Returns the PID
315
- # as an integer, or nil there is no valid PID in the PID file.
316
- #
317
- # This method doesn't check whether the daemon's actually running.
318
- # Use #running? if you want to check whether it's actually running.
319
- #
320
- # Raises SystemCallError or IOError if something went wrong during
321
- # reading of the PID file.
322
- def pid
323
- @lock_file.shared_lock do
324
- return read_pid_file
325
- end
326
- end
327
-
328
- # Checks whether the daemon is still running. This is done by reading
329
- # the PID file and then checking whether there is a process with that
330
- # PID.
331
- #
332
- # Raises SystemCallError or IOError if something went wrong during
333
- # reading of the PID file.
334
- def running?
335
- @lock_file.shared_lock do
336
- return daemon_is_running?
337
- end
338
- end
339
-
340
- # Checks whether ping Unix domain sockets is supported. Currently
341
- # this is supported on all Ruby implementations, except JRuby.
342
- def self.can_ping_unix_sockets?
343
- return RUBY_PLATFORM != "java"
344
- end
345
-
346
- private
347
- def start_without_locking
348
- if daemon_is_running?
349
- raise AlreadyStarted, "Daemon '#{@identifier}' is already started"
350
- end
351
- save_log_file_information
352
- delete_pid_file
353
- begin
354
- started = false
355
- before_start
356
- Timeout.timeout(@start_timeout, Timeout::Error) do
357
- done = false
358
- spawn_daemon
359
- record_activity
360
-
361
- # We wait until the PID file is available and until
362
- # the daemon responds to pings, but we wait no longer
363
- # than @start_timeout seconds in total (including daemon
364
- # spawn time).
365
- # Furthermore, if the log file hasn't changed for
366
- # @log_file_activity_timeout seconds, and the PID file
367
- # still isn't available or the daemon still doesn't
368
- # respond to pings, then assume that the daemon has
369
- # terminated with an error.
370
- wait_until do
371
- if log_file_has_changed?
372
- record_activity
373
- elsif no_activity?(@log_file_activity_timeout)
374
- raise Timeout::Error, "Daemon seems to have exited"
375
- end
376
- pid_file_available?
377
- end
378
- wait_until(@ping_interval) do
379
- if log_file_has_changed?
380
- record_activity
381
- elsif no_activity?(@log_file_activity_timeout)
382
- raise Timeout::Error, "Daemon seems to have exited"
383
- end
384
- run_ping_command || !daemon_is_running?
385
- end
386
- started = run_ping_command
387
- end
388
- result = started
389
- rescue DaemonizationTimeout, Timeout::Error => e
390
- start_timed_out
391
- if pid_file_available?
392
- kill_daemon_with_signal(true)
393
- end
394
- if e.is_a?(DaemonizationTimeout)
395
- result = :daemonization_timeout
396
- else
397
- result = :start_timeout
398
- end
399
- end
400
- if !result
401
- raise(StartError, differences_in_log_file ||
402
- "Daemon '#{@identifier}' failed to start.")
403
- elsif result == :daemonization_timeout
404
- raise(StartTimeout, differences_in_log_file ||
405
- "Daemon '#{@identifier}' didn't daemonize in time.")
406
- elsif result == :start_timeout
407
- raise(StartTimeout, differences_in_log_file ||
408
- "Daemon '#{@identifier}' failed to start in time.")
409
- else
410
- return true
411
- end
412
- end
413
-
414
- def before_start
415
- if @before_start
416
- @before_start.call
417
- end
418
- end
419
-
420
- def spawn_daemon
421
- if @start_command.respond_to?(:call)
422
- run_command(@start_command.call)
423
- else
424
- run_command(@start_command)
425
- end
426
- end
427
-
428
- def kill_daemon
429
- if @stop_command
430
- begin
431
- run_command(@stop_command)
432
- rescue StartError => e
433
- raise StopError, e.message
434
- end
435
- else
436
- kill_daemon_with_signal
437
- end
438
- end
439
-
440
- def kill_daemon_with_signal(force = false)
441
- pid = read_pid_file
442
- if pid
443
- if force
444
- Process.kill('SIGKILL', pid)
445
- else
446
- Process.kill('SIGTERM', pid)
447
- end
448
- end
449
- rescue Errno::ESRCH, Errno::ENOENT
450
- end
451
-
452
- def daemon_is_running?
453
- begin
454
- pid = read_pid_file
455
- rescue Errno::ENOENT
456
- # The PID file may not exist, or another thread/process
457
- # executing #running? may have just deleted the PID file.
458
- # So we catch this error.
459
- pid = nil
460
- end
461
- if pid.nil?
462
- return false
463
- elsif check_pid(pid)
464
- return true
465
- else
466
- delete_pid_file
467
- return false
468
- end
469
- end
470
-
471
- def read_pid_file
472
- pid = File.read(@pid_file).strip
473
- if pid =~ /\A\d+\Z/
474
- return pid.to_i
475
- else
476
- return nil
477
- end
478
- end
479
-
480
- def delete_pid_file
481
- File.unlink(@pid_file)
482
- rescue Errno::EPERM, Errno::EACCES, Errno::ENOENT # ignore
483
- end
484
-
485
- def check_pid(pid)
486
- Process.kill(0, pid)
487
- return true
488
- rescue Errno::ESRCH
489
- return false
490
- rescue Errno::EPERM
491
- # We didn't have permission to kill the process. Either the process
492
- # is owned by someone else, or the system has draconian security
493
- # settings and we aren't allowed to kill *any* process. Assume that
494
- # the process is running.
495
- return true
496
- end
497
-
498
- def wait_until(sleep_interval = 0.1)
499
- while !yield
500
- sleep(sleep_interval)
501
- end
502
- end
503
-
504
- def wait_until_pid_file_is_available_or_log_file_has_changed
505
- while !(pid_file_available? || log_file_has_changed?)
506
- sleep 0.1
507
- end
508
- return pid_file_is_available?
509
- end
510
-
511
- def wait_until_daemon_responds_to_ping_or_has_exited_or_log_file_has_changed
512
- while !(run_ping_command || !daemon_is_running? || log_file_has_changed?)
513
- sleep(@ping_interval)
514
- end
515
- return run_ping_command
516
- end
517
-
518
- def record_activity
519
- @last_activity_time = Time.now
520
- end
521
-
522
- # Check whether there has been no recorded activity in the past +seconds+ seconds.
523
- def no_activity?(seconds)
524
- return Time.now - @last_activity_time > seconds
525
- end
526
-
527
- def pid_file_available?
528
- return File.exist?(@pid_file) && File.stat(@pid_file).size != 0
529
- end
530
-
531
- # This method does nothing and only serves as a hook for the unit test.
532
- def start_timed_out
533
- end
534
-
535
- # This method does nothing and only serves as a hook for the unit test.
536
- def daemonization_timed_out
537
- end
538
-
539
- def save_log_file_information
540
- @original_log_file_stat = File.stat(@log_file) rescue nil
541
- @current_log_file_stat = @original_log_file_stat
542
- end
543
-
544
- def log_file_has_changed?
545
- if @current_log_file_stat
546
- stat = File.stat(@log_file) rescue nil
547
- if stat
548
- result = @current_log_file_stat.mtime != stat.mtime ||
549
- @current_log_file_stat.size != stat.size
550
- @current_log_file_stat = stat
551
- return result
552
- else
553
- return true
554
- end
555
- else
556
- return false
557
- end
558
- end
559
-
560
- def differences_in_log_file
561
- if @original_log_file_stat
562
- File.open(@log_file, 'r') do |f|
563
- f.seek(@original_log_file_stat.size, IO::SEEK_SET)
564
- diff = f.read.strip
565
- if diff.empty?
566
- return nil
567
- else
568
- return diff
569
- end
570
- end
571
- else
572
- return nil
573
- end
574
- rescue Errno::ENOENT, Errno::ESPIPE
575
- # ESPIPE means the log file is a pipe.
576
- return nil
577
- end
578
-
579
- def determine_lock_file(options, identifier, pid_file)
580
- if options[:lock_file]
581
- return LockFile.new(File.expand_path(options[:lock_file]))
582
- else
583
- return LockFile.new(File.expand_path(pid_file + ".lock"))
584
- end
585
- end
586
-
587
- def self.fork_supported?
588
- return RUBY_PLATFORM != "java" && RUBY_PLATFORM !~ /win32/
589
- end
590
-
591
- def self.spawn_supported?
592
- # Process.spawn doesn't work very well in JRuby.
593
- return Process.respond_to?(:spawn) && RUBY_PLATFORM != "java"
594
- end
595
-
596
- def run_command(command)
597
- # Create tempfile for storing the command's output.
598
- tempfile = Tempfile.new('daemon-output')
599
- tempfile_path = tempfile.path
600
- File.chmod(0666, tempfile_path)
601
- tempfile.close
602
-
603
- if self.class.fork_supported? || self.class.spawn_supported?
604
- if Process.respond_to?(:spawn)
605
- options = {
606
- :in => "/dev/null",
607
- :out => tempfile_path,
608
- :err => tempfile_path,
609
- :close_others => true
610
- }
611
- @keep_ios.each do |io|
612
- options[io] = io
613
- end
614
- if @daemonize_for_me
615
- pid = Process.spawn(@env, ruby_interpreter, SPAWNER_FILE,
616
- command, options)
617
- else
618
- pid = Process.spawn(@env, command, options)
619
- end
620
- else
621
- pid = safe_fork(@daemonize_for_me) do
622
- ObjectSpace.each_object(IO) do |obj|
623
- if !@keep_ios.include?(obj)
624
- obj.close rescue nil
625
- end
626
- end
627
- STDIN.reopen("/dev/null", "r")
628
- STDOUT.reopen(tempfile_path, "w")
629
- STDERR.reopen(tempfile_path, "w")
630
- ENV.update(@env)
631
- exec(command)
632
- end
633
- end
634
-
635
- # run_command might be running in a timeout block (like
636
- # in #start_without_locking).
637
- begin
638
- interruptable_waitpid(pid)
639
- rescue Errno::ECHILD
640
- # Maybe a background thread or whatever waitpid()'ed
641
- # this child process before we had the chance. There's
642
- # no way to obtain the exit status now. Assume that
643
- # it started successfully; if it didn't we'll know
644
- # that later by checking the PID file and by pinging
645
- # it.
646
- return
647
- rescue Timeout::Error
648
- daemonization_timed_out
649
-
650
- # If the daemon doesn't fork into the background
651
- # in time, then kill it.
652
- begin
653
- Process.kill('SIGTERM', pid)
654
- rescue SystemCallError
655
- end
656
- begin
657
- Timeout.timeout(5, Timeout::Error) do
658
- begin
659
- interruptable_waitpid(pid)
660
- rescue SystemCallError
661
- end
662
- end
663
- rescue Timeout::Error
664
- begin
665
- Process.kill('SIGKILL', pid)
666
- interruptable_waitpid(pid)
667
- rescue SystemCallError
668
- end
669
- end
670
- raise DaemonizationTimeout
671
- end
672
- if $?.exitstatus != 0
673
- raise StartError, File.read(tempfile_path).strip
674
- end
675
- else
676
- if @env && !@env.empty?
677
- raise "Setting the :env option is not supported on this Ruby implementation."
678
- elsif @daemonize_for_me
679
- raise "Setting the :daemonize_for_me option is not supported on this Ruby implementation."
680
- end
681
-
682
- cmd = "#{command} >\"#{tempfile_path}\""
683
- cmd << " 2>\"#{tempfile_path}\"" unless PLATFORM =~ /mswin/
684
- if !system(cmd)
685
- raise StartError, File.read(tempfile_path).strip
686
- end
687
- end
688
- ensure
689
- File.unlink(tempfile_path) rescue nil
690
- end
691
-
692
- def run_ping_command
693
- if @ping_command.respond_to?(:call)
694
- begin
695
- value = @ping_command.call
696
- if value.respond_to?(:close)
697
- value.close rescue nil
698
- end
699
- return value
700
- rescue *ALLOWED_CONNECT_EXCEPTIONS
701
- return false
702
- end
703
- elsif @ping_command.is_a?(Array)
704
- type, *args = @ping_command
705
- if self.class.can_ping_unix_sockets?
706
- case type
707
- when :tcp
708
- hostname, port = args
709
- sockaddr = Socket.pack_sockaddr_in(port, hostname)
710
- return ping_tcp_socket(sockaddr)
711
- when :unix
712
- socket_domain = Socket::Constants::AF_LOCAL
713
- sockaddr = Socket.pack_sockaddr_un(args[0])
714
- return ping_socket(socket_domain, sockaddr)
715
- else
716
- raise ArgumentError, "Unknown ping command type #{type.inspect}"
717
- end
718
- else
719
- case type
720
- when :tcp
721
- hostname, port = args
722
- return ping_socket(hostname, port)
723
- when :unix
724
- raise "Pinging Unix domain sockets is not supported on this Ruby implementation"
725
- else
726
- raise ArgumentError, "Unknown ping command type #{type.inspect}"
727
- end
728
- end
729
- else
730
- return system(@ping_command)
731
- end
732
- end
733
-
734
- if !can_ping_unix_sockets?
735
- require 'java'
736
-
737
- def ping_socket(host_name, port)
738
- channel = java.nio.channels.SocketChannel.open
739
- begin
740
- address = java.net.InetSocketAddress.new(host_name, port)
741
- channel.configure_blocking(false)
742
- if channel.connect(address)
743
- return true
744
- end
745
-
746
- deadline = Time.now.to_f + 0.1
747
- done = false
748
- while true
749
- begin
750
- if channel.finish_connect
751
- return true
752
- end
753
- rescue java.net.ConnectException => e
754
- if e.message =~ /Connection refused/i
755
- return false
756
- else
757
- throw e
758
- end
759
- end
760
-
761
- # Not done connecting and no error.
762
- sleep 0.01
763
- if Time.now.to_f >= deadline
764
- return false
765
- end
766
- end
767
- ensure
768
- channel.close
769
- end
770
- end
771
- else
772
- def ping_socket(socket_domain, sockaddr)
773
- begin
774
- socket = Socket.new(socket_domain, Socket::Constants::SOCK_STREAM, 0)
775
- begin
776
- socket.connect_nonblock(sockaddr)
777
- rescue Errno::ENOENT, Errno::EINPROGRESS, Errno::EAGAIN, Errno::EWOULDBLOCK
778
- if select(nil, [socket], nil, 0.1)
779
- begin
780
- socket.connect_nonblock(sockaddr)
781
- rescue Errno::EISCONN
782
- rescue Errno::EINVAL
783
- if RUBY_PLATFORM =~ /freebsd/i
784
- raise Errno::ECONNREFUSED
785
- else
786
- raise
787
- end
788
- end
789
- else
790
- raise Errno::ECONNREFUSED
791
- end
792
- end
793
- return true
794
- rescue Errno::ECONNREFUSED, Errno::ENOENT
795
- return false
796
- ensure
797
- socket.close if socket
798
- end
799
- end
800
-
801
- def ping_tcp_socket(sockaddr)
802
- begin
803
- ping_socket(Socket::Constants::AF_INET, sockaddr)
804
- rescue Errno::EAFNOSUPPORT
805
- ping_socket(Socket::Constants::AF_INET6, sockaddr)
806
- end
807
- end
808
- end
809
-
810
- def ruby_interpreter
811
- if defined?(RbConfig)
812
- rb_config = RbConfig::CONFIG
813
- else
814
- rb_config = Config::CONFIG
815
- end
816
- File.join(
817
- rb_config['bindir'],
818
- rb_config['RUBY_INSTALL_NAME']
819
- ) + rb_config['EXEEXT']
820
- end
821
-
822
- def safe_fork(double_fork)
823
- pid = fork
824
- if pid.nil?
825
- begin
826
- if double_fork
827
- pid2 = fork
828
- if pid2.nil?
829
- Process.setsid
830
- yield
831
- end
832
- else
833
- yield
834
- end
835
- rescue Exception => e
836
- message = "*** Exception #{e.class} " <<
837
- "(#{e}) (process #{$$}):\n" <<
838
- "\tfrom " << e.backtrace.join("\n\tfrom ")
839
- STDERR.write(e)
840
- STDERR.flush
841
- exit!
842
- ensure
843
- exit!(0)
844
- end
845
- else
846
- if double_fork
847
- Process.waitpid(pid) rescue nil
848
- return pid
849
- else
850
- return pid
851
- end
852
- end
853
- end
854
-
855
- if RUBY_VERSION < "1.9"
856
- def interruptable_waitpid(pid)
857
- Process.waitpid(pid)
858
- end
859
- else
860
- # On Ruby 1.9, Thread#kill (which is called by timeout.rb) may
861
- # not be able to interrupt Process.waitpid. So here we use a
862
- # special version that's a bit less efficient but is at least
863
- # interruptable.
864
- def interruptable_waitpid(pid)
865
- result = nil
866
- while !result
867
- result = Process.waitpid(pid, Process::WNOHANG)
868
- sleep 0.01 if !result
869
- end
870
- return result
871
- end
872
- end
35
+ ALLOWED_CONNECT_EXCEPTIONS = [Errno::ECONNREFUSED, Errno::ENETUNREACH,
36
+ Errno::ETIMEDOUT, Errno::ECONNRESET, Errno::EINVAL,
37
+ Errno::EADDRNOTAVAIL]
38
+
39
+ SPAWNER_FILE = File.absolute_path(File.join(File.dirname(__FILE__),
40
+ "daemon_controller", "spawn.rb"))
41
+
42
+ class Error < StandardError
43
+ end
44
+
45
+ class TimeoutError < Error
46
+ end
47
+
48
+ class AlreadyStarted < Error
49
+ end
50
+
51
+ class StartError < Error
52
+ end
53
+
54
+ class StartTimeout < TimeoutError
55
+ end
56
+
57
+ class StopError < Error
58
+ end
59
+
60
+ class StopTimeout < TimeoutError
61
+ end
62
+
63
+ class ConnectError < Error
64
+ end
65
+
66
+ # Internal, not publicly thrown.
67
+ class DaemonizationTimeout < TimeoutError
68
+ attr_reader :output
69
+
70
+ def initialize(output)
71
+ super()
72
+ @output = output
73
+ end
74
+ end
75
+
76
+ # Create a new DaemonController object.
77
+ #
78
+ # === Mandatory options
79
+ #
80
+ # [:identifier]
81
+ # A human-readable, unique name for this daemon, e.g. "Sphinx search server".
82
+ # This identifier will be used in some error messages. On some platforms, it will
83
+ # be used for concurrency control: on such platforms, no two DaemonController
84
+ # objects will operate on the same identifier on the same time.
85
+ #
86
+ # [:start_command]
87
+ # The command to start the daemon. This must be a a String, e.g.
88
+ # "mongrel_rails start -e production", or a Proc which returns a String.
89
+ #
90
+ # If the value is a Proc, and the +before_start+ option is given too, then
91
+ # the +start_command+ Proc is guaranteed to be called after the +before_start+
92
+ # Proc is called.
93
+ #
94
+ # [:ping_command]
95
+ # The ping command is used to check whether the daemon can be connected to.
96
+ # It is also used to ensure that #start only returns when the daemon can be
97
+ # connected to.
98
+ #
99
+ # The value may be a command string. This command must exit with an exit code of
100
+ # 0 if the daemon can be successfully connected to, or exit with a non-0 exit
101
+ # code on failure.
102
+ #
103
+ # The value may also be an Array which specifies the socket address of the daemon.
104
+ # It must be in one of the following forms:
105
+ # - [:tcp, host_name, port]
106
+ # - [:unix, filename]
107
+ #
108
+ # The value may also be a Proc, which returns an expression that evaluates to
109
+ # true (indicating that the daemon can be connected to) or false (failure).
110
+ # If the Proc raises Errno::ECONNREFUSED, Errno::ENETUNREACH, Errno::ETIMEDOUT
111
+ # Errno::ECONNRESET, Errno::EINVAL or Errno::EADDRNOTAVAIL then that also
112
+ # means that the daemon cannot be connected to.
113
+ # <b>NOTE:</b> if the ping command returns an object which responds to
114
+ # <tt>#close</tt>, then that method will be called on it.
115
+ # This makes it possible to specify a ping command such as
116
+ # <tt>lambda { TCPSocket.new('localhost', 1234) }</tt>, without having to worry
117
+ # about closing it afterwards.
118
+ # Any exceptions raised by #close are ignored.
119
+ #
120
+ # [:pid_file]
121
+ # The PID file that the daemon will write to. Used to check whether the daemon
122
+ # is running.
123
+ #
124
+ # [:lock_file]
125
+ # The lock file to use for serializing concurrent daemon management operations.
126
+ # Defaults to "(filename of PID file).lock".
127
+ #
128
+ # [:log_file]
129
+ # The log file that the daemon will write to. It will be consulted to see
130
+ # whether the daemon has printed any error messages during startup.
131
+ #
132
+ # === Optional options
133
+ # [:stop_command]
134
+ # A command to stop the daemon with, e.g. "/etc/rc.d/nginx stop". If no stop
135
+ # command is given (i.e. +nil+), then DaemonController will stop the daemon
136
+ # by killing the PID written in the PID file.
137
+ #
138
+ # The default value is +nil+.
139
+ #
140
+ # [:restart_command]
141
+ # A command to restart the daemon with, e.g. "/etc/rc.d/nginx restart". If
142
+ # no restart command is given (i.e. +nil+), then DaemonController will
143
+ # restart the daemon by calling #stop and #start.
144
+ #
145
+ # The default value is +nil+.
146
+ #
147
+ # [:before_start]
148
+ # This may be a Proc. It will be called just before running the start command.
149
+ # The before_start proc is not subject to the start timeout.
150
+ #
151
+ # [:start_timeout]
152
+ # The maximum amount of time, in seconds, that #start may take to start
153
+ # the daemon. Since #start also waits until the daemon can be connected to,
154
+ # that wait time is counted as well. If the daemon does not start in time,
155
+ # then #start will raise an exception.
156
+ #
157
+ # The default value is 15.
158
+ #
159
+ # [:stop_timeout]
160
+ # The maximum amount of time, in seconds, that #stop may take to stop
161
+ # the daemon. Since #stop also waits until the daemon is no longer running,
162
+ # that wait time is counted as well. If the daemon does not stop in time,
163
+ # then #stop will raise an exception.
164
+ #
165
+ # The default value is 15.
166
+ #
167
+ # [:log_file_activity_timeout]
168
+ # Once a daemon has gone into the background, it will become difficult to
169
+ # know for certain whether it is still initializing or whether it has
170
+ # failed and exited, until it has written its PID file. Suppose that it
171
+ # failed with an error after daemonizing but before it has written its PID file;
172
+ # not many system administrators want to wait 15 seconds (the default start
173
+ # timeout) to be notified of whether the daemon has terminated with an error.
174
+ #
175
+ # An alternative way to check whether the daemon has terminated with an error,
176
+ # is by checking whether its log file has been recently updated. If, after the
177
+ # daemon has started, the log file hasn't been updated for the amount of seconds
178
+ # given by the :log_file_activity_timeout option, then the daemon is assumed to
179
+ # have terminated with an error.
180
+ #
181
+ # The default value is 7.
182
+ #
183
+ # [:dont_stop_if_pid_file_invalid]
184
+ # If the :stop_command option is given, then normally daemon_controller will
185
+ # always execute this command upon calling #stop. But if :dont_stop_if_pid_file_invalid
186
+ # is given, then daemon_controller will not do that if the PID file does not contain
187
+ # a valid number.
188
+ #
189
+ # The default is false.
190
+ #
191
+ # [:daemonize_for_me]
192
+ # Normally daemon_controller will wait until the daemon has daemonized into the
193
+ # background, in order to capture any errors that it may print on stdout or
194
+ # stderr before daemonizing. However, if the daemon doesn't support daemonization
195
+ # for some reason, then setting this option to true will cause daemon_controller
196
+ # to do the daemonization for the daemon.
197
+ #
198
+ # The default is false.
199
+ #
200
+ # [:keep_ios]
201
+ # Upon spawning the daemon, daemon_controller will normally close all file
202
+ # descriptors except stdin, stdout and stderr. However if there are any file
203
+ # descriptors you want to keep open, specify the IO objects here. This must be
204
+ # an array of IO objects.
205
+ #
206
+ # [:env]
207
+ # This must be a Hash. The hash will contain the environment variables available
208
+ # to be made available to the daemon. Hash keys must be strings, not symbols.
209
+ def initialize(options)
210
+ [:identifier, :start_command, :ping_command, :pid_file, :log_file].each do |option|
211
+ if !options.has_key?(option)
212
+ raise ArgumentError, "The ':#{option}' option is mandatory"
213
+ end
214
+ end
215
+ @identifier = options[:identifier]
216
+ @start_command = options[:start_command]
217
+ @stop_command = options[:stop_command]
218
+ @ping_command = options[:ping_command]
219
+ @restart_command = options[:restart_command]
220
+ @ping_interval = options[:ping_interval] || 0.1
221
+ @pid_file = options[:pid_file]
222
+ @log_file = options[:log_file]
223
+ @before_start = options[:before_start]
224
+ @start_timeout = options[:start_timeout] || 15
225
+ @stop_timeout = options[:stop_timeout] || 15
226
+ @log_file_activity_timeout = options[:log_file_activity_timeout] || 7
227
+ @dont_stop_if_pid_file_invalid = options[:dont_stop_if_pid_file_invalid]
228
+ @daemonize_for_me = options[:daemonize_for_me]
229
+ @keep_ios = options[:keep_ios] || []
230
+ @lock_file = determine_lock_file(options, @identifier, @pid_file)
231
+ @env = options[:env] || {}
232
+ end
233
+
234
+ # Start the daemon and wait until it can be pinged.
235
+ #
236
+ # Raises:
237
+ # - AlreadyStarted - the daemon is already running.
238
+ # - StartError - the start command failed.
239
+ # - StartTimeout - the daemon did not start in time. This could also
240
+ # mean that the daemon failed after it has gone into the background.
241
+ def start
242
+ @lock_file.exclusive_lock do
243
+ start_without_locking
244
+ end
245
+ end
246
+
247
+ # Connect to the daemon by running the given block, which contains the
248
+ # connection logic. If the daemon isn't already running, then it will be
249
+ # started.
250
+ #
251
+ # The block must return nil or raise Errno::ECONNREFUSED, Errno::ENETUNREACH,
252
+ # Errno::ETIMEDOUT, Errno::ECONNRESET, Errno::EINVAL and Errno::EADDRNOTAVAIL
253
+ # to indicate that the daemon cannot be
254
+ # connected to. It must return non-nil if the daemon can be connected to.
255
+ # Upon successful connection, the return value of the block will
256
+ # be returned by #connect.
257
+ #
258
+ # Note that the block may be called multiple times.
259
+ #
260
+ # Raises:
261
+ # - StartError - an attempt to start the daemon was made, but the start
262
+ # command failed with an error.
263
+ # - StartTimeout - an attempt to start the daemon was made, but the daemon
264
+ # did not start in time, or it failed after it has gone into the background.
265
+ # - ConnectError - the daemon wasn't already running, but we couldn't connect
266
+ # to the daemon even after starting it.
267
+ def connect
268
+ connection = nil
269
+ @lock_file.shared_lock do
270
+ connection = yield
271
+ rescue *ALLOWED_CONNECT_EXCEPTIONS
272
+ connection = nil
273
+ end
274
+ if connection.nil?
275
+ @lock_file.exclusive_lock do
276
+ if !daemon_is_running?
277
+ start_without_locking
278
+ end
279
+ connect_exception = nil
280
+ begin
281
+ connection = yield
282
+ rescue *ALLOWED_CONNECT_EXCEPTIONS => e
283
+ connection = nil
284
+ connect_exception = e
285
+ end
286
+ if connection.nil?
287
+ # Daemon is running but we couldn't connect to it. Possible
288
+ # reasons:
289
+ # - The daemon froze.
290
+ # - Bizarre security restrictions.
291
+ # - There's a bug in the yielded code.
292
+ if connect_exception
293
+ raise ConnectError, "Cannot connect to the daemon: #{connect_exception} (#{connect_exception.class})"
294
+ else
295
+ raise ConnectError, "Cannot connect to the daemon"
296
+ end
297
+ else
298
+ connection
299
+ end
300
+ end
301
+ else
302
+ connection
303
+ end
304
+ end
305
+
306
+ # Stop the daemon and wait until it has exited.
307
+ #
308
+ # Raises:
309
+ # - StopError - the stop command failed.
310
+ # - StopTimeout - the daemon didn't stop in time.
311
+ def stop
312
+ @lock_file.exclusive_lock do
313
+ Timeout.timeout(@stop_timeout, Timeout::Error) do
314
+ kill_daemon
315
+ wait_until do
316
+ !daemon_is_running?
317
+ end
318
+ end
319
+ rescue Timeout::Error
320
+ raise StopTimeout, "Daemon '#{@identifier}' did not exit in time"
321
+ end
322
+ end
323
+
324
+ # Restarts the daemon. Uses the restart_command if provided, otherwise
325
+ # calls #stop and #start.
326
+ def restart
327
+ if @restart_command
328
+ run_command(@restart_command)
329
+ else
330
+ stop
331
+ start
332
+ end
333
+ end
334
+
335
+ # Returns the daemon's PID, as reported by its PID file. Returns the PID
336
+ # as an integer, or nil there is no valid PID in the PID file.
337
+ #
338
+ # This method doesn't check whether the daemon's actually running.
339
+ # Use #running? if you want to check whether it's actually running.
340
+ #
341
+ # Raises SystemCallError or IOError if something went wrong during
342
+ # reading of the PID file.
343
+ def pid
344
+ @lock_file.shared_lock do
345
+ read_pid_file
346
+ end
347
+ end
348
+
349
+ # Checks whether the daemon is still running. This is done by reading
350
+ # the PID file and then checking whether there is a process with that
351
+ # PID.
352
+ #
353
+ # Raises SystemCallError or IOError if something went wrong during
354
+ # reading of the PID file.
355
+ def running?
356
+ @lock_file.shared_lock do
357
+ daemon_is_running?
358
+ end
359
+ end
360
+
361
+ # Checks whether ping Unix domain sockets is supported. Currently
362
+ # this is supported on all Ruby implementations, except JRuby.
363
+ def self.can_ping_unix_sockets?
364
+ RUBY_PLATFORM != "java"
365
+ end
366
+
367
+ private
368
+
369
+ def start_without_locking
370
+ if daemon_is_running?
371
+ raise AlreadyStarted, "Daemon '#{@identifier}' is already started"
372
+ end
373
+ save_log_file_information
374
+ delete_pid_file
375
+ begin
376
+ started = false
377
+ before_start
378
+ Timeout.timeout(@start_timeout, Timeout::Error) do
379
+ spawn_daemon
380
+ record_activity
381
+
382
+ # We wait until the PID file is available and until
383
+ # the daemon responds to pings, but we wait no longer
384
+ # than @start_timeout seconds in total (including daemon
385
+ # spawn time).
386
+ # Furthermore, if the log file hasn't changed for
387
+ # @log_file_activity_timeout seconds, and the PID file
388
+ # still isn't available or the daemon still doesn't
389
+ # respond to pings, then assume that the daemon has
390
+ # terminated with an error.
391
+ wait_until do
392
+ if log_file_has_changed?
393
+ record_activity
394
+ elsif no_activity?(@log_file_activity_timeout)
395
+ raise Timeout::Error, "Log file inactivity"
396
+ end
397
+ pid_file_available?
398
+ end
399
+ wait_until(@ping_interval) do
400
+ if log_file_has_changed?
401
+ record_activity
402
+ elsif no_activity?(@log_file_activity_timeout)
403
+ raise Timeout::Error, "Log file inactivity"
404
+ end
405
+ run_ping_command || !daemon_is_running?
406
+ end
407
+ started = run_ping_command
408
+ end
409
+ result = started
410
+ rescue DaemonizationTimeout, Timeout::Error => e
411
+ start_timed_out
412
+ if pid_file_available?
413
+ kill_daemon_with_signal(true)
414
+ end
415
+ result = if e.is_a?(DaemonizationTimeout)
416
+ :daemonization_timeout
417
+ else
418
+ :start_timeout
419
+ end
420
+ end
421
+
422
+ if !result
423
+ raise StartError, concat_spawn_output_and_logs(@spawn_output, differences_in_log_file)
424
+ elsif result == :daemonization_timeout
425
+ raise StartTimeout, concat_spawn_output_and_logs(@spawn_output, differences_in_log_file, nil, "timed out")
426
+ elsif result == :start_timeout
427
+ raise StartTimeout, concat_spawn_output_and_logs(@spawn_output, differences_in_log_file, nil, "timed out")
428
+ else
429
+ true
430
+ end
431
+ end
432
+
433
+ def before_start
434
+ if @before_start
435
+ @before_start.call
436
+ end
437
+ end
438
+
439
+ def spawn_daemon
440
+ @spawn_output = if @start_command.respond_to?(:call)
441
+ run_command(@start_command.call)
442
+ else
443
+ run_command(@start_command)
444
+ end
445
+ rescue DaemonizationTimeout => e
446
+ @spawn_output = e.output
447
+ raise e
448
+ end
449
+
450
+ def kill_daemon
451
+ if @stop_command
452
+ if @dont_stop_if_pid_file_invalid && read_pid_file.nil?
453
+ return
454
+ end
455
+ begin
456
+ run_command(@stop_command)
457
+ rescue StartError => e
458
+ raise StopError, e.message
459
+ end
460
+ else
461
+ kill_daemon_with_signal
462
+ end
463
+ end
464
+
465
+ def kill_daemon_with_signal(force = false)
466
+ pid = read_pid_file
467
+ if pid
468
+ if force
469
+ Process.kill("SIGKILL", pid)
470
+ else
471
+ Process.kill("SIGTERM", pid)
472
+ end
473
+ end
474
+ rescue Errno::ESRCH, Errno::ENOENT
475
+ end
476
+
477
+ def daemon_is_running?
478
+ begin
479
+ pid = read_pid_file
480
+ rescue Errno::ENOENT
481
+ # The PID file may not exist, or another thread/process
482
+ # executing #running? may have just deleted the PID file.
483
+ # So we catch this error.
484
+ pid = nil
485
+ end
486
+ if pid.nil?
487
+ false
488
+ elsif check_pid(pid)
489
+ true
490
+ else
491
+ delete_pid_file
492
+ false
493
+ end
494
+ end
495
+
496
+ def read_pid_file
497
+ begin
498
+ pid = File.read(@pid_file).strip
499
+ rescue Errno::ENOENT
500
+ return nil
501
+ end
502
+ if /\A\d+\Z/.match?(pid)
503
+ pid.to_i
504
+ end
505
+ end
506
+
507
+ def delete_pid_file
508
+ File.unlink(@pid_file)
509
+ rescue Errno::EPERM, Errno::EACCES, Errno::ENOENT # ignore
510
+ end
511
+
512
+ def check_pid(pid)
513
+ Process.kill(0, pid)
514
+ true
515
+ rescue Errno::ESRCH
516
+ false
517
+ rescue Errno::EPERM
518
+ # We didn't have permission to kill the process. Either the process
519
+ # is owned by someone else, or the system has draconian security
520
+ # settings and we aren't allowed to kill *any* process. Assume that
521
+ # the process is running.
522
+ true
523
+ end
524
+
525
+ def wait_until(sleep_interval = 0.1)
526
+ until yield
527
+ sleep(sleep_interval)
528
+ end
529
+ end
530
+
531
+ def wait_until_pid_file_is_available_or_log_file_has_changed
532
+ until pid_file_available? || log_file_has_changed?
533
+ sleep 0.1
534
+ end
535
+ pid_file_is_available?
536
+ end
537
+
538
+ def wait_until_daemon_responds_to_ping_or_has_exited_or_log_file_has_changed
539
+ until run_ping_command || !daemon_is_running? || log_file_has_changed?
540
+ sleep(@ping_interval)
541
+ end
542
+ run_ping_command
543
+ end
544
+
545
+ def record_activity
546
+ @last_activity_time = Time.now
547
+ end
548
+
549
+ # Check whether there has been no recorded activity in the past +seconds+ seconds.
550
+ def no_activity?(seconds)
551
+ Time.now - @last_activity_time > seconds
552
+ end
553
+
554
+ def pid_file_available?
555
+ File.exist?(@pid_file) && File.stat(@pid_file).size != 0
556
+ end
557
+
558
+ # This method does nothing and only serves as a hook for the unit test.
559
+ def start_timed_out
560
+ end
561
+
562
+ # This method does nothing and only serves as a hook for the unit test.
563
+ def daemonization_timed_out
564
+ end
565
+
566
+ def save_log_file_information
567
+ @original_log_file_stat = begin
568
+ File.stat(@log_file)
569
+ rescue
570
+ nil
571
+ end
572
+ @current_log_file_stat = @original_log_file_stat
573
+ end
574
+
575
+ def log_file_has_changed?
576
+ if @current_log_file_stat
577
+ stat = begin
578
+ File.stat(@log_file)
579
+ rescue
580
+ nil
581
+ end
582
+ if stat
583
+ result = @current_log_file_stat.mtime != stat.mtime ||
584
+ @current_log_file_stat.size != stat.size
585
+ @current_log_file_stat = stat
586
+ result
587
+ else
588
+ true
589
+ end
590
+ else
591
+ false
592
+ end
593
+ end
594
+
595
+ def differences_in_log_file
596
+ if @original_log_file_stat && @original_log_file_stat.file?
597
+ File.open(@log_file, "r") do |f|
598
+ f.seek(@original_log_file_stat.size, IO::SEEK_SET)
599
+ f.read.strip
600
+ end
601
+ end
602
+ rescue Errno::ENOENT, Errno::ESPIPE
603
+ # ESPIPE means the log file is a pipe.
604
+ nil
605
+ end
606
+
607
+ def determine_lock_file(options, identifier, pid_file)
608
+ if options[:lock_file]
609
+ LockFile.new(File.absolute_path(options[:lock_file]))
610
+ else
611
+ LockFile.new(File.absolute_path(pid_file + ".lock"))
612
+ end
613
+ end
614
+
615
+ def run_command(command)
616
+ if should_capture_output_while_running_command?
617
+ run_command_while_capturing_output(command)
618
+ else
619
+ run_command_without_capturing_output(command)
620
+ end
621
+ end
622
+
623
+ def should_capture_output_while_running_command?
624
+ if is_std_channel_chardev?(@log_file)
625
+ false
626
+ else
627
+ begin
628
+ real_log_file = Pathname.new(@log_file).realpath.to_s
629
+ rescue SystemCallError
630
+ real_log_file = nil
631
+ end
632
+ if real_log_file
633
+ !is_std_channel_chardev?(real_log_file)
634
+ else
635
+ true
636
+ end
637
+ end
638
+ end
639
+
640
+ def is_std_channel_chardev?(path)
641
+ path == "/dev/stdout" ||
642
+ path == "/dev/stderr" ||
643
+ path == "/dev/fd/1" ||
644
+ path == "/dev/fd/2" ||
645
+ path =~ %r{\A/proc/([0-9]+|self)/fd/[12]\Z}
646
+ end
647
+
648
+ def run_command_while_capturing_output(command)
649
+ # Create tempfile for storing the command's output.
650
+ tempfile = Tempfile.new("daemon-output")
651
+ tempfile.chmod(0o666)
652
+ tempfile_path = tempfile.path
653
+ tempfile.close
654
+
655
+ options = {
656
+ in: "/dev/null",
657
+ out: tempfile_path,
658
+ err: tempfile_path,
659
+ close_others: true
660
+ }
661
+ @keep_ios.each do |io|
662
+ options[io] = io
663
+ end
664
+ pid = if @daemonize_for_me
665
+ Process.spawn(@env, ruby_interpreter, SPAWNER_FILE,
666
+ command, options)
667
+ else
668
+ Process.spawn(@env, command, options)
669
+ end
670
+
671
+ # run_command might be running in a timeout block (like
672
+ # in #start_without_locking).
673
+ begin
674
+ interruptable_waitpid(pid)
675
+ rescue Errno::ECHILD
676
+ # Maybe a background thread or whatever waitpid()'ed
677
+ # this child process before we had the chance. There's
678
+ # no way to obtain the exit status now. Assume that
679
+ # it started successfully; if it didn't we'll know
680
+ # that later by checking the PID file and by pinging
681
+ # it.
682
+ return
683
+ rescue Timeout::Error
684
+ daemonization_timed_out
685
+
686
+ # If the daemon doesn't fork into the background
687
+ # in time, then kill it.
688
+ begin
689
+ Process.kill("SIGTERM", pid)
690
+ rescue SystemCallError
691
+ end
692
+ begin
693
+ Timeout.timeout(5, Timeout::Error) do
694
+ interruptable_waitpid(pid)
695
+ rescue SystemCallError
696
+ end
697
+ rescue Timeout::Error
698
+ begin
699
+ Process.kill("SIGKILL", pid)
700
+ interruptable_waitpid(pid)
701
+ rescue SystemCallError
702
+ end
703
+ end
704
+ raise DaemonizationTimeout, File.read(tempfile_path).strip
705
+ end
706
+
707
+ output = File.read(tempfile_path).strip
708
+ if $?.exitstatus != 0
709
+ raise StartError, concat_spawn_output_and_logs(output, differences_in_log_file, $?)
710
+ else
711
+ output
712
+ end
713
+ ensure
714
+ begin
715
+ File.unlink(tempfile_path)
716
+ rescue
717
+ nil
718
+ end
719
+ end
720
+
721
+ def run_command_without_capturing_output(command)
722
+ options = {
723
+ in: "/dev/null",
724
+ out: :out,
725
+ err: :err,
726
+ close_others: true
727
+ }
728
+ @keep_ios.each do |io|
729
+ options[io] = io
730
+ end
731
+ pid = if @daemonize_for_me
732
+ Process.spawn(@env, ruby_interpreter, SPAWNER_FILE,
733
+ command, options)
734
+ else
735
+ Process.spawn(@env, command, options)
736
+ end
737
+
738
+ # run_command might be running in a timeout block (like
739
+ # in #start_without_locking).
740
+ begin
741
+ interruptable_waitpid(pid)
742
+ rescue Errno::ECHILD
743
+ # Maybe a background thread or whatever waitpid()'ed
744
+ # this child process before we had the chance. There's
745
+ # no way to obtain the exit status now. Assume that
746
+ # it started successfully; if it didn't we'll know
747
+ # that later by checking the PID file and by pinging
748
+ # it.
749
+ return
750
+ rescue Timeout::Error
751
+ daemonization_timed_out
752
+
753
+ # If the daemon doesn't fork into the background
754
+ # in time, then kill it.
755
+ begin
756
+ Process.kill("SIGTERM", pid)
757
+ rescue SystemCallError
758
+ end
759
+ begin
760
+ Timeout.timeout(5, Timeout::Error) do
761
+ interruptable_waitpid(pid)
762
+ rescue SystemCallError
763
+ end
764
+ rescue Timeout::Error
765
+ begin
766
+ Process.kill("SIGKILL", pid)
767
+ interruptable_waitpid(pid)
768
+ rescue SystemCallError
769
+ end
770
+ end
771
+ raise DaemonizationTimeout, nil
772
+ end
773
+ if $?.exitstatus != 0
774
+ raise StartError, concat_spawn_output_and_logs(nil, differences_in_log_file, $?)
775
+ end
776
+ end
777
+
778
+ def run_ping_command
779
+ if @ping_command.respond_to?(:call)
780
+ begin
781
+ value = @ping_command.call
782
+ if value.respond_to?(:close)
783
+ begin
784
+ value.close
785
+ rescue
786
+ nil
787
+ end
788
+ end
789
+ value
790
+ rescue *ALLOWED_CONNECT_EXCEPTIONS
791
+ false
792
+ end
793
+ elsif @ping_command.is_a?(Array)
794
+ type, *args = @ping_command
795
+ if self.class.can_ping_unix_sockets?
796
+ case type
797
+ when :tcp
798
+ hostname, port = args
799
+ sockaddr = Socket.pack_sockaddr_in(port, hostname)
800
+ ping_tcp_socket(sockaddr)
801
+ when :unix
802
+ socket_domain = Socket::Constants::AF_LOCAL
803
+ sockaddr = Socket.pack_sockaddr_un(args[0])
804
+ ping_socket(socket_domain, sockaddr)
805
+ else
806
+ raise ArgumentError, "Unknown ping command type #{type.inspect}"
807
+ end
808
+ else
809
+ case type
810
+ when :tcp
811
+ hostname, port = args
812
+ ping_socket(hostname, port)
813
+ when :unix
814
+ raise "Pinging Unix domain sockets is not supported on this Ruby implementation"
815
+ else
816
+ raise ArgumentError, "Unknown ping command type #{type.inspect}"
817
+ end
818
+ end
819
+ else
820
+ system(@ping_command)
821
+ end
822
+ end
823
+
824
+ if !can_ping_unix_sockets?
825
+ require "java"
826
+
827
+ def ping_socket(host_name, port)
828
+ channel = java.nio.channels.SocketChannel.open
829
+ begin
830
+ address = java.net.InetSocketAddress.new(host_name, port)
831
+ channel.configure_blocking(false)
832
+ if channel.connect(address)
833
+ return true
834
+ end
835
+
836
+ deadline = Time.now.to_f + 0.1
837
+ while true
838
+ begin
839
+ if channel.finish_connect
840
+ return true
841
+ end
842
+ rescue java.net.ConnectException => e
843
+ if /Connection refused/i.match?(e.message)
844
+ return false
845
+ else
846
+ throw e
847
+ end
848
+ end
849
+
850
+ # Not done connecting and no error.
851
+ sleep 0.01
852
+ if Time.now.to_f >= deadline
853
+ return false
854
+ end
855
+ end
856
+ ensure
857
+ channel.close
858
+ end
859
+ end
860
+ else
861
+ def ping_socket(socket_domain, sockaddr)
862
+ socket = Socket.new(socket_domain, Socket::Constants::SOCK_STREAM, 0)
863
+ begin
864
+ socket.connect_nonblock(sockaddr)
865
+ rescue Errno::ENOENT, Errno::EINPROGRESS, Errno::EAGAIN, Errno::EWOULDBLOCK
866
+ if select(nil, [socket], nil, 0.1)
867
+ begin
868
+ socket.connect_nonblock(sockaddr)
869
+ rescue Errno::EISCONN
870
+ rescue Errno::EINVAL
871
+ if RUBY_PLATFORM.match?(/freebsd/i)
872
+ raise Errno::ECONNREFUSED
873
+ else
874
+ raise
875
+ end
876
+ end
877
+ else
878
+ raise Errno::ECONNREFUSED
879
+ end
880
+ end
881
+ true
882
+ rescue Errno::ECONNREFUSED, Errno::ENOENT
883
+ false
884
+ ensure
885
+ socket.close if socket
886
+ end
887
+
888
+ def ping_tcp_socket(sockaddr)
889
+ ping_socket(Socket::Constants::AF_INET, sockaddr)
890
+ rescue Errno::EAFNOSUPPORT
891
+ ping_socket(Socket::Constants::AF_INET6, sockaddr)
892
+ end
893
+ end
894
+
895
+ def ruby_interpreter
896
+ rb_config = if defined?(RbConfig)
897
+ RbConfig::CONFIG
898
+ else
899
+ Config::CONFIG
900
+ end
901
+ File.join(
902
+ rb_config["bindir"],
903
+ rb_config["RUBY_INSTALL_NAME"]
904
+ ) + rb_config["EXEEXT"]
905
+ end
906
+
907
+ # Thread#kill (which is called by timeout.rb) may
908
+ # not be able to interrupt Process.waitpid. So here we use a
909
+ # special version that's a bit less efficient but is at least
910
+ # interruptable.
911
+ def interruptable_waitpid(pid)
912
+ result = nil
913
+ until result
914
+ result = Process.waitpid(pid, Process::WNOHANG)
915
+ sleep 0.01 if !result
916
+ end
917
+ result
918
+ end
919
+
920
+ def signal_termination_message(process_status)
921
+ if process_status.signaled?
922
+ "terminated with signal #{signal_name_for(process_status.termsig)}"
923
+ else
924
+ "exited with status #{process_status.exitstatus}"
925
+ end
926
+ end
927
+
928
+ def signal_name_for(num)
929
+ if (name = Signal.list.find { |name, n| n == num }[0])
930
+ "SIG#{name}"
931
+ else
932
+ num.to_s
933
+ end
934
+ end
935
+
936
+ def concat_spawn_output_and_logs(output, logs, exit_status = nil, suffix_message = nil)
937
+ if output.nil? && logs.nil?
938
+ result_inner = [
939
+ "logs not available",
940
+ exit_status ? signal_termination_message(exit_status) : nil,
941
+ suffix_message
942
+ ].compact.join("; ")
943
+ "(#{result_inner})"
944
+ elsif (output && output.empty? && logs && logs.empty?) || (output && output.empty? && logs.nil?) || (output.nil? && logs && logs.empty?)
945
+ result_inner = [
946
+ "logs empty",
947
+ exit_status ? signal_termination_message(exit_status) : nil,
948
+ suffix_message
949
+ ].compact.join("; ")
950
+ "(#{result_inner})"
951
+ else
952
+ result = ((output || "") + "\n" + (logs || "")).strip
953
+ result_suffix = [
954
+ exit_status ? signal_termination_message(exit_status) : nil,
955
+ suffix_message
956
+ ].compact.join("; ")
957
+ if !result_suffix.empty?
958
+ result << "\n(#{result_suffix})"
959
+ end
960
+ result
961
+ end
962
+ end
873
963
  end