/usr/lib/ruby/vendor_ruby/chef/expander/cluster_supervisor.rb is in chef-expander 10.12.0-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
#
# Author:: Daniel DeLeo (<dan@opscode.com>)
# Author:: Seth Falcon (<seth@opscode.com>)
# Author:: Chris Walters (<cw@opscode.com>)
# Copyright:: Copyright (c) 2010-2011 Opscode, Inc.
# License:: Apache License, Version 2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
require 'chef/expander/loggable'
require 'chef/expander/daemonizable'
require 'chef/expander/version'
require 'chef/expander/configuration'
require 'chef/expander/vnode_supervisor'
module Chef
  module Expander
    #==ClusterSupervisor
    # Manages a cluster of chef-expander processes. Usually this class will
    # be instantiated from the chef-expander-cluster executable.
    #
    # ClusterSupervisor works by forking the desired number of processes, then
    # running VNodeSupervisor.start_cluster_worker within the forked process.
    # ClusterSupervisor keeps track of the process ids of its children, and will
    # periodically attempt to reap them in a non-blocking call. If they are
    # reaped, ClusterSupervisor knows they died and need to be respawned.
    # Once a stop has been requested, dead workers are no longer respawned;
    # every tracked worker is sent the stop signal and waited for instead.
    #
    # The child processes are responsible for checking on the master process and
    # dying if the master has died (VNodeSupervisor does this when started
    # with start_cluster_worker).
    #
    #===TODO:
    # * This implementation currently assumes there is only one cluster, so it
    #   will claim all of the vnodes. It may be advantageous to allow multiple
    #   clusters.
    # * There is no heartbeat implementation at this time, so a zombified child
    #   process will not be automatically killed--This behavior is left to the
    #   meatcloud for now.
    class ClusterSupervisor
      include Loggable
      include Daemonizable

      # Creates a supervisor with no workers yet.
      #
      # State kept on the instance:
      # * @workers - Hash of child pid => worker params (currently
      #   {:index => n}), filled in by #start_worker.
      # * @running - true until #stop is called; controls the monitor loop.
      # * @kill    - signal forwarded to the workers on shutdown; defaults to
      #   :TERM and is overwritten by #stop.
      def initialize
        @workers = {}
        @running = true
        @kill = :TERM
      end

      # Entry point: installs INT/TERM handlers, loads the configuration from
      # ARGV, forks the workers and then blocks in #maintain_workers until a
      # stop is requested.
      #
      # configure_process and release_locks are not defined in this class;
      # presumably they come from Daemonizable -- verify there.
      #
      # Exits with status 2 on an invalid configuration and with status 1 on
      # any other exception (after logging it). SystemExit is re-raised
      # untouched so that a deliberate exit keeps its own status.
      def start
        trap(:INT) { stop(:INT) }
        trap(:TERM) { stop(:TERM) }

        Expander.init_config(ARGV)

        log.info("Chef Expander #{Expander.version} starting cluster with #{Expander.config.node_count} nodes")
        configure_process
        start_workers
        maintain_workers
        release_locks
      rescue Configuration::InvalidConfiguration => e
        log.fatal { "Configuration Error: " + e.message }
        exit(2)
      rescue Exception => e
        raise if SystemExit === e

        log.fatal { e }
        exit(1)
      end

      # Forks one worker per configured node. Worker indexes are 1-based.
      def start_workers
        Expander.config.node_count.times do |i|
          start_worker(i + 1)
        end
      end

      # Forks a single worker and records it in @workers.
      #
      # In the child, the worker's index is stored in the configuration and
      # control is handed to VNodeSupervisor.start_cluster_worker. In the
      # parent, the child's pid is mapped to its params so the worker can be
      # respawned with the same index later.
      #
      # index:: 1-based position of the worker within the cluster.
      def start_worker(index)
        log.info { "Starting cluster worker #{index}" }
        worker_params = {:index => index}
        child_pid = fork do
          Expander.config.index = index
          VNodeSupervisor.start_cluster_worker
        end
        @workers[child_pid] = worker_params
      end

      # Requests a shutdown of the cluster. Called from the signal handlers
      # installed by #start.
      #
      # signal:: the signal that will be forwarded to every worker when
      #          #maintain_workers leaves its monitor loop.
      def stop(signal)
        log.info { "Stopping cluster on signal (#{signal})" }
        @running = false
        @kill = signal
      end

      # Monitor loop. Once per second, reaps workers that have exited and
      # starts replacements. When a stop has been requested, leaves the loop,
      # forwards the stop signal to every tracked worker and waits for each
      # of them to exit.
      def maintain_workers
        while @running
          sleep 1
          # A stop request may have arrived while we were sleeping. Workers
          # that exited in the meantime (for example because the same signal
          # was delivered to them as well) must not be reported as dead and
          # respawned just to be stopped again a moment later; they stay in
          # @workers and are reaped by stop_workers.
          break unless @running

          replace_dead_workers
        end
        stop_workers
      end

      private

      # Reaps (without blocking) every worker that has exited, logs it, and
      # starts a replacement with the same index.
      def replace_dead_workers
        # Collect first, replace afterwards: @workers must not be modified
        # while it is being iterated.
        dead_workers = {}
        @workers.each do |pid, params|
          # With WNOHANG, waitpid2 returns nil while the child is still alive.
          reaped = Process.waitpid2(pid, Process::WNOHANG)
          next unless reaped

          log.error { "worker #{params[:index]} (PID: #{pid}) died with status #{reaped[1].exitstatus || '(no status)'}" }
          dead_workers[pid] = params
        end

        dead_workers.each do |pid, params|
          # Always forget a reaped pid so that it is never signalled or
          # waited on again, but only respawn while the cluster is still
          # supposed to be running.
          @workers.delete(pid)
          start_worker(params[:index]) if @running
        end
      end

      # Sends the recorded stop signal to every tracked worker, then blocks
      # until each of them has exited.
      def stop_workers
        @workers.each do |pid, params|
          log.info { "Stopping worker #{params[:index]} (PID: #{pid})" }
          Process.kill(@kill, pid)
        end
        @workers.each_key do |pid|
          Process.waitpid2(pid)
        end
      end
    end
  end
end
|