Coverage for src/bin/bind10/bind10_src : 68%
        
        
Hot-keys on this page
r m x p toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
| 
 #!/usr/bin/python3 
 # Copyright (C) 2010,2011 Internet Systems Consortium. # # Permission to use, copy, modify, and distribute this software for any # purpose with or without fee is hereby granted, provided that the above # copyright notice and this permission notice appear in all copies. # # THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SYSTEMS CONSORTIUM # DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL # INTERNET SYSTEMS CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, # INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING # FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, # NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION # WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. 
 This file implements the Boss of Bind (BoB, or bob) program. 
 Its purpose is to start up the BIND 10 system, and then manage the processes, by starting and stopping processes, plus restarting processes that exit. 
 To start the system, it first runs the c-channel program (msgq), then connects to that. It then runs the configuration manager, and reads its own configuration. Then it proceeds to starting other modules. 
 The Python subprocess module is used for starting processes, but because this is not efficient for managing groups of processes, SIGCHLD signals are caught and processed using the signal module. 
 Most of the logic is contained in the BoB class. However, since Python requires that signal processing happen in the main thread, we do signal handling outside of that class, in the code running for __main__. """ 
 
 # If B10_FROM_SOURCE is set in the environment, we use data files # from a directory relative to that, otherwise we use the ones # installed on the system SPECFILE_LOCATION = os.environ["B10_FROM_SOURCE"] + "/src/bin/bind10/bob.spec" else: 
 
 
 
 # Pending system-wide debug level definitions, the ones we # use here are hardcoded for now 
 # Messages sent over the unix domain socket to indicate if it is followed by a real socket 
 # RCodes of known exceptions for the get_token command 
 # Assign this process some longer name 
 # This is the version that gets displayed to the user. # The VERSION string consists of the module name, the module version # number, and the overall BIND 10 version number (set in configure.ac). 
 # This is for boot_time of Boss 
 
 """Information about a process""" 
 
 dev_null_stderr=False): 
 """Function used before running a program that needs to run as a different user.""" # First, put us into a separate process group so we don't get # SIGINT signals on Ctrl-C (the boss will shut everthing down by # other means). os.setpgrp() 
 else: spawn_stderr = self.dev_null else: # Environment variables for the child process will be a copy of those # of the boss process with any additional specific variables given # on construction (self.env). stdin=subprocess.PIPE, stdout=spawn_stdout, stderr=spawn_stderr, close_fds=True, env=spawn_env, preexec_fn=self._preexec_work) 
 # spawn() and respawn() are the same for now, but in the future they # may have different functionality 
 
 
 
 """Boss of BIND class.""" 
 config_filename=None, clear_config=False, nocache=False, verbose=False, nokill=False, setuid=None, username=None, cmdctl_port=None, wait_time=10): """ Initialize the Boss of BIND. This is a singleton (only one can run). 
 The msgq_socket_file specifies the UNIX domain socket file that the msgq process listens on. If verbose is True, then the boss reports what it is doing. 
 Data path and config filename are passed through to config manager (if provided) and specify the config file to be used. 
 The cmdctl_port is passed to cmdctl and specify on which port it should listen. 
 wait_time controls the amount of time (in seconds) that Boss waits for selected processes to initialize before continuing with the initialization. Currently this is only the configuration manager. """ # Some time in future, it may happen that a single component has # multple processes (like a pipeline-like component). If so happens, # name "components" may be inapropriate. But as the code isn't probably # completely ready for it, we leave it at components for now. We also # want to support multiple instances of a single component. If it turns # out that we'll have a single component with multiple same processes # or if we start multiple components with the same configuration (we do # this now, but it might change) is an open question. # Simply list of components that died and need to wait for a # restart. Components manage their own restart schedule now isc.bind10.special_component.get_specials()) # The priorities here make them start in the correct order. First # the socket creator (which would drop root privileges by then), # then message queue and after that the config manager (which uses # the config manager) 'sockcreator': { 'kind': 'core', 'special': 'sockcreator', 'priority': 200 }, 'msgq': { 'kind': 'core', 'special': 'msgq', 'priority': 199 }, 'cfgmgr': { 'kind': 'core', 'special': 'cfgmgr', 'priority': 198 } } 
 # If -v was set, enable full debug logging. logger.set_severity("DEBUG", 99) # This is set in init_socket_srv 
 # Fill in the core components, so they stay alive "bind10 boss, do not set it") # Update the configuration 
 # If this is initial update, don't do anything now, leave it to startup new_config) 
 
 "data": { 'boot_time': time.strftime('%Y-%m-%dT%H:%M:%SZ', _BASETIME) } } 
 else: # send statistics data to the stats daemon immediately True, stats_data["data"]) # Consume the answer, in case it becomes a orphan message. except isc.cc.session.SessionTimeout: pass else: logger.fatal(BIND10_INVALID_STATISTICS_DATA); answer = isc.config.ccsession.create_answer( 1, "specified statistics data is invalid") create_answer(0, self.get_processes()) create_answer(1, "Missing token parameter") else: else: "Unknown command") 
 """ Called as part of the exception handling when a process fails to start, this runs through the list of started processes, killing each one. It then clears that list. """ logger.info(BIND10_KILLING_ALL_PROCESSES) 
 for pid in self.components: logger.info(BIND10_KILL_PROCESS, self.components[pid].name()) self.components[pid].kill(True) self.components = {} 
 """ Reads the parameters associated with the BoB module itself. 
 This means the list of components we should start now. 
 This could easily be combined into start_all_processes, but it stays because of historical reasons and because the tests replace the method sometimes. """ 
 
 """ A convenience function to output a "Starting xxx" message if the logging is set to DEBUG with debuglevel DBG_PROCESS or higher. Putting this into a separate method ensures that the output form is consistent across all processes. 
 The process name (passed as the first argument) is put into self.curproc, and is used to indicate which process failed to start if there is an error (and is used in the "Started" message on success). The optional port and address information are appended to the message (if present). """ self.curproc = process if port is None and address is None: logger.info(BIND10_STARTING_PROCESS, self.curproc) elif address is None: logger.info(BIND10_STARTING_PROCESS_PORT, self.curproc, port) else: logger.info(BIND10_STARTING_PROCESS_PORT_ADDRESS, self.curproc, address, port) 
 """ A convenience function to output a 'Started xxxx (PID yyyy)' message. As with starting_message(), this ensures a consistent format. """ if pid is None: logger.debug(DBG_PROCESS, BIND10_STARTED_PROCESS, self.curproc) else: logger.debug(DBG_PROCESS, BIND10_STARTED_PROCESS_PID, self.curproc, pid) 
 """ Some processes return a message to the Boss after they have started to indicate that they are running. The form of the message is a dictionary with contents {"running:", "<process>"}. This method checks the passed message and returns True if the "who" process is contained in the message (so is presumably running). It returns False for all other conditions and will log an error if appropriate. """ if msg is not None: try: if msg["running"] == who: return True else: logger.error(BIND10_STARTUP_UNEXPECTED_MESSAGE, msg) except: logger.error(BIND10_STARTUP_UNRECOGNISED_MESSAGE, msg) 
 return False 
 # The next few methods start the individual processes of BIND-10. They # are called via start_all_processes(). If any fail, an exception is # raised which is caught by the caller of start_all_processes(); this kills # processes started up to that point before terminating the program. 
 """ Start the message queue and connect to the command channel. """ self.log_starting("b10-msgq") msgq_proc = ProcessInfo("b10-msgq", ["b10-msgq"], self.c_channel_env, True, not self.verbose) msgq_proc.spawn() self.log_started(msgq_proc.pid) 
 # Now connect to the c-channel cc_connect_start = time.time() while self.cc_session is None: # if we have been trying for "a while" give up if (time.time() - cc_connect_start) > 5: raise CChannelConnectError("Unable to connect to c-channel after 5 seconds") 
 # try to connect, and if we can't wait a short while try: self.cc_session = isc.cc.Session(self.msgq_socket_file) except isc.cc.session.SessionError: time.sleep(0.1) 
 # Subscribe to the message queue. The only messages we expect to receive # on this channel are once relating to process startup. self.cc_session.group_subscribe("Boss") 
 return msgq_proc 
 """ Starts the configuration manager process """ self.log_starting("b10-cfgmgr") args = ["b10-cfgmgr"] if self.data_path is not None: args.append("--data-path=" + self.data_path) if self.config_filename is not None: args.append("--config-filename=" + self.config_filename) if self.clear_config: args.append("--clear-config") bind_cfgd = ProcessInfo("b10-cfgmgr", args, self.c_channel_env) bind_cfgd.spawn() self.log_started(bind_cfgd.pid) 
 # Wait for the configuration manager to start up as subsequent initialization # cannot proceed without it. The time to wait can be set on the command line. time_remaining = self.wait_time msg, env = self.cc_session.group_recvmsg() while time_remaining > 0 and not self.process_running(msg, "ConfigManager"): logger.debug(DBG_PROCESS, BIND10_WAIT_CFGMGR) time.sleep(1) time_remaining = time_remaining - 1 msg, env = self.cc_session.group_recvmsg() 
 if not self.process_running(msg, "ConfigManager"): raise ProcessStartError("Configuration manager process has not started") 
 return bind_cfgd 
 """ Start the CC Session 
 The argument c_channel_env is unused but is supplied to keep the argument list the same for all start_xxx methods. 
 With regards to logging, note that as the CC session is not a process, the log_starting/log_started methods are not used. """ logger.info(BIND10_STARTING_CC) self.ccs = isc.config.ModuleCCSession(SPECFILE_LOCATION, self.config_handler, self.command_handler, socket_file = self.msgq_socket_file) self.ccs.start() logger.debug(DBG_PROCESS, BIND10_STARTED_CC) 
 # A couple of utility methods for starting processes... 
 """ Given a set of command arguments, start the process and output appropriate log messages. If the start is successful, the process is added to the list of started processes. 
 The port and address arguments are for log messages only. """ self.log_starting(name, port, address) newproc = ProcessInfo(name, args, c_channel_env) newproc.spawn() self.log_started(newproc.pid) return newproc 
 """ Put another process into boss to watch over it. When the process dies, the component.failed() is called with the exit code. 
 It is expected the info is a isc.bind10.component.BaseComponent subclass (or anything having the same interface). """ 
 """ Most of the BIND-10 processes are started with the command: 
 <process-name> [-v] 
 ... where -v is appended if verbose is enabled. This method generates the arguments from the name and starts the process. 
 The port and address arguments are for log messages only. """ # Set up the command arguments. args = [name] if self.verbose: args += ['-v'] 
 # ... and start the process return self.start_process(name, args, self.c_channel_env) 
 # The next few methods start up the rest of the BIND-10 processes. # Although many of these methods are little more than a call to # start_simple, they are retained (a) for testing reasons and (b) as a place # where modifications can be made if the process start-up sequence changes # for a given process. 
 """ Start the Authoritative server """ if self.uid is not None and self.__started: logger.warn(BIND10_START_AS_NON_ROOT_AUTH) authargs = ['b10-auth'] if self.nocache: authargs += ['-n'] if self.verbose: authargs += ['-v'] 
 # ... and start return self.start_process("b10-auth", authargs, self.c_channel_env) 
 """ Start the Resolver. At present, all these arguments and switches are pure speculation. As with the auth daemon, they should be read from the configuration database. """ if self.uid is not None and self.__started: logger.warn(BIND10_START_AS_NON_ROOT_RESOLVER) self.curproc = "b10-resolver" # XXX: this must be read from the configuration manager in the future resargs = ['b10-resolver'] if self.verbose: resargs += ['-v'] 
 # ... and start return self.start_process("b10-resolver", resargs, self.c_channel_env) 
 """ Starts the command control process """ args = ["b10-cmdctl"] if self.cmdctl_port is not None: args.append("--port=" + str(self.cmdctl_port)) if self.verbose: args.append("-v") return self.start_process("b10-cmdctl", args, self.c_channel_env, self.cmdctl_port) 
 """ Starts up all the components. Any exception generated during the starting of the components is handled by the caller. """ # Start the real core (sockcreator, msgq, cfgmgr) 
 # Connect to the msgq. This is not a process, so it's not handled # inside the configurator. 
 # Extract the parameters associated with Bob. This can only be # done after the CC Session is started. Note that the logging # configuration may override the "-v" switch set on the command line. 
 # TODO: Return the dropping of privileges 
 """ Start the BoB instance. 
 Returns None if successful, otherwise an string describing the problem. """ # Try to connect to the c-channel daemon, to see if it is already # running c_channel_env = {} if self.msgq_socket_file is not None: c_channel_env["BIND10_MSGQ_SOCKET_FILE"] = self.msgq_socket_file logger.debug(DBG_PROCESS, BIND10_CHECK_MSGQ_ALREADY_RUNNING) # try to connect, and if we can't wait a short while try: self.cc_session = isc.cc.Session(self.msgq_socket_file) logger.fatal(BIND10_MSGQ_ALREADY_RUNNING) return "b10-msgq already running, or socket file not cleaned , cannot start" except isc.cc.session.SessionError: # this is the case we want, where the msgq is not running pass 
 # Start all components. If any one fails to start, kill all started # components and exit with an error indication. try: self.c_channel_env = c_channel_env self.start_all_components() except Exception as e: self.kill_started_components() return "Unable to start " + self.curproc + ": " + str(e) 
 # Started successfully self.runnable = True self.__started = True return None 
 """ Stop the given process, friendly-like. The process is the name it has (in logs, etc), the recipient is the address on msgq. The pid is the pid of the process (if we have multiple processes of the same name, it might want to choose if it is for this one). """ create_command('shutdown', {'pid': pid}), recipient, recipient) 
 """ Stop the Boss instance from a components' request. The exitcode indicates the desired exit code. 
 If we did not start yet, it raises an exception, which is meant to propagate through the component and configurator to the startup routine and abort the startup immediately. If it is started up already, we just mark it so we terminate soon. 
 It does set the exit code in both cases. """ else: 
 """Stop the BoB instance.""" # If ccsession is still there, inform rest of the system this module # is stopping. Since everything will be stopped shortly, this is not # really necessary, but this is done to reflect that boss is also # 'just' a module. 
 # try using the BIND 10 request to stop except: pass # XXX: some delay probably useful... how much is uncertain # I have changed the delay from 0.5 to 1, but sometime it's # still not enough. 
 # Send TERM and KILL signals to modules if we're not prevented # from doing so # next try sending a SIGTERM except OSError: # ignore these (usually ESRCH because the child # finally exited) pass # finally, send SIGKILL (unmaskable termination) until everybody dies # XXX: some delay probably useful... how much is uncertain component.pid()) except OSError: # ignore these (usually ESRCH because the child # finally exited) pass 
 
 """Check to see if any of our child processes have exited, and note this for later handling. """ # XXX: should be impossible to get any other error here raise if pid == 0: break if pid in self.components: # One of the components we know about. Get information on it. component = self.components.pop(pid) logger.info(BIND10_PROCESS_ENDED, component.name(), pid, exit_status) if component.running() and self.runnable: # Tell it it failed. But only if it matters (we are # not shutting down and the component considers itself # to be running. component_restarted = component.failed(exit_status); # if the process wants to be restarted, but not just yet, # it returns False if not component_restarted: self.components_to_restart.append(component) else: logger.info(BIND10_UNKNOWN_CHILD_PROCESS_ENDED, pid) 
 """ Restart any dead processes: 
 * Returns the time when the next process is ready to be restarted. * If the server is shutting down, returns 0. * If there are no processes, returns None. 
 The values returned can be safely passed into select() as the timeout value. 
 """ return 0 # keep track of the first time we need to check this queue again, # if at all if not component.restart(now): still_dead.append(component) if next_restart_time is None or\ next_restart_time > component.get_restart_time(): next_restart_time = component.get_restart_time() 
 
 """ Implementation of the get_socket CC command. It asks the cache to provide the token and sends the information back. """ " or NO") isc.config.ccsession.create_answer(1, "Missing parameter " + str(ke)) 
 # FIXME: This call contains blocking IPC. It is expected to be # short, but if it turns out to be problem, we'll need to do # something about it. share_mode, share_name) 'token': token, 'path': self._socket_path }) str(e)) str(e)) 
 """ This function handles a token that comes over a unix_domain socket. The function looks into the _socket_cache and sends the socket identified by the token back over the unix_socket. """ # FIXME: These two calls are blocking in their nature. An OS-level # buffer is likely to be large enough to hold all these data, but # if it wasn't and the remote application got stuck, we would have # a problem. If there appear such problems, we should do something # about it. 
 """ This function handles when a unix_socket closes. This means all sockets sent to it are to be considered closed. This function signals so to the _socket_cache. """ # This means the application holds no sockets. It's harmless, as it # can happen in real life - for example, it requests a socket, but # get_socket doesn't find it, so the application dies. It should be # rare, though. 
 """ Registeres a socket creator into the boss. The socket creator is not used directly, but through a cache. The cache is created in this method. 
 If called more than once, it raises a ValueError. """ 
 """ Creates and listens on a unix-domain socket to be able to send out the sockets. 
 This method should be called after switching user, or the switched applications won't be able to access the socket. """ self._srv_socket = socket.socket(socket.AF_UNIX) # We create a temporary directory somewhere safe and unique, to avoid # the need to find the place ourself or bother users. Also, this # secures the socket on some platforms, as it creates a private # directory. self._tmpdir = tempfile.mkdtemp(prefix='sockcreator-') # Get the name self._socket_path = os.path.join(self._tmpdir, "sockcreator") # And bind the socket to the name self._srv_socket.bind(self._socket_path) self._srv_socket.listen(5) 
 """ Closes and removes the listening socket and the directory where it lives, as we created both. 
 It does nothing if the _srv_socket is not set (eg. it was not yet initialized). """ if self._srv_socket is not None: self._srv_socket.close() os.remove(self._socket_path) os.rmdir(self._tmpdir) 
 """ Accept a socket from the unix domain socket server and put it to the others we care about. """ 
 """ This is called when a socket identified by the socket_fileno needs attention. We try to read data from there. If it is closed, we remove it. """ # These two might be different on some systems # No more data now. Oh, well, just store what we have. else: else: # Handle this token and clear it else: 
 """ The main loop, waiting for sockets, commands and dead processes. Runs as long as the runnable is true. 
 The wakeup_fd descriptor is the read end of pipe where CHLD signal handler writes. """ # clean up any processes that exited else: wait_time = max(next_restart - time.time(), 0) 
 # select() can raise EINTR when a signal arrives, # even if they are resumable, so we have to catch # the exception select.select([wakeup_fd, ccs_fd, self._srv_socket.fileno()] + list(self._unix_sockets.keys()), [], [], wait_time) except select.error as err: if err.args[0] == errno.EINTR: (rlist, wlist, xlist) = ([], [], []) else: logger.fatal(BIND10_SELECT_ERROR, err) break 
 try: self.ccs.check_command() except isc.cc.session.ProtocolError: logger.fatal(BIND10_MSGQ_DISAPPEARED) self.runnable = False break os.read(wakeup_fd, 32) 
 # global variables, needed for signal handlers 
 """A child process has died (SIGCHLD received).""" # don't do anything... # the Python signal handler has been set up to write # down a pipe, waking up our select() bit pass 
 """Return the symbolic name for a signal.""" for sig in dir(signal): if sig.startswith("SIG") and sig[3].isalnum(): if getattr(signal, sig) == signal_number: return sig return "Unknown signal %d" % signal_number 
 # XXX: perhaps register atexit() function and invoke that instead """We need to exit (SIGINT or SIGTERM received).""" global options global boss_of_bind logger.info(BIND10_RECEIVED_SIGNAL, get_signame(signal_number)) signal.signal(signal.SIGCHLD, signal.SIG_DFL) boss_of_bind.runnable = False 
 """Function that renames the process if it is requested by a option.""" isc.util.process.rename(value) 
 """ Function for parsing command line arguments. Returns the options object from OptionParser. """ type="string", default=None, help="UNIX domain socket file the b10-msgq daemon will use") default=False, help="disable hot-spot cache in authoritative DNS server") default=False, help="do not send SIGTERM and SIGKILL signals to modules during shutdown") help="Change user after startup (must run as root)") help="display more about what is going on") callback=process_rename, help="Set the process name (displayed in ps, top, ...)") dest="config_file", default=None, help="Configuration database filename") dest="clear_config", default=False, help="Create backup of the configuration file and " + "start with a clean configuration") help="Directory to search for configuration files", default=None) default=None, help="Port of command control") default=None, help="file to dump the PID of the BIND 10 process") default=10, help="Time (in seconds) to wait for config manager to start up") 
 
 
 parser.print_help() sys.exit(1) 
 
 """ Dump the PID of the current process to the specified file. If the given file is None this function does nothing. If the file already exists, the existing content will be removed. If a system error happens in creating or writing to the file, the corresponding exception will be propagated to the caller. """ 
 """ Remove the given file, which is basically expected to be the PID file created by dump_pid(). The specified may or may not exist; if it doesn't this function does nothing. Other system level errors in removing the file will be propagated as the corresponding exception. """ raise 
 
 global options global boss_of_bind # Enforce line buffering on stdout, even when not a TTY sys.stdout = io.TextIOWrapper(sys.stdout.detach(), line_buffering=True) 
 options = parse_args() 
 # Check user ID. setuid = None username = None if options.user: # Try getting information about the user, assuming UID passed. try: pw_ent = pwd.getpwuid(int(options.user)) setuid = pw_ent.pw_uid username = pw_ent.pw_name except ValueError: pass except KeyError: pass 
 # Next try getting information about the user, assuming user name # passed. # If the information is both a valid user name and user number, we # prefer the name because we try it second. A minor point, hopefully. try: pw_ent = pwd.getpwnam(options.user) setuid = pw_ent.pw_uid username = pw_ent.pw_name except KeyError: pass 
 if setuid is None: logger.fatal(BIND10_INVALID_USER, options.user) sys.exit(1) 
 # Announce startup. logger.info(BIND10_STARTING, VERSION) 
 # Create wakeup pipe for signal handlers wakeup_pipe = os.pipe() signal.set_wakeup_fd(wakeup_pipe[1]) 
 # Set signal handlers for catching child termination, as well # as our own demise. signal.signal(signal.SIGCHLD, reaper) signal.siginterrupt(signal.SIGCHLD, False) signal.signal(signal.SIGINT, fatal_signal) signal.signal(signal.SIGTERM, fatal_signal) 
 # Block SIGPIPE, as we don't want it to end this process signal.signal(signal.SIGPIPE, signal.SIG_IGN) 
 try: # Go bob! boss_of_bind = BoB(options.msgq_socket_file, options.data_path, options.config_file, options.clear_config, options.nocache, options.verbose, options.nokill, setuid, username, options.cmdctl_port, options.wait_time) startup_result = boss_of_bind.startup() if startup_result: logger.fatal(BIND10_STARTUP_ERROR, startup_result) sys.exit(1) boss_of_bind.init_socket_srv() logger.info(BIND10_STARTUP_COMPLETE) dump_pid(options.pid_file) 
 # Let it run boss_of_bind.run(wakeup_pipe[0]) 
 # shutdown signal.signal(signal.SIGCHLD, signal.SIG_DFL) boss_of_bind.shutdown() finally: # Clean up the filesystem unlink_pid_file(options.pid_file) if boss_of_bind is not None: boss_of_bind.remove_socket_srv() sys.exit(boss_of_bind.exitcode) 
 main()  |