mirror of
https://github.com/openvswitch/ovs
synced 2025-10-21 14:49:41 +00:00
450 lines
15 KiB
Python
450 lines
15 KiB
Python
# Copyright (c) 2010, 2011 Nicira Networks
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at:
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
import errno
|
|
import fcntl
|
|
import logging
|
|
import os
|
|
import resource
|
|
import signal
|
|
import sys
|
|
import time
|
|
|
|
import ovs.dirs
|
|
import ovs.fatal_signal
|
|
#import ovs.lockfile
|
|
import ovs.process
|
|
import ovs.socket_util
|
|
import ovs.timeval
|
|
import ovs.util
|
|
|
|
# --detach: whether daemonizing should put the process in the background.
_detach = False

# --pidfile: name of the pidfile to create, or None when none is configured.
_pidfile = None

# Device and inode numbers of the pidfile this process created, if any.
_pidfile_dev = _pidfile_ino = None

# --overwrite-pidfile: create the pidfile even if one already exists and is
# locked?
_overwrite_pidfile = False

# --no-chdir: cleared when the process should not chdir to "/".
_chdir = True

# --monitor: whether a supervisory process should watch the daemon and
# restart it if it dies due to an error signal.
_monitor = False

# File descriptor shared between daemonize_start() and daemonize_complete().
_daemonize_fd = None

# Exit status that _should_restart() treats as a request for a restart.
RESTART_EXIT_CODE = 5
|
|
|
|
def make_pidfile_name(name):
    """Returns the pidfile name that set_pidfile() would record for 'name'.

    When 'name' is None or the empty string the result is
    "<ovs.dirs.RUNDIR>/<ovs.util.PROGRAM_NAME>.pid".  Any other 'name' is
    handed to ovs.util.abs_file_name() together with ovs.dirs.RUNDIR."""
    if name is not None and name != "":
        return ovs.util.abs_file_name(ovs.dirs.RUNDIR, name)
    return "%s/%s.pid" % (ovs.dirs.RUNDIR, ovs.util.PROGRAM_NAME)
|
|
|
|
def set_pidfile(name):
    """Records the pidfile that a later call to daemonize() should create.

    'name' is translated by make_pidfile_name(): None or "" selects the
    default "<PROGRAM_NAME>.pid" inside ovs.dirs.RUNDIR, and any other value
    is resolved against ovs.dirs.RUNDIR."""
    global _pidfile
    resolved = make_pidfile_name(name)
    _pidfile = resolved
|
|
|
|
def get_pidfile():
    """Returns the pidfile name recorded by set_pidfile(), or None if no
    pidfile has been configured."""
    configured = _pidfile
    return configured
|
|
|
|
def set_no_chdir():
    """Turns off the chdir to "/" that daemonizing otherwise performs."""
    global _chdir
    _chdir = False
|
|
|
|
def is_chdir_enabled():
    """Reports whether daemonizing will still chdir to "/"."""
    enabled = _chdir
    return enabled
|
|
|
|
def ignore_existing_pidfile():
    """Downgrades die_if_already_running() from fatal to advisory: after this
    call, finding a locked pidfile only produces a logged warning instead of
    terminating the program."""
    global _overwrite_pidfile
    _overwrite_pidfile = True
|
|
|
|
def set_detach():
    """Requests that a later call to daemonize() detach from the foreground
    session and run this process in the background."""
    global _detach
    _detach = True
|
|
|
|
def get_detach():
    """Reports whether set_detach() has been called, i.e. whether
    daemonize() will really detach."""
    detaching = _detach
    return detaching
|
|
|
|
def set_monitor():
    """Requests that a later call to daemonize() fork a supervisory process
    which monitors the daemon and restarts it if it dies due to an error
    signal."""
    global _monitor
    _monitor = True
|
|
|
|
def die_if_already_running():
    """Checks the configured pidfile for a live, locked instance.

    Does nothing when no pidfile is configured or when
    read_pidfile_if_exists() does not report a positive pid.  Otherwise:

      - if ignore_existing_pidfile() has been called, logs a warning and
        returns;

      - if not, logs an error, writes the message to stderr, and terminates
        the program with exit status 1."""
    if _pidfile is None:
        return

    pid = read_pidfile_if_exists(_pidfile)
    if pid <= 0:
        # 0 means "no pidfile"; negative values are errno codes.  Neither
        # one indicates a running instance.
        return

    if _overwrite_pidfile:
        # logging.warning() rather than its deprecated alias logging.warn().
        logging.warning("%s: %s already running"
                        % (_pidfile, ovs.util.PROGRAM_NAME))
        return

    msg = "%s: already running as pid %d" % (_pidfile, pid)
    logging.error("%s, aborting" % msg)
    sys.stderr.write("%s\n" % msg)
    sys.exit(1)
|
|
|
|
def _make_pidfile():
    """If a pidfile has been configured, creates it and stores the running
    process's pid in it.  The pidfile is registered with ovs.fatal_signal so
    that it is unlinked when the process exits.

    The pidfile is written and locked under a temporary name and then renamed
    into place, so that observers never see an empty or unlocked pidfile.

    On any failure an error is logged and the function returns without a
    pidfile.  On success the pidfile's device and inode numbers are recorded
    in _pidfile_dev and _pidfile_ino."""
    # 'file' is global to keep Python from garbage-collecting and therefore
    # closing our file after this function exits.  That would unlock the lock
    # for us, and we don't want that.
    #
    # _pidfile_dev and _pidfile_ino must be declared global too; otherwise
    # the assignments at the end would only create locals and
    # __read_pidfile() could never recognize our own pidfile.
    global file, _pidfile_dev, _pidfile_ino

    if _pidfile is None:
        return

    pid = os.getpid()
    tmpfile = "%s.tmp%d" % (_pidfile, pid)
    ovs.fatal_signal.add_file_to_unlink(tmpfile)

    try:
        file = open(tmpfile, "w")
    except IOError as e:
        logging.error("%s: create failed: %s"
                      % (tmpfile, os.strerror(e.errno)))
        return

    try:
        fcntl.lockf(file, fcntl.LOCK_EX | fcntl.LOCK_NB)
    except IOError as e:
        logging.error("%s: fcntl failed: %s"
                      % (tmpfile, os.strerror(e.errno)))
        file.close()
        return

    try:
        file.write("%s\n" % pid)
        file.flush()
        ovs.fatal_signal.add_file_to_unlink(_pidfile)
    except (IOError, OSError) as e:
        # File writes raise IOError on Python 2, which is not a subclass of
        # OSError there, so both have to be listed.
        logging.error("%s: write failed: %s"
                      % (tmpfile, os.strerror(e.errno)))
        file.close()
        return

    try:
        os.rename(tmpfile, _pidfile)
    except OSError as e:
        ovs.fatal_signal.remove_file_to_unlink(_pidfile)
        logging.error("failed to rename \"%s\" to \"%s\": %s"
                      % (tmpfile, _pidfile, os.strerror(e.errno)))
        file.close()
        return

    s = os.fstat(file.fileno())
    _pidfile_dev = s.st_dev
    _pidfile_ino = s.st_ino
|
|
|
|
def daemonize():
    """Performs the whole daemonization sequence in one step by calling
    daemonize_start() and then daemonize_complete().  Depending on what
    set_pidfile() and set_detach() configured, this creates the pid file and
    detaches from the foreground session."""
    daemonize_start()
    daemonize_complete()
|
|
|
|
def _waitpid(pid, options):
    """Calls os.waitpid(pid, options), retrying when the call is interrupted
    by a signal (EINTR).

    Returns the (pid, status) pair from os.waitpid() on success.  On any
    other OSError, returns (-errno, 0) instead of raising."""
    while True:
        try:
            return os.waitpid(pid, options)
        except OSError as e:
            if e.errno == errno.EINTR:
                # Interrupted before any child changed state: wait again
                # rather than reporting EINTR to the caller as a failure.
                continue
            return -e.errno, 0
|
|
|
|
def _fork_and_wait_for_startup():
    """Forks and, in the parent, waits for the child to signal that it has
    started up.

    A pipe connects the two processes.  The parent blocks reading one byte
    from it.  The child stores the write end in _daemonize_fd, which
    daemonize_complete() later passes to _fork_notify_startup().

    Returns the child's pid in the parent and 0 in the child.

    Exits with status 1 if pipe() or fork() fails.  If the child never
    delivers the startup byte, the parent exits as well: with the child's
    exit status when the child exited with a nonzero status, and with
    status 1 otherwise."""
    global _daemonize_fd

    try:
        rfd, wfd = os.pipe()
    except OSError as e:
        sys.stderr.write("pipe failed: %s\n" % os.strerror(e.errno))
        sys.exit(1)

    try:
        pid = os.fork()
    except OSError as e:
        sys.stderr.write("could not fork: %s\n" % os.strerror(e.errno))
        sys.exit(1)

    if pid > 0:
        # Running in parent process.
        os.close(wfd)
        ovs.fatal_signal.fork()
        try:
            s = os.read(rfd, 1)
        except OSError:
            # Treated the same as the child closing the pipe without
            # writing anything.
            s = ""
        if len(s) != 1:
            retval, status = _waitpid(pid, 0)
            if (retval == pid and
                    os.WIFEXITED(status) and os.WEXITSTATUS(status)):
                # Child exited with an error.  Convey the same error to
                # our parent process as a courtesy.
                sys.exit(os.WEXITSTATUS(status))
            else:
                sys.stderr.write("fork child failed to signal startup\n")
                sys.exit(1)

        os.close(rfd)
    else:
        # Running in child process.
        os.close(rfd)
        ovs.timeval.postfork()
        #ovs.lockfile.postfork()

        _daemonize_fd = wfd
    return pid
|
|
|
|
def _fork_notify_startup(fd):
    """Signals successful startup over the pipe write end 'fd' and closes it.

    Does nothing when 'fd' is None.  Otherwise writes the single character
    "0" with ovs.socket_util.write_fully().  If that reports an error, a
    message goes to stderr and the process exits with status 1."""
    if fd is None:
        return

    error, _nbytes = ovs.socket_util.write_fully(fd, "0")
    if error:
        sys.stderr.write("could not write to pipe\n")
        sys.exit(1)
    os.close(fd)
|
|
|
|
def _should_restart(status):
    """Decides from the wait status 'status' whether a dead daemon should be
    restarted.

    Returns True if the process exited with RESTART_EXIT_CODE, or if it was
    killed by one of the error signals listed below (only those that the
    signal module defines on this platform are considered).  Returns False
    otherwise."""
    if os.WIFEXITED(status) and os.WEXITSTATUS(status) == RESTART_EXIT_CODE:
        return True

    if not os.WIFSIGNALED(status):
        return False

    error_signals = ("SIGABRT", "SIGALRM", "SIGBUS", "SIGFPE", "SIGILL",
                     "SIGPIPE", "SIGSEGV", "SIGXCPU", "SIGXFSZ")
    for signame in error_signals:
        if not hasattr(signal, signame):
            continue
        if os.WTERMSIG(status) == getattr(signal, signame):
            return True
    return False
|
|
|
|
def _monitor_daemon(daemon_pid):
    """Runs the monitor loop for the daemon process 'daemon_pid'.

    Waits for the daemon to die.  If _should_restart() approves of the wait
    status, a replacement is forked with _fork_and_wait_for_startup(), at
    most once every 10 seconds, and monitoring continues with the new pid.
    Otherwise the monitor exits with status 0.  A failing waitpid makes the
    monitor exit with status 1.

    This function returns only in a newly forked replacement daemon process;
    in the monitor process it never returns."""
    # XXX should log daemon's stderr output at startup time
    # XXX should use setproctitle module if available

    # Minimum spacing between two restarts, in milliseconds.
    min_restart_interval = 10000

    last_restart = None
    while True:
        retval, status = _waitpid(daemon_pid, 0)
        if retval < 0:
            sys.stderr.write("waitpid failed\n")
            sys.exit(1)
        elif retval == daemon_pid:
            status_msg = ("pid %d died, %s"
                          % (daemon_pid, ovs.process.status_msg(status)))

            if not _should_restart(status):
                logging.info("%s, exiting" % status_msg)
                sys.exit(0)

            if os.WCOREDUMP(status):
                # Disable further core dumps to save disk space.
                try:
                    resource.setrlimit(resource.RLIMIT_CORE, (0, 0))
                except resource.error:
                    logging.warning("failed to disable core dumps")

            # Throttle restarts to no more than once every 10 seconds.
            if (last_restart is not None and
                    ovs.timeval.msec() < last_restart + min_restart_interval):
                logging.warning("%s, waiting until 10 seconds since last "
                                "restart" % status_msg)
                wakeup = last_restart + min_restart_interval
                while True:
                    now = ovs.timeval.msec()
                    if now > wakeup:
                        break
                    delay = (wakeup - now) / 1000.0
                    # Same output as the former Python 2 print statement,
                    # in a form that is also valid on Python 3.
                    sys.stdout.write("sleep %f\n" % delay)
                    time.sleep(delay)
            last_restart = ovs.timeval.msec()

            logging.error("%s, restarting" % status_msg)
            daemon_pid = _fork_and_wait_for_startup()
            if not daemon_pid:
                # Running in new daemon process.
                break
|
|
|
|
def _close_standard_fds():
    """Points stdin, stdout, and stderr at the descriptor returned by
    ovs.socket_util.get_null_fd(), provided that descriptor is valid.  If
    we're started from e.g. an SSH session, this keeps us from holding that
    session open artificially."""
    null_fd = ovs.socket_util.get_null_fd()
    if null_fd < 0:
        return
    for std_fd in (0, 1, 2):
        os.dup2(null_fd, std_fd)
|
|
|
|
def daemonize_start():
    """Begins daemonization according to the configured options, returning
    in the process that is to become the daemon.

    With --detach, the process forks and the parent hangs around until the
    child either reports successful startup (by calling
    daemonize_complete()) or fails to start up (by exiting with a nonzero
    exit code); the parent then exits.

    With --monitor, a further fork splits off the daemon proper.  The
    process left behind notifies its own parent, redirects its standard file
    descriptors, and runs the monitor loop.

    Finally the pidfile, if configured, is created in the daemon process."""
    if _detach and _fork_and_wait_for_startup() > 0:
        # Running in parent process.
        sys.exit(0)
    # Running in daemon or monitor process.

    if _monitor:
        # The fork below overwrites _daemonize_fd in the child, so keep the
        # descriptor that leads back to our own parent.
        parent_notify_fd = _daemonize_fd
        daemon_pid = _fork_and_wait_for_startup()
        if daemon_pid > 0:
            # Running in monitor process.
            _fork_notify_startup(parent_notify_fd)
            _close_standard_fds()
            _monitor_daemon(daemon_pid)
        # Running in daemon process.

    _make_pidfile()
|
|
|
|
def daemonize_complete():
    """Finishes daemonization: tells the waiting parent process, if there is
    one, that startup succeeded.  When detaching was requested, it then
    starts a new session, changes directory to "/" unless that was disabled,
    and redirects the standard file descriptors."""
    _fork_notify_startup(_daemonize_fd)

    if not _detach:
        return

    os.setsid()
    if _chdir:
        os.chdir("/")
    _close_standard_fds()
|
|
|
|
def usage():
    """Writes the help text for the daemon command-line options to stdout,
    filling in the default pidfile location from ovs.dirs.RUNDIR and
    ovs.util.PROGRAM_NAME."""
    help_text = """
Daemon options:
--detach run in background as daemon
--no-chdir do not chdir to '/'
--pidfile[=FILE] create pidfile (default: %s/%s.pid)
--overwrite-pidfile with --pidfile, start even if already running
""" % (ovs.dirs.RUNDIR, ovs.util.PROGRAM_NAME)
    sys.stdout.write(help_text)
|
|
|
|
def __read_pidfile(pidfile, must_exist):
    """Reads the pid stored in 'pidfile', provided that some process holds a
    lock on the file.

    Returns:
      - the positive pid, if the file is locked and contains a pid (or if it
        is this process's own pidfile);
      - 0, if the file does not exist and 'must_exist' is false;
      - -errno.ESRCH, if the file exists but nobody holds a lock on it;
      - -errno.EINVAL, if the file's first line is not an integer;
      - another negative errno value, if opening, locking, or reading
        fails."""
    if _pidfile_dev is not None:
        try:
            s = os.stat(pidfile)
        except OSError:
            s = None
        if (s is not None and
                s.st_ino == _pidfile_ino and s.st_dev == _pidfile_dev):
            # It's our own pidfile.  We can't afford to open it,
            # because closing *any* fd for a file that a process
            # has locked also releases all the locks on that file.
            #
            # Fortunately, we know the associated pid anyhow.
            return os.getpid()

    try:
        # Opened "r+" rather than "r": the exclusive lock attempted below
        # requires a descriptor that is open for writing.  On a read-only
        # descriptor it fails with EBADF regardless of whether the file is
        # locked.
        stream = open(pidfile, "r+")
    except IOError as e:
        if e.errno == errno.ENOENT and not must_exist:
            return 0
        logging.warning("%s: open: %s" % (pidfile, os.strerror(e.errno)))
        return -e.errno

    try:
        # Python fcntl doesn't directly support F_GETLK so we have to just
        # try to lock it.  If we get a conflicting lock that's "success";
        # otherwise the file is not locked.
        try:
            fcntl.lockf(stream, fcntl.LOCK_EX | fcntl.LOCK_NB)
        except IOError as e:
            if e.errno not in (errno.EACCES, errno.EAGAIN):
                logging.warning("%s: fcntl: %s"
                                % (pidfile, os.strerror(e.errno)))
                return -e.errno
        else:
            # File isn't locked if we get here, so treat that as an error.
            # Closing the file in the 'finally' below drops our lock.
            logging.warning("%s: pid file is not locked" % pidfile)
            return -errno.ESRCH

        try:
            return int(stream.readline())
        except IOError as e:
            logging.warning("%s: read: %s" % (pidfile, e.strerror))
            return -e.errno
        except ValueError:
            logging.warning("%s does not contain a pid" % pidfile)
            return -errno.EINVAL
    finally:
        # Runs on every path once the file is open, so the descriptor is
        # never leaked.
        try:
            stream.close()
        except IOError:
            pass
|
|
|
|
def read_pidfile(pidfile):
    """Reads the PID stored in 'pidfile', which is required to exist.
    Returns the positive PID on success and a negative errno value on any
    failure, including a missing file."""
    must_exist = True
    return __read_pidfile(pidfile, must_exist)
|
|
|
|
def read_pidfile_if_exists(pidfile):
    """Reads the PID stored in 'pidfile', tolerating a missing file.
    Returns 0 if 'pidfile' does not exist, the positive PID on success, and
    a negative errno value on any other failure."""
    must_exist = False
    return __read_pidfile(pidfile, must_exist)
|
|
|
|
# XXX Python's getopt cannot express an option whose argument is optional,
# so --pidfile (no argument) and --pidfile-name (argument required) are
# separate options here.  Fixing that would need a getopt of our own.
LONG_OPTIONS = [
    "detach",
    "no-chdir",
    "pidfile",
    "pidfile-name=",
    "overwrite-pidfile",
    "monitor",
]
|
|
|
|
def parse_opt(option, arg):
    """Applies one parsed command-line option to the daemon configuration.

    'option' is the option name including its leading "--".  'arg' is its
    argument and is used only by --pidfile-name.  Returns True if 'option'
    is one of the daemon options and was handled, False otherwise."""
    if option == '--detach':
        set_detach()
        return True
    if option == '--no-chdir':
        set_no_chdir()
        return True
    if option == '--pidfile':
        set_pidfile(None)
        return True
    if option == '--pidfile-name':
        set_pidfile(arg)
        return True
    if option == '--overwrite-pidfile':
        ignore_existing_pidfile()
        return True
    if option == '--monitor':
        set_monitor()
        return True
    return False
|