Commit 65556465 authored by Xavier Thompson's avatar Xavier Thompson

grid/utils.py: Detect too old existing process

parent df92f04d
...@@ -92,6 +92,10 @@ LOCALE_ENVIRONMENT_REMOVE_LIST = [ ...@@ -92,6 +92,10 @@ LOCALE_ENVIRONMENT_REMOVE_LIST = [
'LC_TIME', 'LC_TIME',
] ]
SLAPGRID_TIMEOUT = 60 * 60 * 2
SLAPGRID_KILL_TIMEOUT = 60 * 60 * 24
class LineLogger(object): class LineLogger(object):
""" """
...@@ -249,7 +253,10 @@ def getCleanEnvironment(logger, home_path='/tmp'): ...@@ -249,7 +253,10 @@ def getCleanEnvironment(logger, home_path='/tmp'):
def setRunning(logger, pidfile): def setRunning(logger, pidfile):
"""Creates a pidfile. If a pidfile already exists, we exit""" """
Creates a pidfile. If a pidfile already exists, we exit.
If the pid file is too old, we report a stall.
"""
if os.path.exists(pidfile): if os.path.exists(pidfile):
try: try:
with open(pidfile, 'r') as f: with open(pidfile, 'r') as f:
...@@ -266,9 +273,26 @@ def setRunning(logger, pidfile): ...@@ -266,9 +273,26 @@ def setRunning(logger, pidfile):
'Error getting information about process with pid %s', 'Error getting information about process with pid %s',
pid, exc_info=True) pid, exc_info=True)
if is_slapos_running: if is_slapos_running:
logger.info('New slapos process started, but another slapos ' creation_time = process.create_time()
'process is aleady running with pid %s, exiting.', pid) running_time = time.time() - creation_time
sys.exit(10) if running_time > SLAPGRID_KILL_TIMEOUT:
logger.warning(
"Existing slapos process has been running too long "
"(%ds > %d), killing it",
running_time, SLAPGRID_KILL_TIMEOUT)
killProcessTree(pid, logger)
elif running_time > SLAPGRID_TIMEOUT:
logger.warning(
"Existing slapos process has been running too long "
"(%ds > %d), reporting likely problem",
running_time, SLAPGRID_TIMEOUT)
# report to master ?
else:
logger.info(
"New slapos process started, but another slapos "
"process is aleady running with pid %s for %ds, exiting.",
pid, running_time)
sys.exit(10)
logger.info('Existing pid file %r was stale, overwritten', pidfile) logger.info('Existing pid file %r was stale, overwritten', pidfile)
# Start new process # Start new process
write_pid(logger, pidfile) write_pid(logger, pidfile)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment