2003-06-14 21:39:57 +00:00
|
|
|
#!/usr/bin/env python
|
2004-06-11 09:54:23 +00:00
|
|
|
# -*- mode: python; python-indent: 4; -*-
|
2003-06-14 21:39:57 +00:00
|
|
|
|
|
|
|
## $Id$
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
'''
|
2004-05-27 19:32:32 +00:00
|
|
|
A program to start/stop BOINC server daemons and run periodic tasks.
|
|
|
|
Parses config.xml and runs <daemon> and <task> entries.
|
|
|
|
The format of config.xml is described in boinc/doc/configuration.php.
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-12-02 22:47:32 +00:00
|
|
|
The main script is "start"; sym-link or hard-link "start" to "stop" or "status".
|
2003-06-14 21:39:58 +00:00
|
|
|
Invocation methods:
|
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
--enable (default if invoked as "start")
|
2003-12-02 22:47:32 +00:00
|
|
|
Set the project to ENABLED mode and start daemons
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-12-02 22:47:32 +00:00
|
|
|
--cron If project is in ENABLED mode start daemons and run tasks;
|
|
|
|
else do nothing.
|
|
|
|
This command is intended to be run as a real cron job
|
2003-06-14 21:40:00 +00:00
|
|
|
every five minutes.
|
2005-01-18 23:35:53 +00:00
|
|
|
--cron-tasks Run tasks but do not start daemons;
|
|
|
|
This command is intended to be run as a real cron job
|
|
|
|
every five minutes.
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-12-02 22:47:32 +00:00
|
|
|
--disable (default if invoked as "stop")
|
|
|
|
Set project to DISABLED mode and stop daemons.
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
--status Show status.
|
|
|
|
|
|
|
|
See "start --help" for options.
|
|
|
|
|
2003-12-06 19:42:21 +00:00
|
|
|
Daemons:
|
|
|
|
These are continuously-running programs.
|
2003-12-23 19:21:52 +00:00
|
|
|
The process ID is recorded in the <pid_dir> directory
|
|
|
|
and the process is sent a SIGHUP in a DISABLE operation.
|
2003-12-06 19:42:21 +00:00
|
|
|
|
|
|
|
Both tasks and daemons can run on a different host (specified by <host>).
|
2003-12-30 19:29:54 +00:00
|
|
|
The default is the project's main host, which is specified in config.host
|
|
|
|
A daemon or task can be turned off by adding the <disabled/> element.
|
2003-06-14 21:39:59 +00:00
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
IMPLEMENTATION:
|
2003-06-14 21:39:59 +00:00
|
|
|
|
2004-05-03 19:30:01 +00:00
|
|
|
"Start" uses a file "run_state_HOST.xml" that records the enabled mode
|
2003-12-06 19:42:21 +00:00
|
|
|
and the last run time of periodic tasks on that host.
|
2003-12-02 22:47:32 +00:00
|
|
|
Looks like this:
|
|
|
|
<?xml version="1.0"?>
|
|
|
|
<boinc>
|
|
|
|
<tasks>
|
|
|
|
<task>
|
|
|
|
<cmd>
|
|
|
|
get_load
|
|
|
|
</cmd>
|
|
|
|
<last_run>
|
|
|
|
1070392808.86
|
|
|
|
</last_run>
|
|
|
|
</task>
|
|
|
|
...
|
|
|
|
</tasks>
|
|
|
|
<enabled>
|
|
|
|
1
|
|
|
|
</enabled>
|
|
|
|
</boinc>
|
|
|
|
|
|
|
|
|
2003-06-14 21:39:59 +00:00
|
|
|
Daemons:
|
2004-05-27 19:32:32 +00:00
|
|
|
Writes a PID to pid_HOST/command.pid.
|
2003-06-14 21:39:59 +00:00
|
|
|
|
2003-12-06 19:42:21 +00:00
|
|
|
Tasks:
|
|
|
|
Writes a timestamp to run_state_HOST.xml
|
|
|
|
to remember when the task was last run.
|
2003-06-14 21:39:59 +00:00
|
|
|
|
|
|
|
Both:
|
2004-05-27 19:32:32 +00:00
|
|
|
A lock file (pid_HOST/command.lock)
|
2003-12-06 19:42:21 +00:00
|
|
|
prevents tasks and daemons from being run
|
2003-06-14 21:39:59 +00:00
|
|
|
again when they are currently running.
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
'''
|
|
|
|
|
2004-11-24 07:17:46 +00:00
|
|
|
import configxml
|
2003-12-06 19:42:21 +00:00
|
|
|
import sys, os, getopt, time, glob, fcntl, signal, socket
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2004-05-13 17:00:52 +00:00
|
|
|
# Wall-clock time (whole seconds) captured once at startup; used as "now"
# for every timestamp comparison and update made during this run.
right_now = int(time.time())
# Be chatty by default only when stdout is a terminal (see -q / -v).
verbose = os.isatty(sys.stdout.fileno())
# When true, run_daemon() announces a daemon start even if not verbose.
verbose_daemon_run = 0
# how long (in seconds) parent should wait before continuing after a fork.
# this is just a safety measure in case anything doesn't play nice if
# starting simultaneously.  also it keeps output in sequence.
fork_delay = 0.1
# When true, time_to_run_task() treats every task as due.
ignore_timestamps = False
# When true, do_prune_run_states() deletes run_state entries not touched
# during this run.
prune_run_state = True
# Placeholders; both are given their real values in the main program below.
is_main_host = False
local_hostname = ''
# Selects os.P_NOWAIT instead of os.P_WAIT when the main host re-runs this
# command on the other hosts over ssh.
delegate_other_hosts_in_parallel = False
|
2003-12-06 19:42:21 +00:00
|
|
|
|
|
|
|
def get_host_list():
    '''
    Collect every distinct host named in a <host> element of a task or daemon.

    Tasks are scanned before daemons.  Each host is listed once, in the
    order it was first seen; entries without a host are ignored.
    '''
    seen_hosts = []
    for entries in (config.tasks, config.daemons):
        for entry in entries:
            host = entry.__dict__.get('host')
            if not host or host in seen_hosts:
                continue
            seen_hosts.append(host)
    return seen_hosts
|
|
|
|
|
2003-12-30 19:29:54 +00:00
|
|
|
def assign_task_defaults():
    '''
    Fill in the "host" and "disabled" attributes of every task and daemon.

    An entry without a host gets the project's main host
    (config.config.host); "disabled" is normalised to the integer 1 or 0.
    '''
    for entries in (config.tasks, config.daemons):
        for entry in entries:
            if not entry.__dict__.get('host'):
                entry.host = config.config.host
            entry.disabled = int(bool(entry.__dict__.get('disabled')))
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def get_dir(name):
    '''
    Return the directory configured as NAME_dir in the project config,
    or PROJECT_DIR/NAME when that setting is absent or empty.
    '''
    configured = config.config.__dict__.get(name + '_dir')
    if configured:
        return configured
    return os.path.join(project_dir, name)
|
|
|
|
|
|
|
|
def ensure_get_dir(name):
    '''Like get_dir(), but first try to create the directory.'''
    directory = get_dir(name)
    ensure_dir(directory)
    return directory
|
|
|
|
|
|
|
|
def is_daemon(task):
    '''Return True when the config entry's _name is "daemon".'''
    kind = task._name
    return kind == 'daemon'
|
|
|
|
|
2003-06-14 21:40:03 +00:00
|
|
|
def get_task_command_basename(task):
    '''
    Return the file name of the program in task.cmd: the first
    whitespace-separated word, with any directory part removed.
    '''
    program = task.cmd.split()[0]
    return os.path.basename(program)
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def get_task_output_name(task):
    '''
    Return the path under log_dir that receives a task's output:
    the entry's "output" setting if present, otherwise COMMAND.out.
    '''
    filename = task.__dict__.get('output')
    if not filename:
        filename = get_task_command_basename(task) + '.out'
    return os.path.join(log_dir, filename)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-06-14 21:40:04 +00:00
|
|
|
def get_daemon_output_name(task):
    '''
    Return the path under log_dir that receives a daemon's output:
    the entry's "output" setting if present, otherwise COMMAND.log.
    '''
    filename = task.__dict__.get('output')
    if not filename:
        filename = get_task_command_basename(task) + '.log'
    return os.path.join(log_dir, filename)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def get_daemon_pid_name(task):
    '''
    Return the path under pid_dir of a daemon's PID file:
    the entry's "pid_file" setting if present, otherwise COMMAND.pid.
    '''
    filename = task.__dict__.get('pid_file')
    if not filename:
        filename = get_task_command_basename(task) + '.pid'
    return os.path.join(pid_dir, filename)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-06-14 21:40:07 +00:00
|
|
|
def output_is_file(filename):
    '''
    Tell whether FILENAME names something other than a /dev/ entry.

    A false FILENAME (None or '') is returned unchanged; otherwise the
    result is True unless the name starts with "/dev/".
    '''
    if not filename:
        return filename
    return not filename.startswith('/dev/')
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def get_task_lock_name(task):
    '''
    Return the lock-file path (under pid_dir) for a task or daemon.

    Preference order: the entry's "lock_file" setting; else OUTPUT.lock
    when "output" names something other than a /dev/ entry; else
    COMMAND.lock.
    '''
    settings = task.__dict__
    lock_name = settings.get('lock_file')
    if not lock_name:
        output = settings.get('output')
        if output_is_file(output):
            lock_name = output + '.lock'
        else:
            lock_name = get_task_command_basename(task) + '.lock'
    return os.path.join(pid_dir, lock_name)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def ensure_dir(filename):
    '''
    Create directory FILENAME if possible.

    Any OSError raised by mkdir (for example because the directory
    already exists) is deliberately ignored, so repeated calls are safe.
    '''
    try:
        os.mkdir(filename)
    except OSError:
        pass
|
|
|
|
|
2003-06-14 21:40:02 +00:00
|
|
|
def timestamp(t = None):
    '''
    Format T (seconds since the epoch) as local time "YYYY/MM/DD HH:MM:SS".

    A missing or zero T means the start time of this run (right_now).
    '''
    when = t or right_now
    return time.strftime('%Y/%m/%d %H:%M:%S', time.localtime(when))
|
2003-06-14 21:39:59 +00:00
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
def safe_read_int(filename):
    '''
    Return the integer on the first line of FILENAME, or 0 on failure.

    A file that cannot be opened or read, and a first line that is not an
    integer, both yield 0.  The file is always closed before returning.
    Only I/O and parse errors are swallowed, so an interrupt (Ctrl-C) is
    no longer silently turned into 0.
    '''
    try:
        f = open(filename)
        try:
            return int(f.readline().strip())
        finally:
            f.close()
    except (IOError, OSError, ValueError):
        return 0
|
|
|
|
|
2004-05-03 19:30:01 +00:00
|
|
|
def get_stop_daemons_filename():
    '''Return the path of the "stop_daemons" file in the project directory.'''
    trigger_name = 'stop_daemons'
    return os.path.join(project_dir, trigger_name)
|
2003-06-14 21:40:00 +00:00
|
|
|
|
2004-05-03 19:30:01 +00:00
|
|
|
def get_stop_sched_filename():
    '''Return the path of the "stop_sched" file in the project directory.'''
    trigger_name = 'stop_sched'
    return os.path.join(project_dir, trigger_name)
|
2003-06-14 21:40:00 +00:00
|
|
|
|
2004-05-03 19:30:01 +00:00
|
|
|
def write_stop_daemons():
    '''
    Create (or overwrite) the stop_daemons file with the line "<stop/>".

    The file is closed explicitly so its contents are written out by the
    time this returns, instead of whenever the file object is collected.
    '''
    f = open(get_stop_daemons_filename(), 'w')
    try:
        f.write('<stop/>\n')
    finally:
        f.close()
|
|
|
|
|
|
|
|
def remove_stop_daemons():
    '''Delete the stop_daemons file if it exists.'''
    trigger = get_stop_daemons_filename()
    if not os.path.exists(trigger):
        return
    os.unlink(trigger)
|
|
|
|
|
|
|
|
def write_stop_sched():
    '''
    Create (or overwrite) the stop_sched file with the line "<stop/>".

    The file is closed explicitly so its contents are written out by the
    time this returns, instead of whenever the file object is collected.
    '''
    f = open(get_stop_sched_filename(), 'w')
    try:
        f.write('<stop/>\n')
    finally:
        f.close()
|
|
|
|
|
|
|
|
def remove_stop_sched():
    '''Delete the stop_sched file if it exists.'''
    trigger = get_stop_sched_filename()
    if not os.path.exists(trigger):
        return
    os.unlink(trigger)
|
2003-06-14 21:40:00 +00:00
|
|
|
|
|
|
|
def safe_unlink(filename):
|
|
|
|
try:
|
|
|
|
os.unlink(filename)
|
|
|
|
except OSError, e:
|
|
|
|
print "Couldn't unlink %s:"%filename,e
|
|
|
|
|
2004-06-10 19:43:54 +00:00
|
|
|
def remove_cached_home_page():
|
2004-08-03 16:42:22 +00:00
|
|
|
path = os.path.join(project_dir, 'html/cache/65/index.php')
|
2004-06-14 01:51:04 +00:00
|
|
|
if os.path.exists(path):
|
|
|
|
print 'removing ' + path
|
|
|
|
safe_unlink(path)
|
2004-06-10 19:43:54 +00:00
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
def redirect(stdout='/dev/null', stderr=None, stdin='/dev/null'):
    '''
    Re-point this process's standard file descriptors at named files.

    STDIN is opened for reading; STDOUT and STDERR are opened in 'a+'
    mode.  When STDERR is not given, or names the same file as STDOUT,
    both descriptors share one unbuffered file object.  STDIN and STDOUT
    default to /dev/null.
    '''
    input_file = open(stdin, 'r')
    if not stderr:
        stderr = stdout
    error_file = open(stderr, 'a+', 0)      # third argument 0: unbuffered
    if stdout == stderr:
        output_file = error_file
    else:
        output_file = open(stdout, 'a+')

    # Redirect standard file descriptors.
    replacements = ((input_file, sys.stdin),
                    (output_file, sys.stdout),
                    (error_file, sys.stderr))
    for new_file, standard_file in replacements:
        os.dup2(new_file.fileno(), standard_file.fileno())
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:39:59 +00:00
|
|
|
def fork():
    '''
    os.fork() with fork_delay: the parent sleeps fork_delay seconds
    before returning.  Returns what os.fork() returned.
    '''
    child_pid = os.fork()
    if child_pid != 0:
        # parent side only
        time.sleep(fork_delay)
    return child_pid
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def double_fork():
|
|
|
|
'''
|
|
|
|
This forks the current process into a daemon using a double-fork.
|
|
|
|
Returns 1 for parent, 0 for child.
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
See: http://www.erlenstar.demon.co.uk/unix/faq_2.html#SEC16
|
|
|
|
http://aspn.activestate.com/ASPN/Cookbook/Python/Recipe/66012
|
|
|
|
'''
|
|
|
|
# this is necessary because otherwise any buffered output would get
|
|
|
|
# printed twice after the fork!
|
|
|
|
sys.stdout.flush()
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
# Do first fork.
|
|
|
|
try:
|
2003-06-14 21:39:59 +00:00
|
|
|
pid = fork()
|
2003-06-14 21:39:58 +00:00
|
|
|
if pid > 0: return 1
|
|
|
|
except OSError, e:
|
|
|
|
sys.stderr.write("fork #1 failed: (%d) %s\n" % (e.errno, e.strerror))
|
|
|
|
sys.exit(1)
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
# Decouple from parent environment.
|
|
|
|
os.chdir("/")
|
|
|
|
os.umask(0)
|
|
|
|
os.setsid()
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
# Do second fork.
|
|
|
|
try:
|
|
|
|
pid = os.fork()
|
2003-07-15 22:03:04 +00:00
|
|
|
if pid > 0: os._exit(0) # Exit second parent.
|
2003-06-14 21:39:58 +00:00
|
|
|
except OSError, e:
|
|
|
|
sys.stderr.write("fork #2 failed: (%d) %s\n" % (e.errno, e.strerror))
|
2003-07-15 22:03:04 +00:00
|
|
|
os._exit(1)
|
2003-06-14 21:39:58 +00:00
|
|
|
return 0
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
def write_pid_file(pidfile):
    '''
    Write this process's PID, followed by a newline, to PIDFILE.

    The file is closed explicitly so the PID is written out before this
    returns (run_daemon() execs the daemon right afterwards).
    '''
    f = open(pidfile, 'w')
    try:
        f.write('%d\n' % os.getpid())
    finally:
        f.close()
|
|
|
|
|
2003-06-14 21:40:02 +00:00
|
|
|
def is_pid_running(pid):
    '''
    Probe process PID with signal 0.

    Returns True when os.kill() succeeds and False when it raises
    OSError (for any reason).
    '''
    try:
        os.kill(pid, 0)
    except OSError:
        return False
    return True
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
# if we ever want to use this on windows see:
#   http://aspn.activestate.com/ASPN/Cookbook/Python/Recipe/65203

# Every file object opened by lock_file(); keeping a reference here keeps
# the file (and presumably its lock) open for the life of the process.
locks = []
def lock_file(filename):
    '''
    Try to take an exclusive, non-blocking lock on FILENAME.

    The file is opened with mode 'w' (created or truncated).  On success
    the result of fcntl.lockf() is returned; callers treat any true
    result as "already locked".  If lockf raises IOError, returns -1.
    '''
    global locks
    handle = open(filename, 'w')
    locks.append(handle)
    try:
        return fcntl.lockf(handle.fileno(), fcntl.LOCK_EX | fcntl.LOCK_NB)
    except IOError:
        return -1
|
|
|
|
|
2003-06-14 21:40:02 +00:00
|
|
|
def is_lock_file_locked(filename):
    '''
    Report whether the lock on FILENAME is currently held elsewhere.

    Works by trying to take the lock with lock_file(): returns True if
    that fails.  Otherwise the lock file is deleted and False is returned
    (previously this path fell off the end and returned None).

    NOTE: on the False path lock_file() has kept the now-deleted file
    open, so this process retains it until exit.
    '''
    if lock_file(filename):
        return True
    os.unlink(filename)
    return False
|
|
|
|
|
2003-06-14 21:40:01 +00:00
|
|
|
def contains_shell_characters(command):
    '''
    Return True if COMMAND contains a double quote, single quote,
    backslash, pipe or '>' character, else False.
    '''
    for special in ('"', "'", '\\', '|', '>'):
        if special in command:
            return True
    return False
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def exec_command_string(command):
|
2003-06-14 21:40:01 +00:00
|
|
|
args = command.strip().split()
|
2003-06-14 21:39:58 +00:00
|
|
|
# set default path for program to <bin_dir>:
|
2003-06-14 21:39:59 +00:00
|
|
|
args[0] = os.path.realpath(os.path.join( bin_dir, args[0] ))
|
2004-07-28 01:26:36 +00:00
|
|
|
os.chdir(tmp_dir)
|
2003-06-14 21:39:59 +00:00
|
|
|
try:
|
2003-06-14 21:40:01 +00:00
|
|
|
if contains_shell_characters(command):
|
|
|
|
os.execl('/bin/sh', 'sh', '-c', ' '.join(args))
|
|
|
|
else:
|
|
|
|
os.execv( args[0], args )
|
2003-06-14 21:39:59 +00:00
|
|
|
# on success we don't reach here
|
2003-06-14 21:40:01 +00:00
|
|
|
print >>sys.stderr, "Couldn't exec '%s'"%command
|
2003-06-14 21:39:59 +00:00
|
|
|
except OSError, e:
|
|
|
|
print >>sys.stderr, "Couldn't execute '%s':" %command, e
|
|
|
|
os._exit(1)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-06-14 21:39:59 +00:00
|
|
|
def lookup_task_run_state(task):
    '''
    Return the run_state record whose cmd equals TASK's cmd.

    If none exists, a new <task> node is appended with that cmd and
    last_run = 0.  Either way the record is marked prunable = False.
    '''
    record = None
    for candidate in run_state.tasks:
        if candidate.cmd == task.cmd:
            record = candidate
            break
    if record is None:
        record = run_state.tasks.make_node_and_append('task')
        record.cmd = task.cmd
        record.last_run = 0
    record.prunable = False
    return record
|
|
|
|
|
|
|
|
def interpret_period(str):
    '''
    Convert a task period to a number of seconds.

    "5 min" -> 5*60 ; "1 hour" -> 1*60*60 ; "2 months" -> 2*30*24*60*60 ;
    "2" -> 2*60

    The period is an integer optionally followed by one unit word.  A
    bare number means minutes.  The unit is matched case-insensitively by
    prefix: s(econds), mo(nths, counted as 30 days), m(inutes), h(ours),
    d(ays), w(eeks).

    Raises SystemExit for anything else, including an empty string.
    '''
    # 'mo' must be tried before 'm'; otherwise "months" is taken for
    # minutes and the month entry can never match.
    unit_seconds = (
        ('s', 1),
        ('mo', 60 * 60 * 24 * 30),
        ('m', 60),
        ('h', 60 * 60),
        ('d', 60 * 60 * 24),
        ('w', 60 * 60 * 24 * 7),
    )
    fields = str.strip().split()
    if len(fields) in (1, 2):
        try:
            num = int(fields[0])
        except ValueError:
            num = None
        if num is not None:
            if len(fields) == 1:
                return num * 60
            unit = fields[1].lower()
            for prefix, seconds in unit_seconds:
                if unit.startswith(prefix):
                    return num * seconds
    raise SystemExit('Invalid task period "%s"' % str)
|
|
|
|
|
|
|
|
|
|
|
|
def when_will_task_next_run(task, task_run_state):
    '''
    Return the time (seconds since the epoch, as a float) at which TASK
    is next due: its recorded last run plus its period.
    '''
    last_run = float(task_run_state.last_run)
    period = interpret_period(task.period)
    return last_run + period
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2003-06-14 21:39:59 +00:00
|
|
|
def time_to_run_task(task, task_run_state):
    '''
    Return a true value when TASK should run now: always when
    ignore_timestamps is set, otherwise when its next-run time is not
    later than right_now.
    '''
    if ignore_timestamps:
        return ignore_timestamps
    return right_now >= when_will_task_next_run(task, task_run_state)
|
2003-06-14 21:39:59 +00:00
|
|
|
|
|
|
|
def update_task_timestamp(task_run_state):
    '''Record right_now (this run's start time) as the task's last run.'''
    started_at = right_now
    task_run_state.last_run = started_at
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def run_task(task):
|
|
|
|
'''Fork and exec command without stdout/err redirection'''
|
2003-06-14 21:39:59 +00:00
|
|
|
task_run_state = lookup_task_run_state(task)
|
|
|
|
if not time_to_run_task(task, task_run_state):
|
2003-06-14 21:39:58 +00:00
|
|
|
if verbose:
|
|
|
|
print " Not running task because not time yet:",task.cmd
|
|
|
|
return
|
|
|
|
if verbose:
|
|
|
|
print " Running task:", task.cmd
|
2003-06-14 21:40:03 +00:00
|
|
|
update_task_timestamp(task_run_state)
|
2003-06-14 21:39:58 +00:00
|
|
|
# we don't need the full double-fork because this should finish quickly
|
2003-06-14 21:39:59 +00:00
|
|
|
if fork() > 0: return
|
2003-06-14 21:39:58 +00:00
|
|
|
if lock_file(get_task_lock_name(task)):
|
2003-06-14 21:40:03 +00:00
|
|
|
print >>sys.stderr, " Task currently running! (%s)"%task.cmd
|
2003-06-14 21:39:58 +00:00
|
|
|
sys.exit(1)
|
2003-06-14 21:40:00 +00:00
|
|
|
redirect(get_task_output_name(task))
|
2003-06-14 21:39:58 +00:00
|
|
|
exec_command_string(task.cmd)
|
|
|
|
|
|
|
|
def run_daemon(task):
|
|
|
|
'''Double-fork and exec command with stdout/err redirection and pid writing'''
|
|
|
|
if double_fork() > 0: return
|
|
|
|
if lock_file(get_task_lock_name(task)):
|
|
|
|
if verbose:
|
2003-06-14 21:39:59 +00:00
|
|
|
print >>sys.stderr, " Daemon already running:",task.cmd
|
2003-06-14 21:39:58 +00:00
|
|
|
sys.exit(0)
|
2003-06-14 21:39:59 +00:00
|
|
|
if verbose or verbose_daemon_run:
|
|
|
|
print " Starting daemon:", task.cmd
|
|
|
|
sys.stdout.flush()
|
2003-06-14 21:40:00 +00:00
|
|
|
redirect(get_daemon_output_name(task))
|
|
|
|
write_pid_file(get_daemon_pid_name(task))
|
2003-06-14 21:39:59 +00:00
|
|
|
print "[%s] Executing command:"%timestamp(), task.cmd
|
|
|
|
sys.stdout.flush()
|
2003-06-14 21:39:58 +00:00
|
|
|
exec_command_string(task.cmd)
|
|
|
|
|
|
|
|
def run_daemons():
|
|
|
|
if verbose: print "Starting daemons"
|
2003-12-06 19:42:21 +00:00
|
|
|
if is_main_host:
|
2004-05-03 19:30:01 +00:00
|
|
|
remove_stop_daemons()
|
2003-12-06 19:42:21 +00:00
|
|
|
for task in config.daemons:
|
|
|
|
if task.host != local_hostname:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2003-12-30 19:29:54 +00:00
|
|
|
if task.disabled:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2003-12-06 19:42:21 +00:00
|
|
|
run_daemon(task)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def run_tasks():
|
|
|
|
if verbose: print "Running tasks"
|
2004-06-11 09:54:23 +00:00
|
|
|
prepare_run_state_pruning()
|
2003-12-06 19:42:21 +00:00
|
|
|
for task in config.tasks:
|
|
|
|
if task.host != local_hostname:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2003-12-30 19:29:54 +00:00
|
|
|
if task.disabled:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2004-10-27 21:04:15 +00:00
|
|
|
if task.__dict__.get('always_run'):
|
|
|
|
run_task(task)
|
|
|
|
continue
|
|
|
|
if run_state.enabled:
|
|
|
|
run_task(task)
|
2004-06-11 09:54:23 +00:00
|
|
|
do_prune_run_states()
|
|
|
|
|
|
|
|
def prepare_run_state_pruning():
    '''
    Mark every run_state task as prunable; lookup_task_run_state() clears
    the mark on each record it returns.
    '''
    for record in run_state.tasks:
        record.prunable = True
|
|
|
|
|
|
|
|
def do_prune_run_states():
|
|
|
|
'''\
|
|
|
|
|
|
|
|
Delete tasks that have prunable==True (since we didn't touch them this run)
|
|
|
|
|
|
|
|
'''
|
|
|
|
|
|
|
|
if not prune_run_state:
|
|
|
|
return
|
|
|
|
for run_state_task in run_state.tasks:
|
|
|
|
if run_state_task.prunable:
|
2004-06-11 10:10:59 +00:00
|
|
|
print 'Deleting obsolete run_state task', run_state_task.cmd, '(last run %s)' %timestamp(float(run_state_task.last_run))
|
2004-06-11 10:20:07 +00:00
|
|
|
run_state.tasks.remove_node(run_state_task)
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def stop_daemon(pid):
|
|
|
|
'''returns 1 if something stopped, else 0'''
|
|
|
|
try:
|
2003-12-23 19:21:52 +00:00
|
|
|
os.kill(pid, signal.SIGHUP)
|
2003-06-14 21:39:58 +00:00
|
|
|
except OSError, e:
|
|
|
|
if e.errno != 3:
|
|
|
|
print >>sys.stderr, "Warning: couldn't kill pid %d:"%pid, e
|
|
|
|
return 0
|
|
|
|
if verbose:
|
|
|
|
print " Killed process", pid
|
|
|
|
return 1
|
|
|
|
|
2003-07-25 23:57:24 +00:00
|
|
|
def wait_for_process_to_end(pid):
|
|
|
|
'''if process is still running, wait for it to end.'''
|
|
|
|
if is_pid_running(pid):
|
|
|
|
if verbose:
|
|
|
|
print " Waiting for process",pid,"to end: ",
|
2003-07-25 23:57:26 +00:00
|
|
|
sys.stdout.flush()
|
2003-07-25 23:57:24 +00:00
|
|
|
while is_pid_running(pid):
|
|
|
|
if verbose:
|
2003-07-25 23:57:26 +00:00
|
|
|
sys.stdout.write('.')
|
|
|
|
sys.stdout.flush()
|
2003-07-25 23:57:24 +00:00
|
|
|
time.sleep(.5)
|
|
|
|
if verbose:
|
|
|
|
print ' ok'
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def stop_daemons():
|
|
|
|
if verbose: print "Stopping all daemons"
|
2004-05-03 19:30:01 +00:00
|
|
|
write_stop_daemons()
|
2003-06-14 21:39:58 +00:00
|
|
|
pid_files = glob.glob(os.path.join(pid_dir, '*.pid'))
|
|
|
|
count = 0
|
2003-07-25 23:57:24 +00:00
|
|
|
pids = map(safe_read_int, pid_files)
|
2003-07-25 23:57:25 +00:00
|
|
|
map(safe_unlink, pid_files)
|
2003-07-25 23:57:24 +00:00
|
|
|
for pid in pids:
|
|
|
|
count += stop_daemon(pid)
|
|
|
|
for pid in pids:
|
|
|
|
wait_for_process_to_end(pid)
|
2003-06-14 21:39:58 +00:00
|
|
|
if verbose:
|
|
|
|
if not count:
|
2003-06-14 21:40:00 +00:00
|
|
|
print " (No processes stopped)"
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
|
|
|
|
######################################################################
|
|
|
|
## command (action) functions:
|
|
|
|
def command_enable_start():
|
|
|
|
if verbose:
|
|
|
|
if run_state.enabled:
|
|
|
|
print "Staying in ENABLED mode"
|
|
|
|
else:
|
|
|
|
print "Entering ENABLED mode"
|
2004-06-04 12:01:17 +00:00
|
|
|
# NOTE: must use '1', not '0' here
|
|
|
|
run_state.enabled = 1
|
2003-06-14 21:39:58 +00:00
|
|
|
run_daemons()
|
2004-04-30 19:33:05 +00:00
|
|
|
time.sleep(10) # give feeder time to start up and create shmem
|
2004-05-03 19:30:01 +00:00
|
|
|
remove_stop_sched()
|
2004-06-10 19:43:54 +00:00
|
|
|
remove_cached_home_page()
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def command_cron_start():
|
2003-06-14 21:40:04 +00:00
|
|
|
if verbose: print "Verbose cron-start: status ==", (run_state.enabled and 'ENABLED' or 'DISABLED')
|
2004-10-27 21:04:15 +00:00
|
|
|
global verbose_daemon_run
|
2003-06-14 21:39:58 +00:00
|
|
|
if run_state.enabled:
|
|
|
|
verbose_daemon_run = 1
|
|
|
|
run_daemons()
|
|
|
|
run_tasks()
|
2004-10-27 21:04:15 +00:00
|
|
|
else:
|
|
|
|
verbose_daemon_run = 1
|
|
|
|
run_tasks()
|
2003-06-14 21:39:58 +00:00
|
|
|
|
2005-01-18 23:35:53 +00:00
|
|
|
def command_tasks_start():
|
|
|
|
if verbose: print "Verbose cron-start: status ==", (run_state.enabled and 'ENABLED' or 'DISABLED')
|
|
|
|
run_tasks()
|
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
def command_disable_stop():
|
2003-06-14 21:39:59 +00:00
|
|
|
if verbose:
|
|
|
|
if run_state.enabled:
|
|
|
|
print "Entering DISABLED mode"
|
|
|
|
else:
|
|
|
|
print "Staying in DISABLED mode"
|
2004-06-04 12:01:17 +00:00
|
|
|
run_state.enabled = 0
|
2007-04-17 23:08:24 +00:00
|
|
|
write_stop_sched() # do this before stop_daemons(),
|
|
|
|
# else scheduler will complained about no shared mem
|
2003-06-14 21:39:58 +00:00
|
|
|
stop_daemons()
|
2004-06-10 19:43:54 +00:00
|
|
|
remove_cached_home_page()
|
2003-06-14 21:39:58 +00:00
|
|
|
|
|
|
|
def command_status():
|
|
|
|
if run_state.enabled:
|
|
|
|
print "BOINC is ENABLED"
|
|
|
|
else:
|
|
|
|
print "BOINC is DISABLED"
|
2003-06-14 21:39:59 +00:00
|
|
|
if verbose:
|
2003-06-14 21:40:02 +00:00
|
|
|
print
|
2006-12-29 19:01:03 +00:00
|
|
|
print "DAEMON pid status lockfile disabled commandline"
|
2003-06-14 21:40:02 +00:00
|
|
|
n = 0
|
|
|
|
for task in config.daemons:
|
2003-12-06 19:42:21 +00:00
|
|
|
if task.host != local_hostname:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2003-06-14 21:40:02 +00:00
|
|
|
n += 1
|
|
|
|
pid = safe_read_int(get_daemon_pid_name(task)) or 0
|
|
|
|
if not pid:
|
2006-12-29 19:01:03 +00:00
|
|
|
rs = " "
|
2003-06-14 21:40:02 +00:00
|
|
|
elif is_pid_running(pid):
|
2006-12-29 19:01:03 +00:00
|
|
|
rs = " running "
|
2003-06-14 21:40:02 +00:00
|
|
|
else:
|
2006-12-29 19:01:03 +00:00
|
|
|
rs = "NOT RUNNING"
|
2003-06-14 21:40:02 +00:00
|
|
|
if is_lock_file_locked(get_task_lock_name(task)):
|
|
|
|
lu = " locked "
|
|
|
|
else:
|
|
|
|
lu = "UNLOCKED"
|
2003-12-30 19:29:54 +00:00
|
|
|
|
|
|
|
if task.disabled:
|
|
|
|
d = " yes "
|
|
|
|
else:
|
|
|
|
d = " no "
|
|
|
|
|
|
|
|
print " %2d"%n, " %5d"%pid, rs, lu, d, " ", task.cmd
|
2003-06-14 21:40:02 +00:00
|
|
|
print
|
2006-12-29 19:01:03 +00:00
|
|
|
print "TASK last run period next run lock file disabled commandline"
|
2003-06-14 21:40:02 +00:00
|
|
|
n = 0
|
|
|
|
for task in config.tasks:
|
2003-12-06 19:42:21 +00:00
|
|
|
if task.host != local_hostname:
|
2004-01-13 02:47:34 +00:00
|
|
|
continue
|
2003-06-14 21:40:02 +00:00
|
|
|
n += 1
|
|
|
|
task_run_state = lookup_task_run_state(task)
|
2003-06-14 21:40:03 +00:00
|
|
|
when_last_run = float(task_run_state.last_run)
|
|
|
|
last_run = when_last_run and timestamp(when_last_run) or '?'
|
2003-06-14 21:40:02 +00:00
|
|
|
when_next_run = when_will_task_next_run(task, lookup_task_run_state(task))
|
2004-05-13 17:00:52 +00:00
|
|
|
next_run = (when_next_run <= right_now) and 'NOW' or timestamp(when_next_run)
|
2003-06-14 21:40:02 +00:00
|
|
|
if is_lock_file_locked(get_task_lock_name(task)):
|
2003-06-14 21:40:03 +00:00
|
|
|
lu = " LOCKED "
|
2003-06-14 21:40:02 +00:00
|
|
|
else:
|
2003-06-14 21:40:03 +00:00
|
|
|
lu = "unlocked"
|
2003-12-30 19:29:54 +00:00
|
|
|
|
|
|
|
if task.disabled:
|
|
|
|
d = " yes "
|
|
|
|
else:
|
|
|
|
d = " no "
|
2003-06-14 21:40:03 +00:00
|
|
|
print " %2d"%n, last_run.center(20), task.period.ljust(10), \
|
2003-12-30 19:29:54 +00:00
|
|
|
next_run.center(20), lu, d, " ", task.cmd
|
2003-06-14 21:39:59 +00:00
|
|
|
pass
|
2003-06-14 21:39:57 +00:00
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
def command_show_config():
    '''--show-config: not implemented yet; exits with the message "TODO".'''
    # TODO: - all config items (e.g. where's logdir?)
    message = 'TODO'
    raise SystemExit(message)
|
|
|
|
|
2003-12-06 19:42:21 +00:00
|
|
|
# ------------- main program begins here ---------------------
|
|
|
|
|
|
|
|
# Short host name: everything before the first dot.
local_hostname = socket.gethostname().split('.')[0]
cwd = os.getcwd()

# The name this script was invoked under selects the default command;
# any other name leaves it unset until an option chooses one.
program_name = os.path.basename(sys.argv[0])
command = {
    'start':  command_enable_start,
    'stop':   command_disable_stop,
    'status': command_status,
}.get(program_name)
|
|
|
|
|
2003-06-14 21:39:57 +00:00
|
|
|
def help():
    '''
    Print the usage text to stderr, mention the default action implied
    by the invocation name (start/stop), and exit with status 1.
    '''
    print >>sys.stderr, "Syntax: %s [options] [command]" % sys.argv[0]
    print >>sys.stderr, """ Starts or stops BOINC daemons and tasks.

Commands:
--enable (-e) Set BOINC to ENABLED mode and start daemons
--cron (-c) If ENABLED, start daemons and run tasks
Intended to be run from real cron every 5 min.
--cron-tasks If ENABLED run tasks only and do not start daemons
Intended to be run from real cron every 5 min.

--disable (-d) Set BOINC to DISABLED mode and stop daemons
--status (-s) Show status.
--show-config Show configuration

Options:
--quiet (-q) Operate quietly, even if STDOUT is a tty.
--verbose (-v) Operate verbosely, even if STDOUT is not a tty.

--config-file= Use specified file instead of program-path/../config.xml
--run-state-file= Use specified file instead of program-path/../run_state.xml
--fork-delay= Seconds to sleep between daemon forks instead of 0.1
--ignore-timestamps Ignore timestamps; for cron mode, runs all tasks now
--prune-run-state Delete unused timestamps in run_state.xml
"""
    default_action_note = None
    if program_name == 'start':
        default_action_note = "Based on the invocation name as `start', the default action is --enable."
    elif program_name == 'stop':
        default_action_note = "Based on the invocation name as `stop', the default action is --disable."
    if default_action_note is not None:
        print >>sys.stderr, default_action_note
    sys.exit(1)
|
|
|
|
|
2003-06-14 21:40:04 +00:00
|
|
|
# Directory containing this script; the default file locations below are
# taken relative to it.
program_path = os.path.realpath(os.path.dirname(sys.argv[0]))
# Default config file; can be overridden with --config-file=
config_filename = os.path.realpath(os.path.join(program_path, '../config.xml'))
# Default run-state file is per host; can be overridden with --run-state-file=
run_state_filename = os.path.realpath(os.path.join(program_path, '../run_state_'+local_hostname+'.xml'))

# Parse the command line.  Long options ending in '=' take a value.
try:
    opts, args = getopt.getopt(sys.argv[1:], 'cedskqvh?',
                               ('enable', 'cron', 'cron-tasks', 'disable',
                                'start', 'stop', 'kill', 'status',
                                'show-config',
                                'ignore-timestamps',
                                'fork-delay=',
                                'config-file=', 'run-state-file=',
                                'prune-run-state',
                                'quiet', 'verbose', 'help'))
except Exception, e:
    # Bad usage: report the problem, point at --help, exit with status 1.
    print >>sys.stderr, e
    print >>sys.stderr, "Use '%s --help' for help" % sys.argv[0]
    sys.exit(1)
|
|
|
|
# Apply the parsed options: each one either selects the command to run
# or adjusts one of the global settings.  A later command option
# overrides an earlier one.
for opt,v in opts:
    if opt in ('-q', '--quiet'):
        verbose = 0
    elif opt in ('-v', '--verbose'):
        verbose = 1
    elif opt in ('-h', '--help', '-?'):
        help()
    elif opt in ('-e', '--enable', '--start'):
        command = command_enable_start
    elif opt in ('-c', '--cron'):
        command = command_cron_start
    elif opt == '--cron-tasks':
        # getopt reports the full option name as declared ('cron-tasks'),
        # so that is the spelling that has to be matched here.
        command = command_tasks_start
    elif opt in ('-d', '--disable', '--stop', '-k', '--kill'):
        command = command_disable_stop
    elif opt in ('-s', '--status'):
        command = command_status
    elif opt == '--show-config':
        command = command_show_config
    elif opt == '--ignore-timestamps':
        ignore_timestamps = True
    elif opt == '--prune-run-state':
        prune_run_state = True
    elif opt == '--config-file':
        config_filename = v
    elif opt == '--run-state-file':
        run_state_filename = v
    elif opt == '--fork-delay':
        # The value arrives as text; fork() passes fork_delay to
        # time.sleep(), which needs a number.
        try:
            fork_delay = float(v)
        except ValueError:
            raise SystemExit('Invalid --fork-delay value "%s"' % v)
    else:
        # Every option accepted by getopt above must be handled here.
        raise AssertionError('unhandled option %s' % opt)
|
|
|
|
|
2003-06-14 21:40:00 +00:00
|
|
|
# Neither the invocation name nor an option selected a command.
if not command:
    raise SystemExit('No command specified and script name is not "start", "stop", or "status"')

config = configxml.ConfigFile(config_filename).read()
# NOTE(review): failopen_ok presumably tolerates a missing run-state file
# (e.g. on first run) -- confirm in configxml.
run_state = configxml.RunStateFile(run_state_filename).read(failopen_ok = True)

# Project directory: the configured project_dir, else the parent of the
# directory holding this script.  All further work happens from there.
project_dir = os.path.realpath(config.config.__dict__.get('project_dir') or
                               os.path.join(program_path, '../'))
os.chdir(project_dir)
bin_dir = get_dir('bin')
cgi_bin_dir = get_dir('cgi_bin')
# tmp, log and pid directories are per host and created if missing.
tmp_dir = ensure_get_dir('tmp_'+local_hostname)
log_dir = ensure_get_dir('log_'+local_hostname)
pid_dir = ensure_get_dir('pid_'+local_hostname)

is_main_host = config.config.host == local_hostname

# Take the per-host start lock; if it is already held, give up.
start_lockfile = os.path.join(pid_dir, 'start.lock.'+local_hostname)
if lock_file(start_lockfile):
    print >>sys.stderr, "start is currently running!"
    sys.exit(1)
|
|
|
|
|
2003-12-30 19:29:54 +00:00
|
|
|
assign_task_defaults()
|
2003-06-14 21:39:58 +00:00
|
|
|
apply(command)
|
|
|
|
run_state.write()
|
2003-12-06 19:42:21 +00:00
|
|
|
|
2004-01-13 02:47:34 +00:00
|
|
|
if is_main_host:
|
2004-06-14 11:19:07 +00:00
|
|
|
if delegate_other_hosts_in_parallel:
|
|
|
|
wait_mode = os.P_NOWAIT
|
|
|
|
else:
|
|
|
|
wait_mode = os.P_WAIT
|
|
|
|
|
2003-12-06 19:42:21 +00:00
|
|
|
other_hosts = get_host_list()
|
|
|
|
for host in other_hosts:
|
|
|
|
if host == local_hostname:
|
|
|
|
continue
|
2004-06-14 11:19:07 +00:00
|
|
|
remote_cmd = [ 'ssh', host, 'cd', cwd, ' && ' ] + sys.argv
|
2004-01-13 02:47:34 +00:00
|
|
|
if verbose:
|
2004-06-14 11:19:07 +00:00
|
|
|
remote_cmd += [ '-v' ]
|
|
|
|
print 'running ', ' '.join(remote_cmd)
|
|
|
|
os.spawnvp(wait_mode, remote_cmd[0], remote_cmd)
|
2003-12-06 19:42:21 +00:00
|
|
|
|
2003-06-14 21:39:58 +00:00
|
|
|
os.unlink(start_lockfile)
|