blob: e143fd1079beb004d39b8fc52b5aa9329129dce0 [file] [log] [blame]
mblighf1c52842007-10-16 15:21:38 +00001"""
2The main job wrapper for the server side.
3
4This is the core infrastructure. Derived from the client side job.py
5
6Copyright Martin J. Bligh, Andy Whitcroft 2007
7"""
8
9__author__ = """
10Martin J. Bligh <mbligh@google.com>
11Andy Whitcroft <apw@shadowen.org>
12"""
13
mblighdbdac6c2008-03-05 15:49:58 +000014import os, sys, re, time, select, subprocess, traceback
mblighf1c52842007-10-16 15:21:38 +000015
mbligh6437ff52008-04-17 15:24:38 +000016from autotest_lib.client.bin import fd_stack
mbligh302482e2008-05-01 20:06:16 +000017from autotest_lib.client.common_lib import error, logging
mbligh6437ff52008-04-17 15:24:38 +000018from autotest_lib.server import test, subcommand
19from autotest_lib.tko import db as tko_db, status_lib, utils as tko_utils
20from autotest_lib.server.utils import *
21
mbligh3f4bced2007-11-05 17:55:53 +000022
mblighed5a4102007-11-20 00:46:41 +000023# load up a control segment
24# these are all stored in <server_dir>/control_segments
25def load_control_segment(name):
26 server_dir = os.path.dirname(os.path.abspath(__file__))
mbligh7f86e0b2007-11-24 19:45:07 +000027 script_file = os.path.join(server_dir, "control_segments", name)
mblighed5a4102007-11-20 00:46:41 +000028 if os.path.exists(script_file):
29 return file(script_file).read()
30 else:
31 return ""
32
33
# Code prepended to every control segment before it is exec'd by this
# job: it imports the names control files expect, points the Autotest
# and SSHHost classes back at this job object, and (for multi-machine
# jobs) writes the machine list to a .machines file.
preamble = """\
import os, sys

from autotest_lib.server import hosts, autotest, kvm, git, standalone_profiler
from autotest_lib.server import source_kernel, rpm_kernel, deb_kernel
from autotest_lib.server import git_kernel
from autotest_lib.server.subcommand import *
from autotest_lib.server.utils import run, get_tmp_dir, sh_escape
from autotest_lib.server.utils import parse_machine
from autotest_lib.client.common_lib.error import *
from autotest_lib.client.common_lib import barrier

autotest.Autotest.job = job
hosts.SSHHost.job = job
barrier = barrier.barrier
if len(machines) > 1:
    open('.machines', 'w').write('\\n'.join(machines) + '\\n')
"""
52
# Server-side wrapper exec'd when the job was given a client-side
# control file: it pushes the client control file (bound to the
# 'control' variable) to each machine and runs it there via Autotest.
client_wrapper = """
at = autotest.Autotest()

def run_client(machine):
    hostname, user, password, port = parse_machine(machine,
        ssh_user, ssh_port, ssh_pass)

    host = hosts.SSHHost(hostname, user, port, password=password)
    at.run(control, host=host)

job.parallel_simple(run_client, machines)
"""
65
# Control segment that collects from each machine any crashdumps
# produced since test_start_time (bound into the exec namespace by
# run()).
crashdumps = """
def crashdumps(machine):
    hostname, user, password, port = parse_machine(machine,
        ssh_user, ssh_port, ssh_pass)

    host = hosts.SSHHost(hostname, user, port, initialize=False, \
        password=password)
    host.get_crashdumps(test_start_time)

job.parallel_simple(crashdumps, machines, log=False)
"""
77
# Control segment that reboots every machine; run after the job when
# run(reboot=True) was requested.
reboot_segment="""\
def reboot(machine):
    hostname, user, password, port = parse_machine(machine,
        ssh_user, ssh_port, ssh_pass)

    host = hosts.SSHHost(hostname, user, port, initialize=False, \
        password=password)
    host.reboot()

job.parallel_simple(reboot, machines, log=False)
"""
89
# Control segment that (re)installs the OS on every machine; used by
# run() for install_before/install_after.
install="""\
def install(machine):
    hostname, user, password, port = parse_machine(machine,
        ssh_user, ssh_port, ssh_pass)

    host = hosts.SSHHost(hostname, user, port, initialize=False, \
        password=password)
    host.machine_install()

job.parallel_simple(install, machines, log=False)
"""
101
# load up the verifier control segment, with an optional site-specific hook
# (the site_* segment runs first if present; missing segments load as "")
verify = load_control_segment("site_verify")
verify += load_control_segment("verify")

# load up the repair control segment, with an optional site-specific hook
repair = load_control_segment("site_repair")
repair += load_control_segment("repair")
109
mbligh1d42d4e2007-11-05 22:42:00 +0000110
# load up site-specific code for generating site-specific job data
try:
    import site_job
    get_site_job_data = site_job.get_site_job_data
    # drop the module reference; only the function is needed
    del site_job
except ImportError:
    # by default provide a stub that generates no site data
    def get_site_job_data(job):
        return {}
120
121
mblighcaa62c22008-04-07 21:51:17 +0000122class base_server_job:
mblighf1c52842007-10-16 15:21:38 +0000123 """The actual job against which we do everything.
124
125 Properties:
126 autodir
127 The top level autotest directory (/usr/local/autotest).
128 serverdir
129 <autodir>/server/
130 clientdir
131 <autodir>/client/
132 conmuxdir
133 <autodir>/conmux/
134 testdir
135 <autodir>/server/tests/
136 control
137 the control file for this job
138 """
139
jadmanski6e8bf752008-05-14 00:17:48 +0000140 STATUS_VERSION = 1
141
142
mblighe8b37a92007-12-19 15:54:11 +0000143 def __init__(self, control, args, resultdir, label, user, machines,
mbligh1965dfa2008-06-04 19:58:37 +0000144 client=False, parse_job="",
145 ssh_user='root', ssh_port=22, ssh_pass=''):
mblighf1c52842007-10-16 15:21:38 +0000146 """
147 control
148 The control file (pathname of)
149 args
150 args to pass to the control file
151 resultdir
152 where to throw the results
mbligh18420c22007-10-16 22:27:14 +0000153 label
154 label for the job
mblighf1c52842007-10-16 15:21:38 +0000155 user
156 Username for the job (email address)
157 client
158 True if a client-side control file
159 """
mblighf5427bb2008-04-09 15:55:57 +0000160 path = os.path.dirname(__file__)
mblighf1c52842007-10-16 15:21:38 +0000161 self.autodir = os.path.abspath(os.path.join(path, '..'))
162 self.serverdir = os.path.join(self.autodir, 'server')
mbligh05269362007-10-16 16:58:11 +0000163 self.testdir = os.path.join(self.serverdir, 'tests')
164 self.tmpdir = os.path.join(self.serverdir, 'tmp')
mblighf1c52842007-10-16 15:21:38 +0000165 self.conmuxdir = os.path.join(self.autodir, 'conmux')
166 self.clientdir = os.path.join(self.autodir, 'client')
mblighe25fd5b2008-01-22 17:23:37 +0000167 if control:
168 self.control = open(control, 'r').read()
169 self.control = re.sub('\r', '', self.control)
170 else:
171 self.control = None
mblighf1c52842007-10-16 15:21:38 +0000172 self.resultdir = resultdir
173 if not os.path.exists(resultdir):
174 os.mkdir(resultdir)
mbligh3ccb8592007-11-05 18:13:40 +0000175 self.debugdir = os.path.join(resultdir, 'debug')
176 if not os.path.exists(self.debugdir):
177 os.mkdir(self.debugdir)
mbligh3dcf2c92007-10-16 22:24:00 +0000178 self.status = os.path.join(resultdir, 'status')
mbligh18420c22007-10-16 22:27:14 +0000179 self.label = label
mblighf1c52842007-10-16 15:21:38 +0000180 self.user = user
181 self.args = args
mblighe8b37a92007-12-19 15:54:11 +0000182 self.machines = machines
mblighf1c52842007-10-16 15:21:38 +0000183 self.client = client
184 self.record_prefix = ''
mblighf4e04152008-02-21 16:05:53 +0000185 self.warning_loggers = set()
mbligh1965dfa2008-06-04 19:58:37 +0000186 self.ssh_user = ssh_user
187 self.ssh_port = ssh_port
188 self.ssh_pass = ssh_pass
mblighf1c52842007-10-16 15:21:38 +0000189
mbligh3f4bced2007-11-05 17:55:53 +0000190 self.stdout = fd_stack.fd_stack(1, sys.stdout)
191 self.stderr = fd_stack.fd_stack(2, sys.stderr)
192
mbligh3dcf2c92007-10-16 22:24:00 +0000193 if os.path.exists(self.status):
194 os.unlink(self.status)
jadmanski6e8bf752008-05-14 00:17:48 +0000195 job_data = {'label' : label, 'user' : user,
196 'hostname' : ','.join(machines),
197 'status_version' : str(self.STATUS_VERSION)}
mbligh970b94e2008-01-24 16:29:34 +0000198 job_data.update(get_site_job_data(self))
mblighf1c52842007-10-16 15:21:38 +0000199 write_keyval(self.resultdir, job_data)
200
mbligh6437ff52008-04-17 15:24:38 +0000201 self.parse_job = parse_job
202 if self.parse_job and len(machines) == 1:
203 self.using_parser = True
204 self.init_parser(resultdir)
205 else:
206 self.using_parser = False
207
208
209 def init_parser(self, resultdir):
210 """Start the continuous parsing of resultdir. This sets up
211 the database connection and inserts the basic job object into
212 the database if necessary."""
213 # redirect parser debugging to .parse.log
214 parse_log = os.path.join(resultdir, '.parse.log')
215 parse_log = open(parse_log, 'w', 0)
216 tko_utils.redirect_parser_debugging(parse_log)
217 # create a job model object and set up the db
218 self.results_db = tko_db.db(autocommit=True)
jadmanski6e8bf752008-05-14 00:17:48 +0000219 self.parser = status_lib.parser(self.STATUS_VERSION)
mbligh6437ff52008-04-17 15:24:38 +0000220 self.job_model = self.parser.make_job(resultdir)
221 self.parser.start(self.job_model)
222 # check if a job already exists in the db and insert it if
223 # it does not
224 job_idx = self.results_db.find_job(self.parse_job)
225 if job_idx is None:
226 self.results_db.insert_job(self.parse_job,
227 self.job_model)
228 else:
229 machine_idx = self.results_db.lookup_machine(
230 self.job_model.machine)
231 self.job_model.index = job_idx
232 self.job_model.machine_idx = machine_idx
233
234
mblighfe0af112008-04-17 15:27:47 +0000235 def cleanup_parser(self):
mbligh6437ff52008-04-17 15:24:38 +0000236 """This should be called after the server job is finished
237 to carry out any remaining cleanup (e.g. flushing any
238 remaining test results to the results db)"""
239 if not self.using_parser:
240 return
241 final_tests = self.parser.end()
242 for test in final_tests:
jadmanski28816c22008-05-21 18:18:05 +0000243 self.__insert_test(test)
mblighfe0af112008-04-17 15:27:47 +0000244 self.using_parser = False
mbligh6437ff52008-04-17 15:24:38 +0000245
mblighf1c52842007-10-16 15:21:38 +0000246
mblighe25fd5b2008-01-22 17:23:37 +0000247 def verify(self):
248 if not self.machines:
mbligh6437ff52008-04-17 15:24:38 +0000249 raise error.AutoservError(
250 'No machines specified to verify')
mblighe25fd5b2008-01-22 17:23:37 +0000251 try:
mbligh1965dfa2008-06-04 19:58:37 +0000252 namespace = {'machines' : self.machines, 'job' : self, \
253 'ssh_user' : self.ssh_user, 'ssh_port' : ssh_port, \
254 'ssh_pass' : ssh_pass}
mblighe25fd5b2008-01-22 17:23:37 +0000255 exec(preamble + verify, namespace, namespace)
256 except Exception, e:
mbligh302482e2008-05-01 20:06:16 +0000257 msg = ('Verify failed\n' + str(e) + '\n'
258 + traceback.format_exc())
mblighe25fd5b2008-01-22 17:23:37 +0000259 self.record('ABORT', None, None, msg)
260 raise
261
262
263 def repair(self):
264 if not self.machines:
mbligh6437ff52008-04-17 15:24:38 +0000265 raise error.AutoservError(
266 'No machines specified to repair')
mbligh1965dfa2008-06-04 19:58:37 +0000267 namespace = {'machines' : self.machines, 'job' : self, \
268 'ssh_user' : self.ssh_user, 'ssh_port' : ssh_port, \
269 'ssh_pass' : ssh_pass}
mbligh16c722d2008-03-05 00:58:44 +0000270 # no matter what happens during repair, go on to try to reverify
271 try:
272 exec(preamble + repair, namespace, namespace)
273 except Exception, exc:
274 print 'Exception occured during repair'
275 traceback.print_exc()
mbligh8141f862008-01-25 17:20:40 +0000276 self.verify()
mblighe25fd5b2008-01-22 17:23:37 +0000277
278
mblighcaa62c22008-04-07 21:51:17 +0000279 def enable_external_logging(self):
280 """Start or restart external logging mechanism.
281 """
282 pass
283
284
285 def disable_external_logging(self):
286 """ Pause or stop external logging mechanism.
287 """
288 pass
289
290
291 def use_external_logging(self):
292 """Return True if external logging should be used.
293 """
294 return False
295
296
mbligh6437ff52008-04-17 15:24:38 +0000297 def parallel_simple(self, function, machines, log=True, timeout=None):
298 """Run 'function' using parallel_simple, with an extra
299 wrapper to handle the necessary setup for continuous parsing,
300 if possible. If continuous parsing is already properly
301 initialized then this should just work."""
302 is_forking = not (len(machines) == 1 and
303 self.machines == machines)
304 if self.parse_job and is_forking:
305 def wrapper(machine):
306 self.parse_job += "/" + machine
307 self.using_parser = True
308 self.machines = [machine]
309 self.resultdir = os.path.join(self.resultdir,
310 machine)
311 self.init_parser(self.resultdir)
312 result = function(machine)
mblighfe0af112008-04-17 15:27:47 +0000313 self.cleanup_parser()
mbligh6437ff52008-04-17 15:24:38 +0000314 return result
315 else:
316 wrapper = function
317 subcommand.parallel_simple(wrapper, machines, log, timeout)
318
319
mblighe8b37a92007-12-19 15:54:11 +0000320 def run(self, reboot = False, install_before = False,
mblighddd54332008-03-07 18:14:06 +0000321 install_after = False, collect_crashdumps = True,
322 namespace = {}):
mbligh60dbd502007-10-26 14:59:31 +0000323 # use a copy so changes don't affect the original dictionary
324 namespace = namespace.copy()
mblighe8b37a92007-12-19 15:54:11 +0000325 machines = self.machines
mbligh60dbd502007-10-26 14:59:31 +0000326
mblighfaf0cd42007-11-19 16:00:24 +0000327 self.aborted = False
mblighf1c52842007-10-16 15:21:38 +0000328 namespace['machines'] = machines
329 namespace['args'] = self.args
330 namespace['job'] = self
mbligh1965dfa2008-06-04 19:58:37 +0000331 namespace['ssh_user'] = self.ssh_user
332 namespace['ssh_port'] = self.ssh_port
333 namespace['ssh_pass'] = self.ssh_pass
mbligh6e294382007-11-05 18:11:29 +0000334 test_start_time = int(time.time())
mblighf1c52842007-10-16 15:21:38 +0000335
mbligh87c5d882007-10-29 17:07:24 +0000336 os.chdir(self.resultdir)
mblighcaa62c22008-04-07 21:51:17 +0000337
338 self.enable_external_logging()
mbligh87c5d882007-10-29 17:07:24 +0000339 status_log = os.path.join(self.resultdir, 'status.log')
mblighf1c52842007-10-16 15:21:38 +0000340 try:
mblighf36243d2007-10-30 15:36:16 +0000341 if install_before and machines:
342 exec(preamble + install, namespace, namespace)
mblighf1c52842007-10-16 15:21:38 +0000343 if self.client:
344 namespace['control'] = self.control
345 open('control', 'w').write(self.control)
346 open('control.srv', 'w').write(client_wrapper)
347 server_control = client_wrapper
348 else:
349 open('control.srv', 'w').write(self.control)
350 server_control = self.control
mblighf1c52842007-10-16 15:21:38 +0000351 exec(preamble + server_control, namespace, namespace)
352
353 finally:
mblighddd54332008-03-07 18:14:06 +0000354 if machines and collect_crashdumps:
mbligh6e294382007-11-05 18:11:29 +0000355 namespace['test_start_time'] = test_start_time
mbligh98ff1462007-12-19 16:27:55 +0000356 exec(preamble + crashdumps,
357 namespace, namespace)
mblighcaa62c22008-04-07 21:51:17 +0000358 self.disable_external_logging()
mblighf1c52842007-10-16 15:21:38 +0000359 if reboot and machines:
mbligh98ff1462007-12-19 16:27:55 +0000360 exec(preamble + reboot_segment,
361 namespace, namespace)
mblighf36243d2007-10-30 15:36:16 +0000362 if install_after and machines:
363 exec(preamble + install, namespace, namespace)
mblighf1c52842007-10-16 15:21:38 +0000364
365
366 def run_test(self, url, *args, **dargs):
367 """Summon a test object and run it.
368
369 tag
370 tag to add to testname
371 url
372 url of the test to run
373 """
374
mblighf1c52842007-10-16 15:21:38 +0000375 (group, testname) = test.testname(url)
376 tag = None
377 subdir = testname
mbligh43ac5222007-10-16 15:55:01 +0000378
mblighf1c52842007-10-16 15:21:38 +0000379 if dargs.has_key('tag'):
380 tag = dargs['tag']
381 del dargs['tag']
382 if tag:
383 subdir += '.' + tag
mblighf1c52842007-10-16 15:21:38 +0000384
mblighd660afe2008-06-05 22:17:53 +0000385 outputdir = os.path.join(self.resultdir, subdir)
386 if os.path.exists(outputdir):
387 msg = ("%s already exists, test <%s> may have"
388 " already run with tag <%s>"
389 % (outputdir, testname, tag) )
390 raise error.TestError(msg)
391 os.mkdir(outputdir)
392
mbligh43ac5222007-10-16 15:55:01 +0000393 try:
394 test.runtest(self, url, tag, args, dargs)
395 self.record('GOOD', subdir, testname, 'completed successfully')
mbligh302482e2008-05-01 20:06:16 +0000396 except error.TestNAError, detail:
mblighd660afe2008-06-05 22:17:53 +0000397 self.record('TEST_NA', subdir, testname, str(detail))
mbligh43ac5222007-10-16 15:55:01 +0000398 except Exception, detail:
mbligh302482e2008-05-01 20:06:16 +0000399 info = str(detail) + "\n" + traceback.format_exc()
400 self.record('FAIL', subdir, testname, info)
mblighf1c52842007-10-16 15:21:38 +0000401
402
403 def run_group(self, function, *args, **dargs):
404 """\
405 function:
406 subroutine to run
407 *args:
408 arguments for the function
409 """
410
411 result = None
412 name = function.__name__
413
414 # Allow the tag for the group to be specified.
415 if dargs.has_key('tag'):
416 tag = dargs['tag']
417 del dargs['tag']
418 if tag:
419 name = tag
420
mblighf1c52842007-10-16 15:21:38 +0000421 old_record_prefix = self.record_prefix
422 try:
423 try:
424 self.record('START', None, name)
425 self.record_prefix += '\t'
426 result = function(*args, **dargs)
jadmanski0c109552008-06-02 18:02:29 +0000427 except Exception, e:
mblighf1c52842007-10-16 15:21:38 +0000428 self.record_prefix = old_record_prefix
jadmanski0c109552008-06-02 18:02:29 +0000429 err_msg = str(e) + '\n'
430 err_msg += traceback.format_exc()
431 self.record('END FAIL', None, name, err_msg)
jadmanskif35bbb62008-05-29 21:36:04 +0000432 else:
433 self.record_prefix = old_record_prefix
434 self.record('END GOOD', None, name)
mbligh302482e2008-05-01 20:06:16 +0000435
mblighf1c52842007-10-16 15:21:38 +0000436 # We don't want to raise up an error higher if it's just
437 # a TestError - we want to carry on to other tests. Hence
438 # this outer try/except block.
mbligh6437ff52008-04-17 15:24:38 +0000439 except error.TestError:
mblighf1c52842007-10-16 15:21:38 +0000440 pass
441 except:
mbligh6437ff52008-04-17 15:24:38 +0000442 raise error.TestError(name + ' failed\n' +
mbligh0a1727a2008-04-21 18:10:07 +0000443 traceback.format_exc())
mblighf1c52842007-10-16 15:21:38 +0000444
445 return result
446
447
jadmanskif35bbb62008-05-29 21:36:04 +0000448 def run_reboot(self, reboot_func, get_kernel_func):
449 """\
450 A specialization of run_group meant specifically for handling
451 a reboot. Includes support for capturing the kernel version
452 after the reboot.
453
454 reboot_func: a function that carries out the reboot
455
456 get_kernel_func: a function that returns a string
457 representing the kernel version.
458 """
459
460 old_record_prefix = self.record_prefix
461 try:
462 self.record('START', None, 'reboot')
463 self.record_prefix += '\t'
464 reboot_func()
jadmanski0c109552008-06-02 18:02:29 +0000465 except Exception, e:
jadmanskif35bbb62008-05-29 21:36:04 +0000466 self.record_prefix = old_record_prefix
jadmanski0c109552008-06-02 18:02:29 +0000467 err_msg = str(e) + '\n' + traceback.format_exc()
468 self.record('END FAIL', None, 'reboot', err_msg)
jadmanskif35bbb62008-05-29 21:36:04 +0000469 else:
470 kernel = get_kernel_func()
471 self.record_prefix = old_record_prefix
472 self.record('END GOOD', None, 'reboot',
473 optional_fields={"kernel": kernel})
474
475
476 def record(self, status_code, subdir, operation, status='',
477 optional_fields=None):
mblighf1c52842007-10-16 15:21:38 +0000478 """
479 Record job-level status
480
481 The intent is to make this file both machine parseable and
482 human readable. That involves a little more complexity, but
483 really isn't all that bad ;-)
484
485 Format is <status code>\t<subdir>\t<operation>\t<status>
486
mbligh302482e2008-05-01 20:06:16 +0000487 status code: see common_lib.logging.is_valid_status()
488 for valid status definition
mblighf1c52842007-10-16 15:21:38 +0000489
490 subdir: MUST be a relevant subdirectory in the results,
491 or None, which will be represented as '----'
492
493 operation: description of what you ran (e.g. "dbench", or
494 "mkfs -t foobar /dev/sda9")
495
496 status: error message or "completed sucessfully"
497
498 ------------------------------------------------------------
499
500 Initial tabs indicate indent levels for grouping, and is
501 governed by self.record_prefix
502
503 multiline messages have secondary lines prefaced by a double
504 space (' ')
mblighf4e04152008-02-21 16:05:53 +0000505
506 Executing this method will trigger the logging of all new
507 warnings to date from the various console loggers.
508 """
mblighdab39662008-02-27 16:47:55 +0000509 # poll all our warning loggers for new warnings
510 warnings = self._read_warnings()
511 for timestamp, msg in warnings:
512 self.__record("WARN", None, None, msg, timestamp)
513
514 # write out the actual status log line
jadmanskif35bbb62008-05-29 21:36:04 +0000515 self.__record(status_code, subdir, operation, status,
516 optional_fields=optional_fields)
mblighdab39662008-02-27 16:47:55 +0000517
518
519 def _read_warnings(self):
mblighf4e04152008-02-21 16:05:53 +0000520 warnings = []
521 while True:
522 # pull in a line of output from every logger that has
523 # output ready to be read
524 loggers, _, _ = select.select(self.warning_loggers,
525 [], [], 0)
526 closed_loggers = set()
527 for logger in loggers:
528 line = logger.readline()
529 # record any broken pipes (aka line == empty)
530 if len(line) == 0:
531 closed_loggers.add(logger)
532 continue
533 timestamp, msg = line.split('\t', 1)
534 warnings.append((int(timestamp), msg.strip()))
535
536 # stop listening to loggers that are closed
537 self.warning_loggers -= closed_loggers
538
539 # stop if none of the loggers have any output left
540 if not loggers:
541 break
542
mblighdab39662008-02-27 16:47:55 +0000543 # sort into timestamp order
544 warnings.sort()
545 return warnings
mblighf4e04152008-02-21 16:05:53 +0000546
547
mblighdab39662008-02-27 16:47:55 +0000548 def _render_record(self, status_code, subdir, operation, status='',
jadmanskif35bbb62008-05-29 21:36:04 +0000549 epoch_time=None, record_prefix=None,
550 optional_fields=None):
mblighf4e04152008-02-21 16:05:53 +0000551 """
mblighdab39662008-02-27 16:47:55 +0000552 Internal Function to generate a record to be written into a
553 status log. For use by server_job.* classes only.
mblighf1c52842007-10-16 15:21:38 +0000554 """
mblighf1c52842007-10-16 15:21:38 +0000555 if subdir:
556 if re.match(r'[\n\t]', subdir):
mbligh6437ff52008-04-17 15:24:38 +0000557 raise ValueError(
558 'Invalid character in subdir string')
mblighf1c52842007-10-16 15:21:38 +0000559 substr = subdir
560 else:
561 substr = '----'
mbligh6437ff52008-04-17 15:24:38 +0000562
mbligh302482e2008-05-01 20:06:16 +0000563 if not logging.is_valid_status(status_code):
mbligh6437ff52008-04-17 15:24:38 +0000564 raise ValueError('Invalid status code supplied: %s' %
565 status_code)
mblighe25fd5b2008-01-22 17:23:37 +0000566 if not operation:
567 operation = '----'
mblighf1c52842007-10-16 15:21:38 +0000568 if re.match(r'[\n\t]', operation):
mbligh6437ff52008-04-17 15:24:38 +0000569 raise ValueError(
570 'Invalid character in operation string')
mblighf1c52842007-10-16 15:21:38 +0000571 operation = operation.rstrip()
572 status = status.rstrip()
573 status = re.sub(r"\t", " ", status)
574 # Ensure any continuation lines are marked so we can
575 # detect them in the status file to ensure it is parsable.
576 status = re.sub(r"\n", "\n" + self.record_prefix + " ", status)
577
jadmanskif35bbb62008-05-29 21:36:04 +0000578 if not optional_fields:
579 optional_fields = {}
580
mbligh30270302007-11-05 20:33:52 +0000581 # Generate timestamps for inclusion in the logs
mblighf4e04152008-02-21 16:05:53 +0000582 if epoch_time is None:
583 epoch_time = int(time.time())
mbligh30270302007-11-05 20:33:52 +0000584 local_time = time.localtime(epoch_time)
jadmanskif35bbb62008-05-29 21:36:04 +0000585 optional_fields["timestamp"] = str(epoch_time)
586 optional_fields["localtime"] = time.strftime("%b %d %H:%M:%S",
587 local_time)
588
589 fields = [status_code, substr, operation]
590 fields += ["%s=%s" % x for x in optional_fields.iteritems()]
591 fields.append(status)
mbligh30270302007-11-05 20:33:52 +0000592
mblighdab39662008-02-27 16:47:55 +0000593 if record_prefix is None:
594 record_prefix = self.record_prefix
595
jadmanskif35bbb62008-05-29 21:36:04 +0000596 msg = '\t'.join(str(x) for x in fields)
597
mblighdab39662008-02-27 16:47:55 +0000598 return record_prefix + msg + '\n'
599
600
601 def _record_prerendered(self, msg):
602 """
603 Record a pre-rendered msg into the status logs. The only
604 change this makes to the message is to add on the local
605 indentation. Should not be called outside of server_job.*
606 classes. Unlike __record, this does not write the message
607 to standard output.
608 """
mbligh6437ff52008-04-17 15:24:38 +0000609 lines = []
mblighdab39662008-02-27 16:47:55 +0000610 status_file = os.path.join(self.resultdir, 'status.log')
611 status_log = open(status_file, 'a')
612 for line in msg.splitlines():
613 line = self.record_prefix + line + '\n'
mbligh6437ff52008-04-17 15:24:38 +0000614 lines.append(line)
mblighdab39662008-02-27 16:47:55 +0000615 status_log.write(line)
616 status_log.close()
mbligh6437ff52008-04-17 15:24:38 +0000617 self.__parse_status(lines)
mblighdab39662008-02-27 16:47:55 +0000618
619
620 def __record(self, status_code, subdir, operation, status='',
jadmanskif35bbb62008-05-29 21:36:04 +0000621 epoch_time=None, optional_fields=None):
mblighdab39662008-02-27 16:47:55 +0000622 """
623 Actual function for recording a single line into the status
624 logs. Should never be called directly, only by job.record as
625 this would bypass the console monitor logging.
626 """
627
628 msg = self._render_record(status_code, subdir, operation,
jadmanskif35bbb62008-05-29 21:36:04 +0000629 status, epoch_time,
630 optional_fields=optional_fields)
mblighdab39662008-02-27 16:47:55 +0000631
mblighf1c52842007-10-16 15:21:38 +0000632
mbligh31a49de2007-11-05 18:41:19 +0000633 status_file = os.path.join(self.resultdir, 'status.log')
mblighdab39662008-02-27 16:47:55 +0000634 sys.stdout.write(msg)
635 open(status_file, "a").write(msg)
mblighf1c52842007-10-16 15:21:38 +0000636 if subdir:
mblighd56eb592008-01-22 16:36:34 +0000637 test_dir = os.path.join(self.resultdir, subdir)
mblighd56eb592008-01-22 16:36:34 +0000638 status_file = os.path.join(test_dir, 'status')
mblighdab39662008-02-27 16:47:55 +0000639 open(status_file, "a").write(msg)
jadmanski96bb7642008-05-15 17:58:16 +0000640 self.__parse_status(msg.splitlines())
mblighb03ba642008-03-13 17:37:17 +0000641
642
mbligh6437ff52008-04-17 15:24:38 +0000643 def __parse_status(self, new_lines):
644 if not self.using_parser:
645 return
646 new_tests = self.parser.process_lines(new_lines)
647 for test in new_tests:
jadmanski28816c22008-05-21 18:18:05 +0000648 self.__insert_test(test)
649
650
651 def __insert_test(self, test):
652 """ An internal method to insert a new test result into the
653 database. This method will not raise an exception, even if an
654 error occurs during the insert, to avoid failing a test
655 simply because of unexpected database issues."""
656 try:
mbligh6437ff52008-04-17 15:24:38 +0000657 self.results_db.insert_test(self.job_model, test)
jadmanski28816c22008-05-21 18:18:05 +0000658 except Exception:
659 msg = ("WARNING: An unexpected error occured while "
660 "inserting test results into the database. "
661 "Ignoring error.\n" + traceback.format_exc())
662 print >> sys.stderr, msg
mblighdab39662008-02-27 16:47:55 +0000663
664
# a file-like object for catching stderr from an autotest client and
# extracting status logs from it
class client_logger(object):
    """Partial file object to write to both stdout and
    the status log file. We only implement those methods
    utils.run() actually calls.
    """
    # client-quoted status lines look like "AUTOTEST_STATUS:<tag>:<line>"
    parser = re.compile(r"^AUTOTEST_STATUS:([^:]*):(.*)$")
    # captures the leading run of tabs (the indent level) of a line
    extract_indent = re.compile(r"^(\t*).*$")

    def __init__(self, job):
        self.job = job
        # trailing partial line left over from the previous write()
        self.leftover = ""
        # the last complete line pushed out (used to indent warnings)
        self.last_line = ""
        # nested dict of buffered log lines keyed by numeric tag parts,
        # with the actual lines stored under the "logs" key at each level
        self.logs = {}


    def _process_log_dict(self, log_dict):
        """Flatten a (possibly nested) log dict into one ordered list
        of lines, emptying the dict as it goes."""
        log_list = log_dict.pop("logs", [])
        for key in sorted(log_dict.iterkeys()):
            log_list += self._process_log_dict(log_dict.pop(key))
        return log_list


    def _process_logs(self):
        """Go through the accumulated logs in self.log and print them
        out to stdout and the status log. Note that this processes
        logs in an ordering where:

        1) logs to different tags are never interleaved
        2) logs to x.y come before logs to x.y.z for all z
        3) logs to x.y come before x.z whenever y < z

        Note that this will in general not be the same as the
        chronological ordering of the logs. However, if a chronological
        ordering is desired that one can be reconstructed from the
        status log by looking at timestamp lines."""
        log_list = self._process_log_dict(self.logs)
        for line in log_list:
            self.job._record_prerendered(line + '\n')
        if log_list:
            self.last_line = log_list[-1]


    def _process_quoted_line(self, tag, line):
        """Process a line quoted with an AUTOTEST_STATUS flag. If the
        tag is blank then we want to push out all the data we've been
        building up in self.logs, and then the newest line. If the
        tag is not blank, then push the line into the logs for handling
        later."""
        print line
        if tag == "":
            self._process_logs()
            self.job._record_prerendered(line + '\n')
            self.last_line = line
        else:
            # descend/create the nested dict level for each tag part
            tag_parts = [int(x) for x in tag.split(".")]
            log_dict = self.logs
            for part in tag_parts:
                log_dict = log_dict.setdefault(part, {})
            log_list = log_dict.setdefault("logs", [])
            log_list.append(line)


    def _process_line(self, line):
        """Write out a line of data to the appropriate stream. Status
        lines sent by autotest will be prepended with
        "AUTOTEST_STATUS", and all other lines are ssh error
        messages."""
        match = self.parser.search(line)
        if match:
            tag, line = match.groups()
            self._process_quoted_line(tag, line)
        else:
            print line


    def _format_warnings(self, last_line, warnings):
        """Render (timestamp, msg) warning tuples as WARN status lines
        indented to match last_line."""
        # use the indentation of whatever the last log line was
        indent = self.extract_indent.match(last_line).group(1)
        # if the last line starts a new group, add an extra indent
        if last_line.lstrip('\t').startswith("START\t"):
            indent += '\t'
        return [self.job._render_record("WARN", None, None, msg,
                                        timestamp, indent).rstrip('\n')
                for timestamp, msg in warnings]


    def _process_warnings(self, last_line, log_dict, warnings):
        """Insert rendered warnings at the deepest appropriate level(s)
        of the buffered log tree."""
        if log_dict.keys() in ([], ["logs"]):
            # there are no sub-jobs, just append the warnings here
            warnings = self._format_warnings(last_line, warnings)
            log_list = log_dict.setdefault("logs", [])
            log_list += warnings
            for warning in warnings:
                sys.stdout.write(warning + '\n')
        else:
            # there are sub-jobs, so put the warnings in there
            log_list = log_dict.get("logs", [])
            if log_list:
                last_line = log_list[-1]
            for key in sorted(log_dict.iterkeys()):
                if key != "logs":
                    self._process_warnings(last_line,
                                           log_dict[key],
                                           warnings)


    def write(self, data):
        # first check for any new console warnings
        warnings = self.job._read_warnings()
        self._process_warnings(self.last_line, self.logs, warnings)
        # now process the newest data written out
        data = self.leftover + data
        lines = data.split("\n")
        # process every line but the last one
        for line in lines[:-1]:
            self._process_line(line)
        # save the last line for later processing
        # since we may not have the whole line yet
        self.leftover = lines[-1]


    def flush(self):
        sys.stdout.flush()


    def close(self):
        # flush any remaining partial line and all buffered logs
        if self.leftover:
            self._process_line(self.leftover)
        self._process_logs()
        self.flush()
mblighcaa62c22008-04-07 21:51:17 +0000797
# site_server_job.py may be non-existent or empty, make sure that an
# appropriate site_server_job class is created nevertheless
try:
    from autotest_lib.server.site_server_job import site_server_job
except ImportError:
    # no site customization available: fall back to the stock job class
    class site_server_job(base_server_job):
        pass

# the class the rest of the code instantiates; picks up site hooks if any
class server_job(site_server_job):
    pass