"""The main job wrapper

This is the core infrastructure.
"""

__author__ = """Copyright Andy Whitcroft, Martin J. Bligh 2006"""

# standard stuff
import os, sys, re, pickle, shutil, time, traceback, types, copy

# autotest stuff
from autotest_lib.client.bin import autotest_utils
from autotest_lib.client.common_lib import error, barrier, logging

import parallel, kernel, xen, test, profilers, filesystem, fd_stack, boottool
import harness, config, sysinfo, cpuset


JOB_PREAMBLE = """
from common.error import *
from autotest_utils import *
"""


class StepError(error.AutotestError):
    pass

class base_job:
    """The actual job against which we do everything.

    Properties:
        autodir
            The top level autotest directory (/usr/local/autotest).
            Comes from os.environ['AUTODIR'].
        bindir
            <autodir>/bin/
        libdir
            <autodir>/lib/
        testdir
            <autodir>/tests/
        site_testdir
            <autodir>/site_tests/
        profdir
            <autodir>/profilers/
        tmpdir
            <autodir>/tmp/
        resultdir
            <autodir>/results/<jobtag>
        stdout
            fd_stack object for stdout
        stderr
            fd_stack object for stderr
        profilers
            the profilers object for this job
        harness
            the server harness object for this job
        config
            the job configuration for this job
    """

    DEFAULT_LOG_FILENAME = "status"

    def __init__(self, control, jobtag, cont, harness_type=None,
                 use_external_logging=False):
        """
        control
            The control file (pathname of)
        jobtag
            The job tag string (eg "default")
        cont
            If this is the continuation of this job
        harness_type
            An alternative server harness
        """
        self.autodir = os.environ['AUTODIR']
        self.bindir = os.path.join(self.autodir, 'bin')
        self.libdir = os.path.join(self.autodir, 'lib')
        self.testdir = os.path.join(self.autodir, 'tests')
        self.site_testdir = os.path.join(self.autodir, 'site_tests')
        self.profdir = os.path.join(self.autodir, 'profilers')
        self.tmpdir = os.path.join(self.autodir, 'tmp')
        self.resultdir = os.path.join(self.autodir, 'results', jobtag)
        self.sysinfodir = os.path.join(self.resultdir, 'sysinfo')
        self.control = os.path.abspath(control)
        self.state_file = self.control + '.state'
        self.current_step_ancestry = []
        self.__load_state()

        if not cont:
            # Don't cleanup the tmp dir (which contains the lockfile)
            # in the constructor, this would be a problem for multiple
            # jobs starting at the same time on the same client. Instead
            # do the delete at the server side. We simply create the tmp
            # directory here if it does not already exist.
            if not os.path.exists(self.tmpdir):
                os.mkdir(self.tmpdir)

            results = os.path.join(self.autodir, 'results')
            if not os.path.exists(results):
                os.mkdir(results)

            download = os.path.join(self.testdir, 'download')
            if not os.path.exists(download):
                os.mkdir(download)

            if os.path.exists(self.resultdir):
                autotest_utils.system('rm -rf ' + self.resultdir)
            os.mkdir(self.resultdir)
            os.mkdir(self.sysinfodir)

            os.mkdir(os.path.join(self.resultdir, 'debug'))
            os.mkdir(os.path.join(self.resultdir, 'analysis'))

            shutil.copyfile(self.control,
                            os.path.join(self.resultdir, 'control'))

        self.control = control
        self.jobtag = jobtag
        self.log_filename = self.DEFAULT_LOG_FILENAME
        self.container = None

        self.stdout = fd_stack.fd_stack(1, sys.stdout)
        self.stderr = fd_stack.fd_stack(2, sys.stderr)

        self._init_group_level()

        self.config = config.config(self)

        self.harness = harness.select(harness_type, self)

        self.profilers = profilers.profilers(self)

        try:
            tool = self.config_get('boottool.executable')
            self.bootloader = boottool.boottool(tool)
        except:
            pass

        sysinfo.log_per_reboot_data(self.sysinfodir)

        if not cont:
            self.record('START', None, None)
            self._increment_group_level()

        self.harness.run_start()

        if use_external_logging:
            self.enable_external_logging()

        # load the max disk usage rate - default to no monitoring
        self.max_disk_usage_rate = self.get_state('__monitor_disk',
                                                  default=0.0)

    def monitor_disk_usage(self, max_rate):
        """\
        Signal that the job should monitor disk space usage on /
        and generate a warning if a test uses up disk space at a
        rate exceeding 'max_rate'.

        Parameters:
             max_rate - the maximum allowed rate of disk consumption
                        during a test, in MB/hour, or 0 to indicate
                        no limit.
        """
        self.set_state('__monitor_disk', max_rate)
        self.max_disk_usage_rate = max_rate
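
    # Usage sketch (hypothetical control-file snippet; the 100 MB/hour
    # threshold is illustrative only):
    #
    #     job.monitor_disk_usage(100)  # warn above 100 MB/hour on /
    #     job.run_test('kernbench')    # a WARN line is recorded on violation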


    def relative_path(self, path):
        """\
        Return a path relative to the job results directory
        """
        head = len(self.resultdir) + 1     # remove the / in between
        return path[head:]


    def control_get(self):
        return self.control


    def control_set(self, control):
        self.control = os.path.abspath(control)


    def harness_select(self, which):
        self.harness = harness.select(which, self)


    def config_set(self, name, value):
        self.config.set(name, value)


    def config_get(self, name):
        return self.config.get(name)

    def setup_dirs(self, results_dir, tmp_dir):
        if not tmp_dir:
            tmp_dir = os.path.join(self.tmpdir, 'build')
        if not os.path.exists(tmp_dir):
            os.mkdir(tmp_dir)
        if not os.path.isdir(tmp_dir):
            e_msg = "Temp dir (%s) is not a dir - args backwards?" % tmp_dir
            raise ValueError(e_msg)

        # We label the first build "build" and then subsequent ones
        # as "build.2", "build.3", etc. Whilst this is a little bit
        # inconsistent, 99.9% of jobs will only have one build
        # (that's not done as kernbench, sparse, or buildtest),
        # so it works out much cleaner. One of life's compromises.
        if not results_dir:
            results_dir = os.path.join(self.resultdir, 'build')
            i = 2
            while os.path.exists(results_dir):
                results_dir = os.path.join(self.resultdir, 'build.%d' % i)
                i += 1
        if not os.path.exists(results_dir):
            os.mkdir(results_dir)

        return (results_dir, tmp_dir)


    def xen(self, base_tree, results_dir='', tmp_dir='', leave=False,
            kjob=None):
        """Summon a xen object"""
        (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
        build_dir = 'xen'
        return xen.xen(self, base_tree, results_dir, tmp_dir, build_dir,
                       leave, kjob)


    def kernel(self, base_tree, results_dir='', tmp_dir='', leave=False):
        """Summon a kernel object"""
        (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
        build_dir = 'linux'
        return kernel.auto_kernel(self, base_tree, results_dir,
                                  tmp_dir, build_dir, leave)
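
    # A minimal control-file sketch using this method; the version string
    # and config path are illustrative, not part of this API's contract:
    #
    #     testkernel = job.kernel('2.6.18')      # summon a kernel object
    #     testkernel.config('/path/to/config')   # hypothetical config file
    #     testkernel.build()
    #     testkernel.boot()                      # reboots into the new kernel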


    def barrier(self, *args, **kwds):
        """Create a barrier object"""
        return barrier.barrier(*args, **kwds)
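
    # Sketch: arguments pass straight through to barrier.barrier; assuming
    # its usual (hostid, tag, timeout) form, a multi-machine control file
    # might synchronize like this (names and timeout are illustrative):
    #
    #     b = job.barrier('host0', 'sync_point', 120)
    #     # ...then use b to rendezvous with the other participating hosts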


    def setup_dep(self, deps):
        """Set up the dependencies for this test.

        deps is a list of libraries required for this test.
        """
        for dep in deps:
            try:
                os.chdir(os.path.join(self.autodir, 'deps', dep))
                autotest_utils.system('./' + dep + '.py')
            except:
                err = "setting up dependency " + dep + "\n"
                raise error.UnhandledError(err)

    def __runtest(self, url, tag, args, dargs):
        try:
            l = lambda: test.runtest(self, url, tag, args, dargs)
            pid = parallel.fork_start(self.resultdir, l)
            parallel.fork_waitfor(self.resultdir, pid)
        except error.AutotestError:
            raise
        except Exception, e:
            msg = "Unhandled %s error occurred during test\n"
            msg %= str(e.__class__.__name__)
            raise error.UnhandledError(msg)


    def run_test(self, url, *args, **dargs):
        """Summon a test object and run it.

        url
            url of the test to run
        tag
            tag to add to testname (optional, passed as a keyword)
        """
        if not url:
            raise TypeError("Test name is invalid. "
                            "Switched arguments?")
        (group, testname) = test.testname(url)
        tag = dargs.pop('tag', None)
        container = dargs.pop('container', None)
        subdir = testname
        if tag:
            subdir += '.' + tag

        if container:
            cname = container.get('name', None)
            if not cname:   # get old name
                cname = container.get('container_name', None)
            mbytes = container.get('mbytes', None)
            if not mbytes:  # get old name
                mbytes = container.get('mem', None)
            cpus = container.get('cpus', None)
            if not cpus:    # get old name
                cpus = container.get('cpu', None)
            root = container.get('root', None)
            self.new_container(mbytes=mbytes, cpus=cpus,
                               root=root, name=cname)
            # We are running in a container now...

        def log_warning(reason):
            self.record("WARN", subdir, testname, reason)

        @disk_usage_monitor.watch(log_warning, "/",
                                  self.max_disk_usage_rate)
        def group_func():
            try:
                self.__runtest(url, tag, args, dargs)
            except error.TestNAError, detail:
                self.record('TEST_NA', subdir, testname,
                            str(detail))
                raise
            except Exception, detail:
                self.record('FAIL', subdir, testname,
                            str(detail))
                raise
            else:
                self.record('GOOD', subdir, testname,
                            'completed successfully')

        result, exc_info = self.__rungroup(subdir, group_func)
        if container:
            self.release_container()
        if exc_info and isinstance(exc_info[1], error.TestError):
            return False
        elif exc_info:
            raise exc_info[0], exc_info[1], exc_info[2]
        else:
            return True
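
    # Hedged examples of how a control file might invoke this; the test
    # names, iteration count and container sizes are illustrative only:
    #
    #     job.run_test('sleeptest')
    #     job.run_test('kernbench', 2, tag='quick')
    #     job.run_test('dbench', container={'mbytes': 512, 'cpus': 2})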


    def __rungroup(self, name, function, *args, **dargs):
        """\
        name:
            name of the group
        function:
            subroutine to run
        *args:
            arguments for the function

        Returns a 2-tuple (result, exc_info) where result
        is the return value of function, and exc_info is
        the sys.exc_info() of the exception thrown by the
        function (which may be None).
        """

        result, exc_info = None, None
        try:
            self.record('START', None, name)
            self._increment_group_level()
            result = function(*args, **dargs)
            self._decrement_group_level()
            self.record('END GOOD', None, name)
        except error.TestNAError, e:
            self._decrement_group_level()
            self.record('END TEST_NA', None, name, str(e))
        except Exception, e:
            exc_info = sys.exc_info()
            self._decrement_group_level()
            err_msg = str(e) + '\n' + traceback.format_exc()
            self.record('END FAIL', None, name, err_msg)

        return result, exc_info


    def run_group(self, function, *args, **dargs):
        """\
        function:
            subroutine to run
        *args:
            arguments for the function
        """

        # Allow the tag for the group to be specified
        name = function.__name__
        tag = dargs.pop('tag', None)
        if tag:
            name = tag

        result, exc_info = self.__rungroup(name, function,
                                           *args, **dargs)

        # if there was a non-TestError exception, raise it
        if exc_info and not isinstance(exc_info[1], error.TestError):
            err = ''.join(traceback.format_exception(*exc_info))
            raise error.TestError(name + ' failed\n' + err)

        # pass back the actual return value from the function
        return result
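
    # Sketch: grouping several steps under one START/END block in the
    # status log; the function name (or the 'tag' keyword) becomes the
    # group name. Test names are illustrative:
    #
    #     def net_tests():
    #         job.run_test('netperf2')
    #         job.run_test('iperf')
    #     job.run_group(net_tests, tag='network')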


    def new_container(self, mbytes=None, cpus=None, root=None, name=None):
        if not autotest_utils.grep('cpuset', '/proc/filesystems'):
            print "Containers not enabled by latest reboot"
            return  # containers weren't enabled in this kernel boot
        pid = os.getpid()
        if not name:
            name = 'test%d' % pid  # make arbitrary unique name
        self.container = cpuset.cpuset(name, job_size=mbytes,
                                       job_pid=pid, cpus=cpus, root=root)
        # This job's python shell is now running in the new container
        # and all forked test processes will inherit that container


    def release_container(self):
        if self.container:
            self.container.release()
            self.container = None


    def cpu_count(self):
        if self.container:
            return len(self.container.cpus)
        return autotest_utils.count_cpus()  # use total system count
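
    # Sketch of direct container use (normally reached through run_test's
    # 'container' argument); the sizes and name here are illustrative:
    #
    #     job.new_container(mbytes=1024, cpus=2, name='mycontainer')
    #     # ... run disk/cpu-bound work inside the cpuset ...
    #     job.release_container()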


    # Check the passed kernel identifier against the command line
    # and the running kernel, abort the job on mismatch.
    def kernel_check_ident(self, expected_when, expected_id, subdir,
                           type='src', patches=[]):
        print (("POST BOOT: checking booted kernel " +
                "mark=%d identity='%s' type='%s'") %
               (expected_when, expected_id, type))

        running_id = autotest_utils.running_os_ident()

        cmdline = autotest_utils.read_one_line("/proc/cmdline")

        find_sum = re.compile(r'.*IDENT=(\d+)')
        m = find_sum.match(cmdline)
        cmdline_when = -1
        if m:
            cmdline_when = int(m.groups()[0])

        # We have all the facts, see if they indicate we
        # booted the requested kernel or not.
        bad = False
        if (type == 'src' and expected_id != running_id or
            type == 'rpm' and
            not running_id.startswith(expected_id + '::')):
            print "check_kernel_ident: kernel identifier mismatch"
            bad = True
        if expected_when != cmdline_when:
            print "check_kernel_ident: kernel command line mismatch"
            bad = True

        if bad:
            print "   Expected Ident: " + expected_id
            print "    Running Ident: " + running_id
            print "    Expected Mark: %d" % (expected_when)
            print "Command Line Mark: %d" % (cmdline_when)
            print "     Command Line: " + cmdline

            raise error.JobError("boot failure", "reboot.verify")

        kernel_info = {'kernel': expected_id}
        for i, patch in enumerate(patches):
            kernel_info["patch%d" % i] = patch
        self.record('GOOD', subdir, 'reboot.verify', expected_id)
        self._decrement_group_level()
        self.record('END GOOD', subdir, 'reboot',
                    optional_fields=kernel_info)


    def filesystem(self, device, mountpoint=None, loop_size=0):
        if not mountpoint:
            mountpoint = self.tmpdir
        return filesystem.filesystem(self, device, mountpoint, loop_size)


    def enable_external_logging(self):
        pass


    def disable_external_logging(self):
        pass


    def reboot_setup(self):
        pass


    def reboot(self, tag='autotest'):
        self.reboot_setup()
        self.record('START', None, 'reboot')
        self._increment_group_level()
        self.record('GOOD', None, 'reboot.start')
        self.harness.run_reboot()
        default = self.config_get('boot.set_default')
        if default:
            self.bootloader.set_default(tag)
        else:
            self.bootloader.boot_once(tag)
        cmd = "(sleep 5; reboot) </dev/null >/dev/null 2>&1 &"
        autotest_utils.system(cmd)
        self.quit()
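
    # Sketch of the usual reboot flow in a step-engine control file: queue
    # the next step, then boot the new kernel (which ends in job.reboot());
    # execution resumes at the queued step after the machine comes back.
    # The version string and test name are illustrative:
    #
    #     def step_init():
    #         job.next_step(step_test)
    #         testkernel = job.kernel('2.6.18')
    #         testkernel.build()
    #         testkernel.boot()    # implicitly reboots
    #
    #     def step_test():
    #         job.run_test('kernbench')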


    def noop(self, text):
        print "job: noop: " + text


    def parallel(self, *tasklist):
        """Run tasks in parallel"""

        pids = []
        old_log_filename = self.log_filename
        for i, task in enumerate(tasklist):
            self.log_filename = old_log_filename + (".%d" % i)
            task_func = lambda: task[0](*task[1:])
            pids.append(parallel.fork_start(self.resultdir,
                                            task_func))

        old_log_path = os.path.join(self.resultdir, old_log_filename)
        old_log = open(old_log_path, "a")
        exceptions = []
        for i, pid in enumerate(pids):
            # wait for the task to finish
            try:
                parallel.fork_waitfor(self.resultdir, pid)
            except Exception, e:
                exceptions.append(e)
            # copy the logs from the subtask into the main log
            new_log_path = old_log_path + (".%d" % i)
            if os.path.exists(new_log_path):
                new_log = open(new_log_path)
                old_log.write(new_log.read())
                new_log.close()
                old_log.flush()
                os.remove(new_log_path)
        old_log.close()

        self.log_filename = old_log_filename

        # handle any exceptions raised by the parallel tasks
        if exceptions:
            msg = "%d task(s) failed" % len(exceptions)
            raise error.JobError(msg, str(exceptions), exceptions)
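
    # Sketch: each task is a sequence whose first element is a callable and
    # whose remainder are its arguments; tasks run in forked children and
    # their status logs are folded back into the main log afterwards. The
    # test names are illustrative:
    #
    #     job.parallel([job.run_test, 'dbench'],
    #                  [job.run_test, 'bonnie'])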


    def quit(self):
        # XXX: should have a better name.
        self.harness.run_pause()
        raise error.JobContinue("more to come")


    def complete(self, status):
        """Clean up and exit"""
        # We are about to exit 'complete' so clean up the control file.
        try:
            os.unlink(self.state_file)
        except:
            pass

        self.harness.run_complete()
        self.disable_external_logging()
        sys.exit(status)


    def set_state(self, var, val):
        # Deep copies make sure that the state can't be altered
        # without it being re-written. Perf wise, deep copies
        # are overshadowed by pickling/loading.
        self.state[var] = copy.deepcopy(val)
        pickle.dump(self.state, open(self.state_file, 'w'))


    def __load_state(self):
        assert not hasattr(self, "state")
        try:
            self.state = pickle.load(open(self.state_file, 'r'))
            self.state_existed = True
        except Exception:
            print "Initializing the state engine."
            self.state = {}
            self.set_state('__steps', [])  # writes pickle file
            self.state_existed = False


    def get_state(self, var, default=None):
        if var in self.state or default == None:
            val = self.state[var]
        else:
            val = default
        return copy.deepcopy(val)
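
    # Sketch: state persists across the reboots a job performs, because
    # every set_state() re-pickles the dictionary to <control>.state.
    # The key names below are illustrative:
    #
    #     job.set_state('my_counter', 3)
    #     job.get_state('my_counter')          # -> 3, even after a reboot
    #     job.get_state('missing', default=0)  # -> 0; with no default, a
    #                                          #    KeyError propagates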


    def __create_step_tuple(self, fn, args, dargs):
        # Legacy code passes in an array where the first arg is
        # the function or its name.
        if isinstance(fn, list):
            assert(len(args) == 0)
            assert(len(dargs) == 0)
            args = fn[1:]
            fn = fn[0]
        # Pickling actual functions is hairy, thus we have to call
        # them by name. Unfortunately, this means only functions
        # defined globally can be used as a next step.
        if callable(fn):
            fn = fn.__name__
        if not isinstance(fn, types.StringTypes):
            raise StepError("Next steps must be functions or "
                            "strings containing the function name")
        ancestry = copy.copy(self.current_step_ancestry)
        return (ancestry, fn, args, dargs)


    def next_step(self, fn, *args, **dargs):
        """Define the next step"""
        steps = self.get_state('__steps')
        steps.append(self.__create_step_tuple(fn, args, dargs))
        self.set_state('__steps', steps)


    def next_step_prepend(self, fn, *args, **dargs):
        """Insert a new step, executing first"""
        steps = self.get_state('__steps')
        steps.insert(0, self.__create_step_tuple(fn, args, dargs))
        self.set_state('__steps', steps)
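
    # Sketch of a control file driving the step engine; steps are stored by
    # function name, so they must be defined at global scope. The argument
    # and test name are illustrative:
    #
    #     def step_init():
    #         job.next_step(step_one, 'some_arg')  # queued, not run now
    #
    #     def step_one(arg):
    #         job.run_test('sleeptest')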


    def _run_step_fn(self, local_vars, fn, args, dargs):
        """Run a (step) function within the given context"""

        local_vars['__args'] = args
        local_vars['__dargs'] = dargs
        exec('__ret = %s(*__args, **__dargs)' % fn,
             local_vars, local_vars)
        return local_vars['__ret']


    def _create_frame(self, global_vars, ancestry, fn_name):
        """Set up the environment like it would have been when this
        function was first defined.

        Child step engine 'implementations' must have 'return locals()'
        at the end of their steps. Because of this, we can call the
        parent function and get back all child functions (i.e. those
        defined within it).

        Unfortunately, the call stack of the function calling
        job.next_step might have been deeper than the function it
        added. In order to make sure that the environment is what it
        should be, we need to then pop off the frames we built until
        we find the frame where the function was first defined."""

        # The copies ensure that the parent frames are not modified
        # while building child frames. This matters if we then
        # pop some frames in the next part of this function.
        current_frame = copy.copy(global_vars)
        frames = [current_frame]
        for steps_fn_name in ancestry:
            ret = self._run_step_fn(current_frame,
                                    steps_fn_name, [], {})
            current_frame = copy.copy(ret)
            frames.append(current_frame)

        while len(frames) > 2:
            if fn_name not in frames[-2]:
                break
            if frames[-2][fn_name] != frames[-1][fn_name]:
                break
            frames.pop()
            ancestry.pop()

        return (frames[-1], ancestry)


    def _add_step_init(self, local_vars, current_function):
        """If the function returned a dictionary that includes a
        function named 'step_init', prepend it to our list of steps.
        This will only get run the first time a function with a nested
        use of the step engine is run."""

        if (isinstance(local_vars, dict) and
            'step_init' in local_vars and
            callable(local_vars['step_init'])):
            # The init step is a child of the function
            # we were just running.
            self.current_step_ancestry.append(current_function)
            self.next_step_prepend('step_init')


    def step_engine(self):
        """The stepping engine -- if the control file defines step_init
        we will be using this engine to drive multiple runs."""

        # Set up the environment and then interpret the control file.
        # Some control files will have code outside of functions,
        # which means we need to have our state engine initialized
        # before reading in the file.
        global_control_vars = {'job': self}
        exec(JOB_PREAMBLE, global_control_vars, global_control_vars)
        execfile(self.control, global_control_vars, global_control_vars)

        # If we loaded in a mid-job state file, then we presumably
        # know what steps we have yet to run.
        if not self.state_existed:
            if global_control_vars.has_key('step_init'):
                self.next_step(global_control_vars['step_init'])

        # Iterate through the steps. If we reboot, we'll simply
        # continue iterating on the next step.
        while len(self.get_state('__steps')) > 0:
            steps = self.get_state('__steps')
            (ancestry, fn_name, args, dargs) = steps.pop(0)
            self.set_state('__steps', steps)

            ret = self._create_frame(global_control_vars, ancestry,
                                     fn_name)
            local_vars, self.current_step_ancestry = ret
            local_vars = self._run_step_fn(local_vars, fn_name,
                                           args, dargs)
            self._add_step_init(local_vars, fn_name)


    def _init_group_level(self):
        self.group_level = self.get_state("__group_level", default=0)


    def _increment_group_level(self):
        self.group_level += 1
        self.set_state("__group_level", self.group_level)


    def _decrement_group_level(self):
        self.group_level -= 1
        self.set_state("__group_level", self.group_level)


    def record(self, status_code, subdir, operation, status='',
               optional_fields=None):
        """
        Record job-level status

        The intent is to make this file both machine parseable and
        human readable. That involves a little more complexity, but
        really isn't all that bad ;-)

        Format is <status code>\t<subdir>\t<operation>\t<status>

        status code: (GOOD|WARN|FAIL|ABORT)
            or START
            or END (GOOD|WARN|FAIL|ABORT)

        subdir: MUST be a relevant subdirectory in the results,
            or None, which will be represented as '----'

        operation: description of what you ran (e.g. "dbench", or
            "mkfs -t foobar /dev/sda9")

        status: error message or "completed successfully"

        ------------------------------------------------------------

        Initial tabs indicate indent levels for grouping, and are
        governed by self.group_level

        multiline messages have secondary lines prefaced by a double
        space ('  ')
        """

        if subdir:
            if re.match(r'[\n\t]', subdir):
                raise ValueError("Invalid character in "
                                 "subdir string")
            substr = subdir
        else:
            substr = '----'

        if not logging.is_valid_status(status_code):
            raise ValueError("Invalid status code supplied: %s" %
                             status_code)
        if not operation:
            operation = '----'

        if re.match(r'[\n\t]', operation):
            raise ValueError("Invalid character in "
                             "operation string")
        operation = operation.rstrip()

        if not optional_fields:
            optional_fields = {}

        status = status.rstrip()
        status = re.sub(r"\t", "  ", status)
        # Ensure any continuation lines are marked so we can
        # detect them in the status file to ensure it is parsable.
        status = re.sub(r"\n", "\n" + "\t" * self.group_level + "  ",
                        status)

        # Generate timestamps for inclusion in the logs
        epoch_time = int(time.time())  # seconds since epoch, in UTC
        local_time = time.localtime(epoch_time)
        optional_fields["timestamp"] = str(epoch_time)
        optional_fields["localtime"] = time.strftime("%b %d %H:%M:%S",
                                                     local_time)

        fields = [status_code, substr, operation]
        fields += ["%s=%s" % x for x in optional_fields.iteritems()]
        fields.append(status)

        msg = '\t'.join(str(x) for x in fields)
        msg = '\t' * self.group_level + msg

        msg_tag = ""
        if "." in self.log_filename:
            msg_tag = self.log_filename.split(".", 1)[1]

        self.harness.test_status_detail(status_code, substr,
                                        operation, status, msg_tag)
        self.harness.test_status(msg, msg_tag)

        # log to stdout (if enabled)
        #if self.log_filename == self.DEFAULT_LOG_FILENAME:
        print msg

        # log to the "root" status log
        status_file = os.path.join(self.resultdir, self.log_filename)
        open(status_file, "a").write(msg + "\n")

        # log to the subdir status log (if subdir is set)
        if subdir:
            dir = os.path.join(self.resultdir, subdir)
            if not os.path.exists(dir):
                os.mkdir(dir)

            status_file = os.path.join(dir,
                                       self.DEFAULT_LOG_FILENAME)
            open(status_file, "a").write(msg + "\n")
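
    # Illustrative status-log lines this method emits (fields are
    # tab-separated; the timestamp/localtime values here are fabricated):
    #
    #     START   ----    kernbench   timestamp=1210000000    localtime=May 05 12:00:00
    #         GOOD    kernbench   kernbench   timestamp=1210000300    localtime=May 05 12:05:00    completed successfully
    #     END GOOD    ----    kernbench   timestamp=1210000301    localtime=May 05 12:05:01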


class disk_usage_monitor:
    def __init__(self, logging_func, device, max_mb_per_hour):
        self.func = logging_func
        self.device = device
        self.max_mb_per_hour = max_mb_per_hour


    def start(self):
        self.initial_space = autotest_utils.freespace(self.device)
        self.start_time = time.time()


    def stop(self):
        # if no maximum usage rate was set, we don't need to
        # generate any warnings
        if not self.max_mb_per_hour:
            return

        final_space = autotest_utils.freespace(self.device)
        used_space = self.initial_space - final_space
        stop_time = time.time()
        total_time = stop_time - self.start_time
        # round up the time to one minute, to keep extremely short
        # tests from generating false positives due to short, badly
        # timed bursts of activity
        total_time = max(total_time, 60.0)

        # determine the usage rate
        bytes_per_sec = used_space / total_time
        mb_per_sec = bytes_per_sec / 1024**2
        mb_per_hour = mb_per_sec * 60 * 60

        if mb_per_hour > self.max_mb_per_hour:
            msg = ("disk space on %s was consumed at a rate of "
                   "%.2f MB/hour")
            msg %= (self.device, mb_per_hour)
            self.func(msg)


    @classmethod
    def watch(cls, *monitor_args, **monitor_dargs):
        """ Generic decorator to wrap a function call with the
        standard create-monitor -> start -> call -> stop idiom."""
        def decorator(func):
            def watched_func(*args, **dargs):
                monitor = cls(*monitor_args, **monitor_dargs)
                monitor.start()
                try:
                    func(*args, **dargs)
                finally:
                    monitor.stop()
            return watched_func
        return decorator
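
    # Sketch: wrapping an arbitrary function with disk monitoring; the
    # logging function and the 50 MB/hour rate are illustrative:
    #
    #     @disk_usage_monitor.watch(lambda msg: sys.stderr.write(msg + "\n"),
    #                               "/", 50)
    #     def run_workload():
    #         pass   # any disk-heavy work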


def runjob(control, cont=False, tag="default", harness_type='',
           use_external_logging=False):
    """The main interface to this module

    control
        The control file to use for this job.
    cont
        Whether this is the continuation of a previously started job
    """
    control = os.path.abspath(control)
    state = control + '.state'

    # instantiate the job object ready for the control file.
    myjob = None
    try:
        # Check that the control file is valid
        if not os.path.exists(control):
            raise error.JobError(control +
                                 ": control file not found")

        # When continuing, the job is complete when there is no
        # state file, ensure we don't try and continue.
        if cont and not os.path.exists(state):
            raise error.JobComplete("all done")
        if cont == False and os.path.exists(state):
            os.unlink(state)

        myjob = job(control, tag, cont, harness_type,
                    use_external_logging)

        # Load in the user's control file, may do any one of:
        #  1) execute in toto
        #  2) define steps, and select the first via next_step()
        myjob.step_engine()

    except error.JobContinue:
        sys.exit(5)

    except error.JobComplete:
        sys.exit(1)

    except error.JobError, instance:
        print "JOB ERROR: " + instance.args[0]
        if myjob:
            command = None
            if len(instance.args) > 1:
                command = instance.args[1]
            myjob.record('ABORT', None, command, instance.args[0])
            myjob._decrement_group_level()
            myjob.record('END ABORT', None, None)
            assert(myjob.group_level == 0)
            myjob.complete(1)
        else:
            sys.exit(1)

    except Exception, e:
        msg = str(e) + '\n' + traceback.format_exc()
        print "JOB ERROR: " + msg
        if myjob:
            myjob.record('ABORT', None, None, msg)
            myjob._decrement_group_level()
            myjob.record('END ABORT', None, None)
            assert(myjob.group_level == 0)
            myjob.complete(1)
        else:
            sys.exit(1)

    # If we get here, then we assume the job is complete and good.
    myjob._decrement_group_level()
    myjob.record('END GOOD', None, None)
    assert(myjob.group_level == 0)

    myjob.complete(0)
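
# Sketch: the autotest launcher is expected to call this roughly as
# follows (the path and arguments are illustrative):
#
#     runjob('/usr/local/autotest/control', cont=False, tag='default',
#            harness_type='')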


# site_job.py may be non-existent or empty, make sure that an appropriate
# site_job class is created nevertheless
try:
    from site_job import site_job
except ImportError:
    class site_job(base_job):
        pass


class job(site_job):
    pass