blob: 19521e09ba987bf83cd5f82d472729be0f780a33 [file] [log] [blame]
mblighc86b0b42006-07-28 17:35:28 +00001"""The main job wrapper
mbligha2508052006-05-28 21:29:53 +00002
mblighc86b0b42006-07-28 17:35:28 +00003This is the core infrastructure.
4"""
5
6__author__ = """Copyright Andy Whitcroft, Martin J. Bligh 2006"""
mbligha2508052006-05-28 21:29:53 +00007
mbligh8f243ec2006-10-10 05:55:49 +00008# standard stuff
mbligh366ff1b2008-04-25 16:07:56 +00009import os, sys, re, pickle, shutil, time, traceback, types, copy
mbligh302482e2008-05-01 20:06:16 +000010
mbligh8f243ec2006-10-10 05:55:49 +000011# autotest stuff
mblighc61fb362008-06-05 16:22:15 +000012from autotest_lib.client.bin import autotest_utils, parallel, kernel, xen
13from autotest_lib.client.bin import profilers, fd_stack, boottool, harness
14from autotest_lib.client.bin import config, sysinfo, cpuset, test, filesystem
mblighe829ba52008-06-03 15:04:08 +000015from autotest_lib.client.common_lib import error, barrier, logging, utils
mbligh302482e2008-05-01 20:06:16 +000016
# Code prepended to every stepped control file before it is executed, so
# that step functions can use the error classes and autotest_utils helpers
# without qualifying them.
JOB_PREAMBLE = """
from common.error import *
from autotest_utils import *
"""
21
class StepError(error.AutotestError):
    """Raised when a control-file step cannot be created or resolved."""
    pass
24
25
mblighcaa62c22008-04-07 21:51:17 +000026class base_job:
mblighc86b0b42006-07-28 17:35:28 +000027 """The actual job against which we do everything.
28
29 Properties:
mbligh72b88fc2006-12-16 18:41:35 +000030 autodir
mblighc86b0b42006-07-28 17:35:28 +000031 The top level autotest directory (/usr/local/autotest).
32 Comes from os.environ['AUTODIR'].
mbligh72b88fc2006-12-16 18:41:35 +000033 bindir
mblighc86b0b42006-07-28 17:35:28 +000034 <autodir>/bin/
mblighd5a38832008-01-25 18:15:39 +000035 libdir
36 <autodir>/lib/
mbligh72b88fc2006-12-16 18:41:35 +000037 testdir
mblighc86b0b42006-07-28 17:35:28 +000038 <autodir>/tests/
mbligh84bafdb2008-01-26 19:43:34 +000039 site_testdir
40 <autodir>/site_tests/
mblighc86b0b42006-07-28 17:35:28 +000041 profdir
42 <autodir>/profilers/
43 tmpdir
44 <autodir>/tmp/
45 resultdir
46 <autodir>/results/<jobtag>
47 stdout
48 fd_stack object for stdout
49 stderr
50 fd_stack object for stderr
51 profilers
52 the profilers object for this job
apw504a7dd2006-10-12 17:18:37 +000053 harness
54 the server harness object for this job
apw059e1b12006-10-12 17:18:26 +000055 config
56 the job configuration for this job
mblighc86b0b42006-07-28 17:35:28 +000057 """
58
mblighd528d302007-12-19 16:19:05 +000059 DEFAULT_LOG_FILENAME = "status"
60
def __init__(self, control, jobtag, cont, harness_type=None,
             use_external_logging = False):
    """
    control
            The control file (pathname of)
    jobtag
            The job tag string (eg "default")
    cont
            If this is the continuation of this job
    harness_type
            An alternative server harness
    """
    # Directory layout is all derived from $AUTODIR.
    self.autodir = os.environ['AUTODIR']
    self.bindir = os.path.join(self.autodir, 'bin')
    self.libdir = os.path.join(self.autodir, 'lib')
    self.testdir = os.path.join(self.autodir, 'tests')
    self.site_testdir = os.path.join(self.autodir, 'site_tests')
    self.profdir = os.path.join(self.autodir, 'profilers')
    self.tmpdir = os.path.join(self.autodir, 'tmp')
    self.resultdir = os.path.join(self.autodir, 'results', jobtag)
    self.sysinfodir = os.path.join(self.resultdir, 'sysinfo')
    self.control = os.path.abspath(control)
    self.state_file = self.control + '.state'
    self.current_step_ancestry = []
    self.next_step_index = 0
    self.__load_state()

    if not cont:
        # Don't cleanup the tmp dir (which contains the lockfile) in
        # the constructor; that would break multiple jobs starting at
        # the same time on the same client.  The server does the
        # delete; here we only ensure the directory exists.
        if not os.path.exists(self.tmpdir):
            os.mkdir(self.tmpdir)

        results = os.path.join(self.autodir, 'results')
        if not os.path.exists(results):
            os.mkdir(results)

        download = os.path.join(self.testdir, 'download')
        if not os.path.exists(download):
            os.mkdir(download)

        # Start every fresh (non-continuation) job from an empty
        # results directory.
        if os.path.exists(self.resultdir):
            utils.system('rm -rf '
                         + self.resultdir)
        os.mkdir(self.resultdir)
        os.mkdir(self.sysinfodir)

        os.mkdir(os.path.join(self.resultdir, 'debug'))
        os.mkdir(os.path.join(self.resultdir, 'analysis'))

        # Keep a copy of the control file with the results.
        shutil.copyfile(self.control,
                        os.path.join(self.resultdir, 'control'))

    self.control = control
    self.jobtag = jobtag
    self.log_filename = self.DEFAULT_LOG_FILENAME
    self.container = None

    # Push-down stacks so tests can redirect stdout/stderr.
    self.stdout = fd_stack.fd_stack(1, sys.stdout)
    self.stderr = fd_stack.fd_stack(2, sys.stderr)

    self._init_group_level()

    self.config = config.config(self)

    self.harness = harness.select(harness_type, self)

    self.profilers = profilers.profilers(self)

    # boottool is optional; ignore failures locating it.
    try:
        tool = self.config_get('boottool.executable')
        self.bootloader = boottool.boottool(tool)
    except:
        pass

    sysinfo.log_per_reboot_data(self.sysinfodir)

    if not cont:
        self.record('START', None, None)
        self._increment_group_level()

    self.harness.run_start()

    if use_external_logging:
        self.enable_external_logging()

    # load the max disk usage rate - default to no monitoring
    self.max_disk_usage_rate = self.get_state('__monitor_disk',
                                              default=0.0)
156
157
def monitor_disk_usage(self, max_rate):
    """Signal that the job should monitor disk space usage on /
    and generate a warning if a test uses up disk space at a rate
    exceeding 'max_rate'.

    Parameters:
         max_rate - the maximum allowed rate of disk consumption
                    during a test, in MB/hour, or 0 to indicate
                    no limit.
    """
    # Persist the setting so it survives reboots mid-job.
    self.set_state('__monitor_disk', max_rate)
    self.max_disk_usage_rate = max_rate
171
mbligh0692e472007-08-30 16:07:53 +0000172
def relative_path(self, path):
    """Return a path relative to the job results directory."""
    # +1 strips the separator between resultdir and the remainder.
    prefix_len = len(self.resultdir) + 1
    return path[prefix_len:]
mbligh0692e472007-08-30 16:07:53 +0000179
180
def control_get(self):
    """Return the current control file path."""
    return self.control
183
mblighcaa605c2006-10-02 00:37:35 +0000184
def control_set(self, control):
    """Point the job at a new control file (stored as absolute path)."""
    self.control = os.path.abspath(control)
187
188
def harness_select(self, which):
    """Switch this job over to the named server harness."""
    self.harness = harness.select(which, self)
191
192
def config_set(self, name, value):
    """Set a job configuration value by name."""
    self.config.set(name, value)
195
196
def config_get(self, name):
    """Look up a job configuration value by name."""
    return self.config.get(name)
199
def setup_dirs(self, results_dir, tmp_dir):
    """Ensure the build results and temp directories exist.

    results_dir: desired results dir, or falsy to auto-pick one
                 under self.resultdir ('build', 'build.2', ...).
    tmp_dir:     desired temp dir, or falsy for <tmpdir>/build.
    Returns (results_dir, tmp_dir) actually chosen.
    Raises ValueError if tmp_dir exists but is not a directory.
    """
    if not tmp_dir:
        tmp_dir = os.path.join(self.tmpdir, 'build')
    if not os.path.exists(tmp_dir):
        os.mkdir(tmp_dir)
    if not os.path.isdir(tmp_dir):
        # Bug fix: report the directory that was actually checked
        # (tmp_dir), not self.tmpdir.
        e_msg = "Temp dir (%s) is not a dir - args backwards?" % tmp_dir
        raise ValueError(e_msg)

    # We label the first build "build" and then subsequent ones
    # as "build.2", "build.3", etc. Whilst this is a little bit
    # inconsistent, 99.9% of jobs will only have one build
    # (that's not done as kernbench, sparse, or buildtest),
    # so it works out much cleaner. One of life's comprimises.
    if not results_dir:
        results_dir = os.path.join(self.resultdir, 'build')
        i = 2
        while os.path.exists(results_dir):
            results_dir = os.path.join(self.resultdir, 'build.%d' % i)
            i += 1
    if not os.path.exists(results_dir):
        os.mkdir(results_dir)

    return (results_dir, tmp_dir)
224
225
def xen(self, base_tree, results_dir = '', tmp_dir = '', leave = False, \
                        kjob = None ):
    """Summon a xen object"""
    (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
    # xen builds always go into a 'xen' subdirectory.
    return xen.xen(self, base_tree, results_dir, tmp_dir, 'xen', leave, kjob)
232
233
def kernel(self, base_tree, results_dir = '', tmp_dir = '', leave = False):
    """Summon a kernel object"""
    (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
    # kernel builds always go into a 'linux' subdirectory.
    return kernel.auto_kernel(self, base_tree, results_dir, tmp_dir,
                              'linux', leave)
mblighf4c35322006-03-13 01:01:10 +0000240
mblighcaa605c2006-10-02 00:37:35 +0000241
def barrier(self, *args, **kwds):
    """Create a barrier object"""
    # Thin pass-through to the barrier module's constructor.
    return barrier.barrier(*args, **kwds)
mblighfadca202006-09-23 04:40:01 +0000245
mblighcaa605c2006-10-02 00:37:35 +0000246
def setup_dep(self, deps):
    """Set up the dependencies for this test.

    deps is a list of libraries required for this test.

    Each dependency lives in <autodir>/deps/<dep> and is built by
    running its <dep>.py script from inside that directory.  Any
    failure is re-raised as error.UnhandledError.
    """
    for dep in deps:
        try:
            os.chdir(os.path.join(self.autodir, 'deps', dep))
            utils.system('./' + dep + '.py')
        # Bug fix: was a bare 'except:', which also swallowed
        # SystemExit/KeyboardInterrupt.
        except Exception:
            err = "setting up dependency " + dep + "\n"
            raise error.UnhandledError(err)
260
mbligh72b88fc2006-12-16 18:41:35 +0000261 def __runtest(self, url, tag, args, dargs):
262 try:
mbligh53c41502007-10-23 20:45:04 +0000263 l = lambda : test.runtest(self, url, tag, args, dargs)
mbligh302482e2008-05-01 20:06:16 +0000264 pid = parallel.fork_start(self.resultdir, l)
265 parallel.fork_waitfor(self.resultdir, pid)
266 except error.AutotestError:
mbligh72b88fc2006-12-16 18:41:35 +0000267 raise
jadmanskicf8c4d62008-05-27 22:09:14 +0000268 except Exception, e:
269 msg = "Unhandled %s error occured during test\n"
270 msg %= str(e.__class__.__name__)
271 raise error.UnhandledError(msg)
apwf1a81162006-04-25 10:10:29 +0000272
mblighcaa605c2006-10-02 00:37:35 +0000273
mblighd016ecc2006-11-25 21:41:07 +0000274 def run_test(self, url, *args, **dargs):
mblighc86b0b42006-07-28 17:35:28 +0000275 """Summon a test object and run it.
276
277 tag
278 tag to add to testname
mbligh12a7df72006-10-06 03:54:33 +0000279 url
280 url of the test to run
mblighc86b0b42006-07-28 17:35:28 +0000281 """
mbligh12a7df72006-10-06 03:54:33 +0000282
mblighd016ecc2006-11-25 21:41:07 +0000283 if not url:
mbligh302482e2008-05-01 20:06:16 +0000284 raise TypeError("Test name is invalid. "
285 "Switched arguments?")
mbligh09f288a2007-09-18 21:34:57 +0000286 (group, testname) = test.testname(url)
mbligh7dd510c2007-11-13 17:11:22 +0000287 tag = dargs.pop('tag', None)
mbligh65938a22007-12-10 16:58:52 +0000288 container = dargs.pop('container', None)
mbligh09f288a2007-09-18 21:34:57 +0000289 subdir = testname
mbligh7dd510c2007-11-13 17:11:22 +0000290 if tag:
291 subdir += '.' + tag
292
mbligh65938a22007-12-10 16:58:52 +0000293 if container:
mbligh68119582008-01-25 18:16:41 +0000294 cname = container.get('name', None)
295 if not cname: # get old name
296 cname = container.get('container_name', None)
297 mbytes = container.get('mbytes', None)
298 if not mbytes: # get old name
299 mbytes = container.get('mem', None)
300 cpus = container.get('cpus', None)
301 if not cpus: # get old name
302 cpus = container.get('cpu', None)
jadmanski87cbc7f2008-05-13 18:17:10 +0000303 root = container.get('root', None)
mbligh68119582008-01-25 18:16:41 +0000304 self.new_container(mbytes=mbytes, cpus=cpus,
305 root=root, name=cname)
mbligh65938a22007-12-10 16:58:52 +0000306 # We are running in a container now...
307
jadmanski8415f962008-05-06 20:38:53 +0000308 def log_warning(reason):
309 self.record("WARN", subdir, testname, reason)
310 @disk_usage_monitor.watch(log_warning, "/",
311 self.max_disk_usage_rate)
mbligh7dd510c2007-11-13 17:11:22 +0000312 def group_func():
apwf1a81162006-04-25 10:10:29 +0000313 try:
mblighd016ecc2006-11-25 21:41:07 +0000314 self.__runtest(url, tag, args, dargs)
mbligh302482e2008-05-01 20:06:16 +0000315 except error.TestNAError, detail:
316 self.record('TEST_NA', subdir, testname,
317 str(detail))
318 raise
apwf1a81162006-04-25 10:10:29 +0000319 except Exception, detail:
mbligh7dd510c2007-11-13 17:11:22 +0000320 self.record('FAIL', subdir, testname,
321 str(detail))
apwf1a81162006-04-25 10:10:29 +0000322 raise
323 else:
mbligh7dd510c2007-11-13 17:11:22 +0000324 self.record('GOOD', subdir, testname,
325 'completed successfully')
jadmanski8415f962008-05-06 20:38:53 +0000326
mblighcfc6dd32007-11-20 00:44:35 +0000327 result, exc_info = self.__rungroup(subdir, group_func)
mbligh68119582008-01-25 18:16:41 +0000328 if container:
329 self.release_container()
mbligh302482e2008-05-01 20:06:16 +0000330 if exc_info and isinstance(exc_info[1], error.TestError):
mbligh7dd510c2007-11-13 17:11:22 +0000331 return False
332 elif exc_info:
mbligh71ea2492008-01-15 20:35:52 +0000333 raise exc_info[0], exc_info[1], exc_info[2]
apwf1a81162006-04-25 10:10:29 +0000334 else:
mbligh7dd510c2007-11-13 17:11:22 +0000335 return True
336
337
338 def __rungroup(self, name, function, *args, **dargs):
339 """\
340 name:
341 name of the group
342 function:
343 subroutine to run
344 *args:
345 arguments for the function
346
347 Returns a 2-tuple (result, exc_info) where result
348 is the return value of function, and exc_info is
349 the sys.exc_info() of the exception thrown by the
350 function (which may be None).
351 """
352
353 result, exc_info = None, None
354 try:
355 self.record('START', None, name)
jadmanskia9c75c42008-05-01 22:05:31 +0000356 self._increment_group_level()
mbligh7dd510c2007-11-13 17:11:22 +0000357 result = function(*args, **dargs)
jadmanskia9c75c42008-05-01 22:05:31 +0000358 self._decrement_group_level()
mbligh7dd510c2007-11-13 17:11:22 +0000359 self.record('END GOOD', None, name)
mbligh302482e2008-05-01 20:06:16 +0000360 except error.TestNAError, e:
jadmanskia9c75c42008-05-01 22:05:31 +0000361 self._decrement_group_level()
mbligh302482e2008-05-01 20:06:16 +0000362 self.record('END TEST_NA', None, name, str(e))
mbligh7dd510c2007-11-13 17:11:22 +0000363 except Exception, e:
364 exc_info = sys.exc_info()
jadmanskia9c75c42008-05-01 22:05:31 +0000365 self._decrement_group_level()
mbligh302482e2008-05-01 20:06:16 +0000366 err_msg = str(e) + '\n' + traceback.format_exc()
mbligh51144e02007-11-20 20:38:18 +0000367 self.record('END FAIL', None, name, err_msg)
mbligh7dd510c2007-11-13 17:11:22 +0000368
369 return result, exc_info
apw0865f482006-03-30 18:50:19 +0000370
mblighd7fb4a62006-10-01 00:57:53 +0000371
def run_group(self, function, *args, **dargs):
    """Run 'function' as a named status-log group.

    function:
            subroutine to run
    *args:
            arguments for the function
    The group name defaults to function.__name__ but may be
    overridden with a 'tag' keyword argument.
    """

    # Allow the tag for the group to be specified.
    name = dargs.pop('tag', None)
    if not name:
        name = function.__name__

    result, exc_info = self.__rungroup(name, function,
                                       *args, **dargs)

    # if there was a non-TestError exception, raise it
    if exc_info and not isinstance(exc_info[1], error.TestError):
        err = ''.join(traceback.format_exception(*exc_info))
        raise error.TestError(name + ' failed\n' + err)

    # pass back the actual return value from the function
    return result
396
mbligh88ab90f2007-08-29 15:52:49 +0000397
def new_container(self, mbytes=None, cpus=None, root=None, name=None):
    """Move this job (and its future forks) into a new cpuset container."""
    if not autotest_utils.grep('cpuset', '/proc/filesystems'):
        print("Containers not enabled by latest reboot")
        return  # containers weren't enabled in this kernel boot
    pid = os.getpid()
    if not name:
        name = 'test%d' % pid  # make arbitrary unique name
    self.container = cpuset.cpuset(name, job_size=mbytes,
                                   job_pid=pid, cpus=cpus, root=root)
    # This job's python shell is now running in the new container
    # and all forked test processes will inherit that container
410
def release_container(self):
    """Release the current cpuset container, if any (idempotent)."""
    if not self.container:
        return
    self.container.release()
    self.container = None
415
416
def cpu_count(self):
    """Return the CPU count available to this job (container-aware)."""
    if self.container:
        return len(self.container.cpus)
    return autotest_utils.count_cpus()  # use total system count
mbligh68119582008-01-25 18:16:41 +0000421
422
# Check the passed kernel identifier against the command line
# and the running kernel, abort the job on missmatch.
def kernel_check_ident(self, expected_when, expected_id, subdir,
                       type = 'src', patches=None):
    """Verify after a reboot that the expected kernel is running.

    expected_when: the IDENT mark embedded in the kernel command line
    expected_id:   the expected kernel identity string
    subdir:        results subdir to record status against
    type:          'src' or 'rpm' identity matching
    patches:       optional list of patch names, logged as patchN fields
    Raises error.JobError on mismatch.
    """
    # Bug fix: 'patches' used a mutable default argument ([]).
    if patches is None:
        patches = []
    print (("POST BOOT: checking booted kernel " +
            "mark=%d identity='%s' type='%s'") %
           (expected_when, expected_id, type))

    running_id = autotest_utils.running_os_ident()

    cmdline = utils.read_one_line("/proc/cmdline")

    # The boot loader appended IDENT=<mark> to the command line.
    find_sum = re.compile(r'.*IDENT=(\d+)')
    m = find_sum.match(cmdline)
    cmdline_when = -1
    if m:
        cmdline_when = int(m.groups()[0])

    # We have all the facts, see if they indicate we
    # booted the requested kernel or not.
    bad = False
    if (type == 'src' and expected_id != running_id or
        type == 'rpm' and
        not running_id.startswith(expected_id + '::')):
        print("check_kernel_ident: kernel identifier mismatch")
        bad = True
    if expected_when != cmdline_when:
        print("check_kernel_ident: kernel command line mismatch")
        bad = True

    if bad:
        print("   Expected Ident: " + expected_id)
        print("    Running Ident: " + running_id)
        print("    Expected Mark: %d" % (expected_when))
        print("Command Line Mark: %d" % (cmdline_when))
        print("     Command Line: " + cmdline)

        raise error.JobError("boot failure", "reboot.verify")

    kernel_info = {'kernel': expected_id}
    for i, patch in enumerate(patches):
        kernel_info["patch%d" % i] = patch
    self.record('GOOD', subdir, 'reboot.verify', expected_id)
    self._decrement_group_level()
    self.record('END GOOD', subdir, 'reboot',
                optional_fields=kernel_info)
apwce73d892007-09-25 16:53:05 +0000469
470
def filesystem(self, device, mountpoint = None, loop_size = 0):
    """Create a filesystem object; mountpoint defaults to the job tmpdir."""
    mountpoint = mountpoint or self.tmpdir
    return filesystem.filesystem(self, device, mountpoint, loop_size)
mblighd7fb4a62006-10-01 00:57:53 +0000475
mblighcaa62c22008-04-07 21:51:17 +0000476
def enable_external_logging(self):
    """Hook to start external logging; no-op here, subclasses override."""
    pass
479
480
def disable_external_logging(self):
    """Hook to stop external logging; no-op here, subclasses override."""
    pass
483
484
def reboot_setup(self):
    """Hook run just before a reboot; no-op here, subclasses override."""
    pass
487
mblighcaa605c2006-10-02 00:37:35 +0000488
def reboot(self, tag='autotest'):
    """Reboot the machine into the boot entry named by 'tag'.

    Opens a 'reboot' status group, arms the bootloader, schedules
    the reboot and then exits the job via quit() so the harness can
    continue after the machine comes back.
    """
    self.reboot_setup()
    self.record('START', None, 'reboot')
    self._increment_group_level()
    self.record('GOOD', None, 'reboot.start')
    self.harness.run_reboot()
    # Either make 'tag' the permanent default or boot it exactly once,
    # depending on configuration.
    if self.config_get('boot.set_default'):
        self.bootloader.set_default(tag)
    else:
        self.bootloader.boot_once(tag)
    cmd = "(sleep 5; reboot) </dev/null >/dev/null 2>&1 &"
    utils.system(cmd)
    self.quit()
mblighcaa605c2006-10-02 00:37:35 +0000503
504
def noop(self, text):
    """Log a no-op marker line to stdout."""
    print("job: noop: " + text)
507
mblighcaa605c2006-10-02 00:37:35 +0000508
mblighc86b0b42006-07-28 17:35:28 +0000509 def parallel(self, *tasklist):
510 """Run tasks in parallel"""
apw8fef4ac2006-10-10 22:53:37 +0000511
512 pids = []
mblighd528d302007-12-19 16:19:05 +0000513 old_log_filename = self.log_filename
514 for i, task in enumerate(tasklist):
515 self.log_filename = old_log_filename + (".%d" % i)
516 task_func = lambda: task[0](*task[1:])
mbligh302482e2008-05-01 20:06:16 +0000517 pids.append(parallel.fork_start(self.resultdir,
518 task_func))
mblighd528d302007-12-19 16:19:05 +0000519
520 old_log_path = os.path.join(self.resultdir, old_log_filename)
521 old_log = open(old_log_path, "a")
mblighd509b712008-01-14 17:41:25 +0000522 exceptions = []
mblighd528d302007-12-19 16:19:05 +0000523 for i, pid in enumerate(pids):
524 # wait for the task to finish
mblighd509b712008-01-14 17:41:25 +0000525 try:
mbligh302482e2008-05-01 20:06:16 +0000526 parallel.fork_waitfor(self.resultdir, pid)
mblighd509b712008-01-14 17:41:25 +0000527 except Exception, e:
528 exceptions.append(e)
mblighd528d302007-12-19 16:19:05 +0000529 # copy the logs from the subtask into the main log
530 new_log_path = old_log_path + (".%d" % i)
531 if os.path.exists(new_log_path):
532 new_log = open(new_log_path)
533 old_log.write(new_log.read())
534 new_log.close()
535 old_log.flush()
536 os.remove(new_log_path)
537 old_log.close()
538
539 self.log_filename = old_log_filename
apw0865f482006-03-30 18:50:19 +0000540
mblighd509b712008-01-14 17:41:25 +0000541 # handle any exceptions raised by the parallel tasks
542 if exceptions:
543 msg = "%d task(s) failed" % len(exceptions)
mbligh302482e2008-05-01 20:06:16 +0000544 raise error.JobError(msg, str(exceptions), exceptions)
mblighd509b712008-01-14 17:41:25 +0000545
mblighcaa605c2006-10-02 00:37:35 +0000546
def quit(self):
    # XXX: should have a better name.
    # Pause the harness, then unwind the job via a JobContinue
    # exception so it can be resumed later (e.g. after reboot).
    self.harness.run_pause()
    raise error.JobContinue("more to come")
apw0865f482006-03-30 18:50:19 +0000551
mblighcaa605c2006-10-02 00:37:35 +0000552
def complete(self, status):
    """Clean up and exit"""
    # We are about to exit 'complete' so clean up the control file's
    # state file; best-effort, the file may legitimately not exist.
    # Bug fix: was a bare 'except:', narrowed to OSError which is all
    # os.unlink can raise here.
    try:
        os.unlink(self.state_file)
    except OSError:
        pass

    self.harness.run_complete()
    self.disable_external_logging()
    sys.exit(status)
apw0865f482006-03-30 18:50:19 +0000564
mblighcaa605c2006-10-02 00:37:35 +0000565
def set_state(self, var, val):
    """Set a persistent state variable and write it to the state file.

    Deep copies make sure that the state can't be altered without it
    being re-written.  Perf wise, deep copies are overshadowed by
    pickling/loading.
    """
    self.state[var] = copy.deepcopy(val)
    # Bug fix: the file object was never closed and was opened in
    # text mode; pickle data should be written in binary mode.
    state_file = open(self.state_file, 'wb')
    try:
        pickle.dump(self.state, state_file)
    finally:
        state_file.close()
572
573
def __load_state(self):
    """Load persistent job state from the state file, or initialize it.

    Sets self.state and self.state_existed (True iff a valid state
    file was found).  Must only be called once, before any state use.
    """
    assert not hasattr(self, "state")
    try:
        # Bug fix: the file object was never closed and was opened in
        # text mode; pickle data should be read in binary mode.
        state_file = open(self.state_file, 'rb')
        try:
            self.state = pickle.load(state_file)
        finally:
            state_file.close()
        self.state_existed = True
    except Exception:
        print("Initializing the state engine.")
        self.state = {}
        self.set_state('__steps', [])  # writes pickle file
        self.state_existed = False
mbligh366ff1b2008-04-25 16:07:56 +0000584
585
def get_state(self, var, default=None):
    """Return a deep copy of a persistent state variable.

    If 'var' is absent and a (non-None) default was supplied, the
    default is returned.  If no default was supplied, the lookup's
    KeyError propagates, matching dict-style access.
    """
    # Bug fix: compare against None with 'is', not '=='.
    if var in self.state or default is None:
        val = self.state[var]
    else:
        val = default
    # Deep copy so callers cannot mutate stored state in place.
    return copy.deepcopy(val)
592
593
def __create_step_tuple(self, fn, args, dargs):
    """Normalize a step into a picklable (ancestry, name, args, dargs)
    tuple."""
    # Legacy code passes in an array where the first arg is
    # the function or its name.
    if isinstance(fn, list):
        assert(len(args) == 0)
        assert(len(dargs) == 0)
        args = fn[1:]
        fn = fn[0]
    # Pickling actual functions is harry, thus we have to call
    # them by name.  Unfortunately, this means only functions
    # defined globally can be used as a next step.
    if callable(fn):
        fn = fn.__name__
    if not isinstance(fn, types.StringTypes):
        raise StepError("Next steps must be functions or "
                        "strings containing the function name")
    ancestry = copy.copy(self.current_step_ancestry)
    return (ancestry, fn, args, dargs)
mbligh12a04cb2008-04-25 16:07:20 +0000612
613
def next_step_append(self, fn, *args, **dargs):
    """Define the next step and place it at the end"""
    steps = self.get_state('__steps')
    steps.append(self.__create_step_tuple(fn, args, dargs))
    self.set_state('__steps', steps)
apw0865f482006-03-30 18:50:19 +0000619
mblighcaa605c2006-10-02 00:37:35 +0000620
def next_step(self, fn, *args, **dargs):
    """Create a new step and place it after any steps added
    while running the current step but before any steps added in
    previous steps"""
    steps = self.get_state('__steps')
    steps.insert(self.next_step_index,
                 self.__create_step_tuple(fn, args, dargs))
    self.next_step_index += 1
    self.set_state('__steps', steps)
630
631
def next_step_prepend(self, fn, *args, **dargs):
    """Insert a new step, executing first"""
    steps = self.get_state('__steps')
    steps.insert(0, self.__create_step_tuple(fn, args, dargs))
    # Keep the insertion point for next_step() after this new head.
    self.next_step_index += 1
    self.set_state('__steps', steps)
mbligh237bed32007-09-05 13:05:57 +0000638
639
def _run_step_fn(self, local_vars, fn, args, dargs):
    """Run a (step) function within the given context"""

    # Stash the arguments under reserved names so the exec'd call
    # can reach them, then pull the return value back out.
    local_vars['__args'] = args
    local_vars['__dargs'] = dargs
    exec('__ret = %s(*__args, **__dargs)' % fn,
         local_vars, local_vars)
    return local_vars['__ret']
648
649
def _create_frame(self, global_vars, ancestry, fn_name):
    """Set up the environment like it would have been when this
    function was first defined.

    Child step engine 'implementations' must have 'return locals()'
    at end end of their steps. Because of this, we can call the
    parent function and get back all child functions (i.e. those
    defined within it).

    Unfortunately, the call stack of the function calling
    job.next_step might have been deeper than the function it
    added. In order to make sure that the environment is what it
    should be, we need to then pop off the frames we built until
    we find the frame where the function was first defined."""

    # The copies ensure that the parent frames are not modified
    # while building child frames. This matters if we then
    # pop some frames in the next part of this function.
    current_frame = copy.copy(global_vars)
    frames = [current_frame]
    for steps_fn_name in ancestry:
        ret = self._run_step_fn(current_frame,
                                steps_fn_name, [], {})
        current_frame = copy.copy(ret)
        frames.append(current_frame)

    # Pop identical trailing frames until fn_name's defining frame
    # is on top (never popping below the two base frames).
    while len(frames) > 2:
        if fn_name not in frames[-2]:
            break
        if frames[-2][fn_name] != frames[-1][fn_name]:
            break
        frames.pop()
        ancestry.pop()

    return (frames[-1], ancestry)
685
686
def _add_step_init(self, local_vars, current_function):
    """If the function returned a dictionary that includes a
    function named 'step_init', prepend it to our list of steps.
    This will only get run the first time a function with a nested
    use of the step engine is run."""

    has_init = (isinstance(local_vars, dict) and
                'step_init' in local_vars and
                callable(local_vars['step_init']))
    if has_init:
        # The init step is a child of the function
        # we were just running.
        self.current_step_ancestry.append(current_function)
        self.next_step_prepend('step_init')
700
701
apw83f8d772006-04-27 14:12:56 +0000702 def step_engine(self):
mblighc86b0b42006-07-28 17:35:28 +0000703 """the stepping engine -- if the control file defines
704 step_init we will be using this engine to drive multiple runs.
705 """
706 """Do the next step"""
apw83f8d772006-04-27 14:12:56 +0000707
mbligh366ff1b2008-04-25 16:07:56 +0000708 # Set up the environment and then interpret the control file.
709 # Some control files will have code outside of functions,
710 # which means we need to have our state engine initialized
711 # before reading in the file.
mblighb274ef52008-06-02 19:40:01 +0000712 global_control_vars = {'job': self}
713 exec(JOB_PREAMBLE, global_control_vars, global_control_vars)
714 execfile(self.control, global_control_vars, global_control_vars)
apw83f8d772006-04-27 14:12:56 +0000715
mbligh366ff1b2008-04-25 16:07:56 +0000716 # If we loaded in a mid-job state file, then we presumably
717 # know what steps we have yet to run.
jadmanskia9c75c42008-05-01 22:05:31 +0000718 if not self.state_existed:
mblighb274ef52008-06-02 19:40:01 +0000719 if global_control_vars.has_key('step_init'):
720 self.next_step(global_control_vars['step_init'])
apw0865f482006-03-30 18:50:19 +0000721
mbligh366ff1b2008-04-25 16:07:56 +0000722 # Iterate through the steps. If we reboot, we'll simply
723 # continue iterating on the next step.
mblighf1ae0a42008-04-25 16:09:20 +0000724 while len(self.get_state('__steps')) > 0:
725 steps = self.get_state('__steps')
mblighb274ef52008-06-02 19:40:01 +0000726 (ancestry, fn_name, args, dargs) = steps.pop(0)
mblighf1ae0a42008-04-25 16:09:20 +0000727 self.set_state('__steps', steps)
apw0865f482006-03-30 18:50:19 +0000728
mbligh8f4d0432008-06-02 19:42:50 +0000729 self.next_step_index = 0
mblighb274ef52008-06-02 19:40:01 +0000730 ret = self._create_frame(global_control_vars, ancestry,
731 fn_name)
732 local_vars, self.current_step_ancestry = ret
733 local_vars = self._run_step_fn(local_vars, fn_name,
734 args, dargs)
735 self._add_step_init(local_vars, fn_name)
apw0865f482006-03-30 18:50:19 +0000736
mblighcaa605c2006-10-02 00:37:35 +0000737
jadmanskia9c75c42008-05-01 22:05:31 +0000738 def _init_group_level(self):
739 self.group_level = self.get_state("__group_level", default=0)
740
741
742 def _increment_group_level(self):
743 self.group_level += 1
744 self.set_state("__group_level", self.group_level)
745
746
747 def _decrement_group_level(self):
748 self.group_level -= 1
749 self.set_state("__group_level", self.group_level)
750
751
752 def record(self, status_code, subdir, operation, status = '',
753 optional_fields=None):
mbligh09f288a2007-09-18 21:34:57 +0000754 """
755 Record job-level status
apw7db8d0b2006-10-09 08:10:25 +0000756
mbligh09f288a2007-09-18 21:34:57 +0000757 The intent is to make this file both machine parseable and
758 human readable. That involves a little more complexity, but
759 really isn't all that bad ;-)
760
761 Format is <status code>\t<subdir>\t<operation>\t<status>
762
763 status code: (GOOD|WARN|FAIL|ABORT)
764 or START
765 or END (GOOD|WARN|FAIL|ABORT)
766
767 subdir: MUST be a relevant subdirectory in the results,
768 or None, which will be represented as '----'
769
770 operation: description of what you ran (e.g. "dbench", or
771 "mkfs -t foobar /dev/sda9")
772
773 status: error message or "completed sucessfully"
774
775 ------------------------------------------------------------
776
777 Initial tabs indicate indent levels for grouping, and is
mbligh7dd510c2007-11-13 17:11:22 +0000778 governed by self.group_level
mbligh09f288a2007-09-18 21:34:57 +0000779
780 multiline messages have secondary lines prefaced by a double
781 space (' ')
782 """
783
mblighb0570ad2007-09-19 18:18:11 +0000784 if subdir:
785 if re.match(r'[\n\t]', subdir):
jadmanskia9c75c42008-05-01 22:05:31 +0000786 raise ValueError("Invalid character in "
787 "subdir string")
mblighb0570ad2007-09-19 18:18:11 +0000788 substr = subdir
789 else:
790 substr = '----'
mbligh09f288a2007-09-18 21:34:57 +0000791
mbligh302482e2008-05-01 20:06:16 +0000792 if not logging.is_valid_status(status_code):
jadmanskia9c75c42008-05-01 22:05:31 +0000793 raise ValueError("Invalid status code supplied: %s" %
794 status_code)
mbligh9c5ac322007-10-31 18:01:59 +0000795 if not operation:
796 operation = '----'
jadmanskia9c75c42008-05-01 22:05:31 +0000797
mbligh09f288a2007-09-18 21:34:57 +0000798 if re.match(r'[\n\t]', operation):
jadmanskia9c75c42008-05-01 22:05:31 +0000799 raise ValueError("Invalid character in "
800 "operation string")
mbligh09f288a2007-09-18 21:34:57 +0000801 operation = operation.rstrip()
jadmanskia9c75c42008-05-01 22:05:31 +0000802
803 if not optional_fields:
804 optional_fields = {}
805
mbligh09f288a2007-09-18 21:34:57 +0000806 status = status.rstrip()
807 status = re.sub(r"\t", " ", status)
apw7db8d0b2006-10-09 08:10:25 +0000808 # Ensure any continuation lines are marked so we can
809 # detect them in the status file to ensure it is parsable.
jadmanskia9c75c42008-05-01 22:05:31 +0000810 status = re.sub(r"\n", "\n" + "\t" * self.group_level + " ",
811 status)
mbligh09f288a2007-09-18 21:34:57 +0000812
mbligh30270302007-11-05 20:33:52 +0000813 # Generate timestamps for inclusion in the logs
814 epoch_time = int(time.time()) # seconds since epoch, in UTC
815 local_time = time.localtime(epoch_time)
jadmanskia9c75c42008-05-01 22:05:31 +0000816 optional_fields["timestamp"] = str(epoch_time)
817 optional_fields["localtime"] = time.strftime("%b %d %H:%M:%S",
818 local_time)
mbligh30270302007-11-05 20:33:52 +0000819
jadmanskia9c75c42008-05-01 22:05:31 +0000820 fields = [status_code, substr, operation]
821 fields += ["%s=%s" % x for x in optional_fields.iteritems()]
822 fields.append(status)
823
824 msg = '\t'.join(str(x) for x in fields)
mbligh7dd510c2007-11-13 17:11:22 +0000825 msg = '\t' * self.group_level + msg
apw7db8d0b2006-10-09 08:10:25 +0000826
mblighd528d302007-12-19 16:19:05 +0000827 msg_tag = ""
828 if "." in self.log_filename:
829 msg_tag = self.log_filename.split(".", 1)[1]
830
jadmanskia9c75c42008-05-01 22:05:31 +0000831 self.harness.test_status_detail(status_code, substr,
832 operation, status, msg_tag)
mblighd528d302007-12-19 16:19:05 +0000833 self.harness.test_status(msg, msg_tag)
834
835 # log to stdout (if enabled)
836 #if self.log_filename == self.DEFAULT_LOG_FILENAME:
apwf1a81162006-04-25 10:10:29 +0000837 print msg
mblighd528d302007-12-19 16:19:05 +0000838
839 # log to the "root" status log
840 status_file = os.path.join(self.resultdir, self.log_filename)
mbligh7dd510c2007-11-13 17:11:22 +0000841 open(status_file, "a").write(msg + "\n")
mblighd528d302007-12-19 16:19:05 +0000842
843 # log to the subdir status log (if subdir is set)
mblighb0570ad2007-09-19 18:18:11 +0000844 if subdir:
mblighadff6ca2008-01-22 16:38:25 +0000845 dir = os.path.join(self.resultdir, subdir)
846 if not os.path.exists(dir):
847 os.mkdir(dir)
848
849 status_file = os.path.join(dir,
mblighd528d302007-12-19 16:19:05 +0000850 self.DEFAULT_LOG_FILENAME)
mblighb0570ad2007-09-19 18:18:11 +0000851 open(status_file, "a").write(msg + "\n")
apwce9abe92006-04-27 14:14:04 +0000852
853
class disk_usage_monitor:
    """Watches free space on a device over a time window and reports
    (via the supplied logging function) when consumption exceeds a
    configured MB/hour limit."""

    def __init__(self, logging_func, device, max_mb_per_hour):
        # logging_func is called with a single warning string.
        self.func = logging_func
        self.device = device
        self.max_mb_per_hour = max_mb_per_hour


    def start(self):
        """Snapshot the device's free space and the wall clock."""
        self.initial_space = autotest_utils.freespace(self.device)
        self.start_time = time.time()


    def stop(self):
        """Compare free space against the snapshot taken by start()
        and emit a warning if the usage rate exceeded the maximum."""
        # No maximum usage rate configured -> nothing to warn about.
        if not self.max_mb_per_hour:
            return

        consumed = self.initial_space - autotest_utils.freespace(self.device)
        elapsed = time.time() - self.start_time
        # Clamp the window to at least one minute so extremely short
        # tests with badly timed bursts of activity don't trigger
        # false positives.
        elapsed = max(elapsed, 60.0)

        # Convert bytes/sec into MB/hour for the comparison.
        mb_per_hour = consumed / elapsed / 1024**2 * 60 * 60

        if mb_per_hour > self.max_mb_per_hour:
            warning = ("disk space on %s was consumed at a rate of "
                       "%.2f MB/hour" % (self.device, mb_per_hour))
            self.func(warning)


    @classmethod
    def watch(cls, *monitor_args, **monitor_dargs):
        """Generic decorator wrapping a function call in the standard
        create-monitor -> start -> call -> stop idiom."""
        def decorator(func):
            def watched_func(*args, **dargs):
                usage_monitor = cls(*monitor_args, **monitor_dargs)
                usage_monitor.start()
                try:
                    func(*args, **dargs)
                finally:
                    # Always stop, even if the wrapped call raised.
                    usage_monitor.stop()
            return watched_func
        return decorator
907
908
def runjob(control, cont = False, tag = "default", harness_type = '',
           use_external_logging = False):
    """The main interface to this module

    control
        The control file to use for this job.
    cont
        Whether this is the continuation of a previously started job
    tag
        Result tag for this run (selects the results subdirectory).
    harness_type
        Name of the harness to run under ('' for standalone).
    use_external_logging
        Whether to enable the external logging mechanism.
    """
    control = os.path.abspath(control)
    # The state file sits next to the control file and persists the
    # step queue across reboots/continuations.
    state = control + '.state'

    # instantiate the job object ready for the control file.
    myjob = None
    try:
        # Check that the control file is valid
        if not os.path.exists(control):
            raise error.JobError(control +
                                 ": control file not found")

        # When continuing, the job is complete when there is no
        # state file, ensure we don't try and continue.
        if cont and not os.path.exists(state):
            raise error.JobComplete("all done")
        # A fresh (non-continuation) run must not inherit stale state.
        if cont == False and os.path.exists(state):
            os.unlink(state)

        myjob = job(control, tag, cont, harness_type,
                    use_external_logging)

        # Load in the users control file, may do any one of:
        #  1) execute in toto
        #  2) define steps, and select the first via next_step()
        myjob.step_engine()

    except error.JobContinue:
        # The job requested a reboot/restart; exit code 5 signals the
        # harness to re-invoke us as a continuation.
        sys.exit(5)

    except error.JobComplete:
        # Continuation was attempted on an already-finished job.
        sys.exit(1)

    except error.JobError, instance:
        print "JOB ERROR: " + instance.args[0]
        if myjob:
            # A second element in args, if present, is the command
            # that failed; record it with the abort.
            command = None
            if len(instance.args) > 1:
                command = instance.args[1]
            myjob.record('ABORT', None, command, instance.args[0])
            # Close out the status-log group before completing.
            myjob._decrement_group_level()
            myjob.record('END ABORT', None, None)
            assert(myjob.group_level == 0)
            myjob.complete(1)
        else:
            sys.exit(1)

    except Exception, e:
        # Any other exception aborts the job too; include the
        # traceback in the status message for post-mortem debugging.
        msg = str(e) + '\n' + traceback.format_exc()
        print "JOB ERROR: " + msg
        if myjob:
            myjob.record('ABORT', None, None, msg)
            myjob._decrement_group_level()
            myjob.record('END ABORT', None, None)
            assert(myjob.group_level == 0)
            myjob.complete(1)
        else:
            sys.exit(1)

    # If we get here, then we assume the job is complete and good.
    myjob._decrement_group_level()
    myjob.record('END GOOD', None, None)
    assert(myjob.group_level == 0)

    myjob.complete(0)
mblighcaa62c22008-04-07 21:51:17 +0000982
983
# site_job.py may be non-existent or empty, make sure that an appropriate
# site_job class is created nevertheless
try:
    from site_job import site_job
except ImportError:
    # No site-specific customizations are available; fall back to an
    # empty subclass so that 'job' below always has a valid base.
    class site_job(base_job):
        pass

# The concrete job class used by runjob(): base_job behaviour, possibly
# extended by site-specific hooks from site_job.
class job(site_job):
    pass
jadmanski87cbc7f2008-05-13 18:17:10 +0000994