blob: de2f73aa75c6254911929f1e3341e5080c42d805 [file] [log] [blame]
mblighc86b0b42006-07-28 17:35:28 +00001"""The main job wrapper
mbligha2508052006-05-28 21:29:53 +00002
mblighc86b0b42006-07-28 17:35:28 +00003This is the core infrastructure.
4"""
5
6__author__ = """Copyright Andy Whitcroft, Martin J. Bligh 2006"""
mbligha2508052006-05-28 21:29:53 +00007
mbligh8f243ec2006-10-10 05:55:49 +00008# standard stuff
mbligh366ff1b2008-04-25 16:07:56 +00009import os, sys, re, pickle, shutil, time, traceback, types, copy
mbligh302482e2008-05-01 20:06:16 +000010
mbligh8f243ec2006-10-10 05:55:49 +000011# autotest stuff
mbligh302482e2008-05-01 20:06:16 +000012from autotest_lib.client.bin import autotest_utils
13from autotest_lib.client.common_lib import error, barrier, logging
14
15import parallel, kernel, xen, test, profilers, filesystem, fd_stack, boottool
16import harness, config, sysinfo, cpuset
17
mblighf4c35322006-03-13 01:01:10 +000018
mbligh12a04cb2008-04-25 16:07:20 +000019
# Source text that step_engine() executes into the control file's namespace
# before the control file itself is run.
JOB_PREAMBLE = """
from common.error import *
from autotest_utils import *
"""
24
25
class StepError(error.AutotestError):
    """Raised when a next step is neither a function nor a function name."""
28
29
mblighcaa62c22008-04-07 21:51:17 +000030class base_job:
mblighc86b0b42006-07-28 17:35:28 +000031 """The actual job against which we do everything.
32
33 Properties:
mbligh72b88fc2006-12-16 18:41:35 +000034 autodir
mblighc86b0b42006-07-28 17:35:28 +000035 The top level autotest directory (/usr/local/autotest).
36 Comes from os.environ['AUTODIR'].
mbligh72b88fc2006-12-16 18:41:35 +000037 bindir
mblighc86b0b42006-07-28 17:35:28 +000038 <autodir>/bin/
mblighd5a38832008-01-25 18:15:39 +000039 libdir
40 <autodir>/lib/
mbligh72b88fc2006-12-16 18:41:35 +000041 testdir
mblighc86b0b42006-07-28 17:35:28 +000042 <autodir>/tests/
mbligh84bafdb2008-01-26 19:43:34 +000043 site_testdir
44 <autodir>/site_tests/
mblighc86b0b42006-07-28 17:35:28 +000045 profdir
46 <autodir>/profilers/
47 tmpdir
48 <autodir>/tmp/
49 resultdir
50 <autodir>/results/<jobtag>
51 stdout
52 fd_stack object for stdout
53 stderr
54 fd_stack object for stderr
55 profilers
56 the profilers object for this job
apw504a7dd2006-10-12 17:18:37 +000057 harness
58 the server harness object for this job
apw059e1b12006-10-12 17:18:26 +000059 config
60 the job configuration for this job
mblighc86b0b42006-07-28 17:35:28 +000061 """
62
mblighd528d302007-12-19 16:19:05 +000063 DEFAULT_LOG_FILENAME = "status"
64
mblighcaa62c22008-04-07 21:51:17 +000065 def __init__(self, control, jobtag, cont, harness_type=None,
66 use_external_logging = False):
mblighc86b0b42006-07-28 17:35:28 +000067 """
68 control
69 The control file (pathname of)
70 jobtag
71 The job tag string (eg "default")
apw96da1a42006-11-02 00:23:18 +000072 cont
73 If this is the continuation of this job
apwe68a7132006-12-01 11:21:37 +000074 harness_type
75 An alternative server harness
mblighc86b0b42006-07-28 17:35:28 +000076 """
mblighf4c35322006-03-13 01:01:10 +000077 self.autodir = os.environ['AUTODIR']
apw870988b2007-09-25 16:50:53 +000078 self.bindir = os.path.join(self.autodir, 'bin')
mblighd5a38832008-01-25 18:15:39 +000079 self.libdir = os.path.join(self.autodir, 'lib')
apw870988b2007-09-25 16:50:53 +000080 self.testdir = os.path.join(self.autodir, 'tests')
mbligh84bafdb2008-01-26 19:43:34 +000081 self.site_testdir = os.path.join(self.autodir, 'site_tests')
apw870988b2007-09-25 16:50:53 +000082 self.profdir = os.path.join(self.autodir, 'profilers')
83 self.tmpdir = os.path.join(self.autodir, 'tmp')
84 self.resultdir = os.path.join(self.autodir, 'results', jobtag)
mbligh0fb83972008-01-10 16:30:02 +000085 self.sysinfodir = os.path.join(self.resultdir, 'sysinfo')
mbligh8d83cdc2007-12-03 18:09:18 +000086 self.control = os.path.abspath(control)
mbligh366ff1b2008-04-25 16:07:56 +000087 self.state_file = self.control + '.state'
88 self.state = None
mbligha2508052006-05-28 21:29:53 +000089
apw96da1a42006-11-02 00:23:18 +000090 if not cont:
91 if os.path.exists(self.tmpdir):
mbligh302482e2008-05-01 20:06:16 +000092 cmd = ('umount -f %s > /dev/null 2> /dev/null'
93 % (self.tmpdir))
94 autotest_utils.system(cmd, ignorestatus=True)
95 autotest_utils.system('rm -rf ' + self.tmpdir)
apw96da1a42006-11-02 00:23:18 +000096 os.mkdir(self.tmpdir)
97
apw870988b2007-09-25 16:50:53 +000098 results = os.path.join(self.autodir, 'results')
99 if not os.path.exists(results):
100 os.mkdir(results)
mblighfbfb77d2007-02-15 18:54:03 +0000101
apwf3d28622007-09-25 16:49:17 +0000102 download = os.path.join(self.testdir, 'download')
103 if os.path.exists(download):
mbligh302482e2008-05-01 20:06:16 +0000104 autotest_utils.system('rm -rf ' + download)
apwf3d28622007-09-25 16:49:17 +0000105 os.mkdir(download)
106
apw96da1a42006-11-02 00:23:18 +0000107 if os.path.exists(self.resultdir):
mbligh302482e2008-05-01 20:06:16 +0000108 autotest_utils.system('rm -rf '
109 + self.resultdir)
apw96da1a42006-11-02 00:23:18 +0000110 os.mkdir(self.resultdir)
mbligh0fb83972008-01-10 16:30:02 +0000111 os.mkdir(self.sysinfodir)
apw96da1a42006-11-02 00:23:18 +0000112
apw870988b2007-09-25 16:50:53 +0000113 os.mkdir(os.path.join(self.resultdir, 'debug'))
114 os.mkdir(os.path.join(self.resultdir, 'analysis'))
apw870988b2007-09-25 16:50:53 +0000115
mbligh8d83cdc2007-12-03 18:09:18 +0000116 shutil.copyfile(self.control,
117 os.path.join(self.resultdir, 'control'))
mblighf4ca14f2008-03-03 16:03:05 +0000118
mbligh4b089662006-06-14 22:34:58 +0000119
apwecf41b72006-03-31 14:00:55 +0000120 self.control = control
mbligh27113602007-10-31 21:07:51 +0000121 self.jobtag = jobtag
mblighd528d302007-12-19 16:19:05 +0000122 self.log_filename = self.DEFAULT_LOG_FILENAME
mbligh68119582008-01-25 18:16:41 +0000123 self.container = None
mblighf4c35322006-03-13 01:01:10 +0000124
mbligh56f1fbb2006-10-01 15:10:56 +0000125 self.stdout = fd_stack.fd_stack(1, sys.stdout)
126 self.stderr = fd_stack.fd_stack(2, sys.stderr)
mbligh7dd510c2007-11-13 17:11:22 +0000127 self.group_level = 0
mblighf4c35322006-03-13 01:01:10 +0000128
apw059e1b12006-10-12 17:18:26 +0000129 self.config = config.config(self)
130
apwd27e55f2006-12-01 11:22:08 +0000131 self.harness = harness.select(harness_type, self)
132
mbligha35553b2006-04-23 15:52:25 +0000133 self.profilers = profilers.profilers(self)
mbligh72905562006-05-25 01:30:49 +0000134
mblighcaa605c2006-10-02 00:37:35 +0000135 try:
apw90154af2006-12-01 11:23:36 +0000136 tool = self.config_get('boottool.executable')
137 self.bootloader = boottool.boottool(tool)
mblighcaa605c2006-10-02 00:37:35 +0000138 except:
139 pass
140
mbligh0fb83972008-01-10 16:30:02 +0000141 sysinfo.log_per_reboot_data(self.sysinfodir)
mbligh3a6d6ca2006-04-23 15:50:24 +0000142
mbligh30270302007-11-05 20:33:52 +0000143 if not cont:
mblighc3430162007-11-14 23:57:19 +0000144 self.record('START', None, None)
mblighc3430162007-11-14 23:57:19 +0000145 self.group_level = 1
apw357f50f2006-12-01 11:22:39 +0000146
apwf91efaf2007-11-24 17:32:13 +0000147 self.harness.run_start()
mblighcaa62c22008-04-07 21:51:17 +0000148
149 if use_external_logging:
150 self.enable_external_logging()
apwf91efaf2007-11-24 17:32:13 +0000151
mbligh0692e472007-08-30 16:07:53 +0000152
153 def relative_path(self, path):
154 """\
155 Return a patch relative to the job results directory
156 """
mbligh1c250ca2007-08-30 16:31:38 +0000157 head = len(self.resultdir) + 1 # remove the / inbetween
158 return path[head:]
mbligh0692e472007-08-30 16:07:53 +0000159
160
mbligh362ab3d2007-08-30 11:24:04 +0000161 def control_get(self):
162 return self.control
163
mblighcaa605c2006-10-02 00:37:35 +0000164
mbligh8d83cdc2007-12-03 18:09:18 +0000165 def control_set(self, control):
166 self.control = os.path.abspath(control)
167
168
apwde1503a2006-10-10 08:34:21 +0000169 def harness_select(self, which):
170 self.harness = harness.select(which, self)
171
172
apw059e1b12006-10-12 17:18:26 +0000173 def config_set(self, name, value):
174 self.config.set(name, value)
175
176
177 def config_get(self, name):
178 return self.config.get(name)
179
mbligh8baa2ea2006-12-17 23:01:24 +0000180 def setup_dirs(self, results_dir, tmp_dir):
mbligh1e8858e2006-11-24 22:18:35 +0000181 if not tmp_dir:
apw870988b2007-09-25 16:50:53 +0000182 tmp_dir = os.path.join(self.tmpdir, 'build')
mbligh1e8858e2006-11-24 22:18:35 +0000183 if not os.path.exists(tmp_dir):
184 os.mkdir(tmp_dir)
185 if not os.path.isdir(tmp_dir):
mbligh642b03e2008-01-14 16:53:15 +0000186 e_msg = "Temp dir (%s) is not a dir - args backwards?" % self.tmpdir
187 raise ValueError(e_msg)
mbligh1e8858e2006-11-24 22:18:35 +0000188
189 # We label the first build "build" and then subsequent ones
190 # as "build.2", "build.3", etc. Whilst this is a little bit
191 # inconsistent, 99.9% of jobs will only have one build
192 # (that's not done as kernbench, sparse, or buildtest),
193 # so it works out much cleaner. One of life's comprimises.
194 if not results_dir:
195 results_dir = os.path.join(self.resultdir, 'build')
196 i = 2
197 while os.path.exists(results_dir):
198 results_dir = os.path.join(self.resultdir, 'build.%d' % i)
mblighd9223fc2006-11-26 17:19:54 +0000199 i += 1
mbligh1e8858e2006-11-24 22:18:35 +0000200 if not os.path.exists(results_dir):
201 os.mkdir(results_dir)
mbligh72b88fc2006-12-16 18:41:35 +0000202
mbligh8baa2ea2006-12-17 23:01:24 +0000203 return (results_dir, tmp_dir)
204
205
206 def xen(self, base_tree, results_dir = '', tmp_dir = '', leave = False, \
207 kjob = None ):
208 """Summon a xen object"""
209 (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
210 build_dir = 'xen'
211 return xen.xen(self, base_tree, results_dir, tmp_dir, build_dir, leave, kjob)
212
213
214 def kernel(self, base_tree, results_dir = '', tmp_dir = '', leave = False):
215 """Summon a kernel object"""
mbligh669caa12007-11-05 18:32:13 +0000216 (results_dir, tmp_dir) = self.setup_dirs(results_dir, tmp_dir)
mbligh8baa2ea2006-12-17 23:01:24 +0000217 build_dir = 'linux'
mbligh6ee7ee02007-11-13 23:49:05 +0000218 return kernel.auto_kernel(self, base_tree, results_dir,
219 tmp_dir, build_dir, leave)
mblighf4c35322006-03-13 01:01:10 +0000220
mblighcaa605c2006-10-02 00:37:35 +0000221
mbligh6b504ff2007-12-12 21:03:49 +0000222 def barrier(self, *args, **kwds):
mblighfadca202006-09-23 04:40:01 +0000223 """Create a barrier object"""
mbligh6b504ff2007-12-12 21:03:49 +0000224 return barrier.barrier(*args, **kwds)
mblighfadca202006-09-23 04:40:01 +0000225
mblighcaa605c2006-10-02 00:37:35 +0000226
mbligh4b089662006-06-14 22:34:58 +0000227 def setup_dep(self, deps):
mblighc86b0b42006-07-28 17:35:28 +0000228 """Set up the dependencies for this test.
229
230 deps is a list of libraries required for this test.
231 """
mbligh4b089662006-06-14 22:34:58 +0000232 for dep in deps:
233 try:
apw870988b2007-09-25 16:50:53 +0000234 os.chdir(os.path.join(self.autodir, 'deps', dep))
mbligh302482e2008-05-01 20:06:16 +0000235 autotest_utils.system('./' + dep + '.py')
mbligh4b089662006-06-14 22:34:58 +0000236 except:
mbligh302482e2008-05-01 20:06:16 +0000237 err = "setting up dependency " + dep + "\n"
238 raise error.UnhandledError(err)
mbligh4b089662006-06-14 22:34:58 +0000239
240
mbligh72b88fc2006-12-16 18:41:35 +0000241 def __runtest(self, url, tag, args, dargs):
242 try:
mbligh53c41502007-10-23 20:45:04 +0000243 l = lambda : test.runtest(self, url, tag, args, dargs)
mbligh302482e2008-05-01 20:06:16 +0000244 pid = parallel.fork_start(self.resultdir, l)
245 parallel.fork_waitfor(self.resultdir, pid)
246 except error.AutotestError:
mbligh72b88fc2006-12-16 18:41:35 +0000247 raise
248 except:
mbligh302482e2008-05-01 20:06:16 +0000249 raise error.UnhandledError('running test ' + \
mbligh72b88fc2006-12-16 18:41:35 +0000250 self.__class__.__name__ + "\n")
apwf1a81162006-04-25 10:10:29 +0000251
mblighcaa605c2006-10-02 00:37:35 +0000252
mblighd016ecc2006-11-25 21:41:07 +0000253 def run_test(self, url, *args, **dargs):
mblighc86b0b42006-07-28 17:35:28 +0000254 """Summon a test object and run it.
255
256 tag
257 tag to add to testname
mbligh12a7df72006-10-06 03:54:33 +0000258 url
259 url of the test to run
mblighc86b0b42006-07-28 17:35:28 +0000260 """
mbligh12a7df72006-10-06 03:54:33 +0000261
mblighd016ecc2006-11-25 21:41:07 +0000262 if not url:
mbligh302482e2008-05-01 20:06:16 +0000263 raise TypeError("Test name is invalid. "
264 "Switched arguments?")
mbligh09f288a2007-09-18 21:34:57 +0000265 (group, testname) = test.testname(url)
mbligh7dd510c2007-11-13 17:11:22 +0000266 tag = dargs.pop('tag', None)
mbligh65938a22007-12-10 16:58:52 +0000267 container = dargs.pop('container', None)
mbligh09f288a2007-09-18 21:34:57 +0000268 subdir = testname
mbligh7dd510c2007-11-13 17:11:22 +0000269 if tag:
270 subdir += '.' + tag
271
mbligh65938a22007-12-10 16:58:52 +0000272 if container:
mbligh68119582008-01-25 18:16:41 +0000273 cname = container.get('name', None)
274 if not cname: # get old name
275 cname = container.get('container_name', None)
276 mbytes = container.get('mbytes', None)
277 if not mbytes: # get old name
278 mbytes = container.get('mem', None)
279 cpus = container.get('cpus', None)
280 if not cpus: # get old name
281 cpus = container.get('cpu', None)
mbligh9ea52602008-04-02 00:15:35 +0000282 root = container.get('root', '')
mbligh68119582008-01-25 18:16:41 +0000283 self.new_container(mbytes=mbytes, cpus=cpus,
284 root=root, name=cname)
mbligh65938a22007-12-10 16:58:52 +0000285 # We are running in a container now...
286
mbligh7dd510c2007-11-13 17:11:22 +0000287 def group_func():
apwf1a81162006-04-25 10:10:29 +0000288 try:
mblighd016ecc2006-11-25 21:41:07 +0000289 self.__runtest(url, tag, args, dargs)
mbligh302482e2008-05-01 20:06:16 +0000290 except error.TestNAError, detail:
291 self.record('TEST_NA', subdir, testname,
292 str(detail))
293 raise
apwf1a81162006-04-25 10:10:29 +0000294 except Exception, detail:
mbligh7dd510c2007-11-13 17:11:22 +0000295 self.record('FAIL', subdir, testname,
296 str(detail))
apwf1a81162006-04-25 10:10:29 +0000297 raise
298 else:
mbligh7dd510c2007-11-13 17:11:22 +0000299 self.record('GOOD', subdir, testname,
300 'completed successfully')
mblighcfc6dd32007-11-20 00:44:35 +0000301 result, exc_info = self.__rungroup(subdir, group_func)
mbligh68119582008-01-25 18:16:41 +0000302 if container:
303 self.release_container()
mbligh302482e2008-05-01 20:06:16 +0000304 if exc_info and isinstance(exc_info[1], error.TestError):
mbligh7dd510c2007-11-13 17:11:22 +0000305 return False
306 elif exc_info:
mbligh71ea2492008-01-15 20:35:52 +0000307 raise exc_info[0], exc_info[1], exc_info[2]
apwf1a81162006-04-25 10:10:29 +0000308 else:
mbligh7dd510c2007-11-13 17:11:22 +0000309 return True
310
311
312 def __rungroup(self, name, function, *args, **dargs):
313 """\
314 name:
315 name of the group
316 function:
317 subroutine to run
318 *args:
319 arguments for the function
320
321 Returns a 2-tuple (result, exc_info) where result
322 is the return value of function, and exc_info is
323 the sys.exc_info() of the exception thrown by the
324 function (which may be None).
325 """
326
327 result, exc_info = None, None
328 try:
329 self.record('START', None, name)
330 self.group_level += 1
331 result = function(*args, **dargs)
332 self.group_level -= 1
333 self.record('END GOOD', None, name)
mbligh302482e2008-05-01 20:06:16 +0000334 except error.TestNAError, e:
335 self.record('END TEST_NA', None, name, str(e))
mbligh7dd510c2007-11-13 17:11:22 +0000336 except Exception, e:
337 exc_info = sys.exc_info()
338 self.group_level -= 1
mbligh302482e2008-05-01 20:06:16 +0000339 err_msg = str(e) + '\n' + traceback.format_exc()
mbligh51144e02007-11-20 20:38:18 +0000340 self.record('END FAIL', None, name, err_msg)
mbligh7dd510c2007-11-13 17:11:22 +0000341
342 return result, exc_info
apw0865f482006-03-30 18:50:19 +0000343
mblighd7fb4a62006-10-01 00:57:53 +0000344
apw1da244b2007-09-27 17:18:01 +0000345 def run_group(self, function, *args, **dargs):
mbligh88ab90f2007-08-29 15:52:49 +0000346 """\
347 function:
348 subroutine to run
349 *args:
350 arguments for the function
351 """
352
mbligh7dd510c2007-11-13 17:11:22 +0000353 # Allow the tag for the group to be specified
mbligh88ab90f2007-08-29 15:52:49 +0000354 name = function.__name__
mbligh7dd510c2007-11-13 17:11:22 +0000355 tag = dargs.pop('tag', None)
356 if tag:
357 name = tag
apw1da244b2007-09-27 17:18:01 +0000358
mbligh7dd510c2007-11-13 17:11:22 +0000359 result, exc_info = self.__rungroup(name, function,
360 *args, **dargs)
apw1da244b2007-09-27 17:18:01 +0000361
mbligh7dd510c2007-11-13 17:11:22 +0000362 # if there was a non-TestError exception, raise it
mbligh302482e2008-05-01 20:06:16 +0000363 if exc_info and not isinstance(exc_info[1], error.TestError):
mbligh7dd510c2007-11-13 17:11:22 +0000364 err = ''.join(traceback.format_exception(*exc_info))
mbligh302482e2008-05-01 20:06:16 +0000365 raise error.TestError(name + ' failed\n' + err)
mbligh88ab90f2007-08-29 15:52:49 +0000366
mbligh7dd510c2007-11-13 17:11:22 +0000367 # pass back the actual return value from the function
apw08403ca2007-09-27 17:17:22 +0000368 return result
369
mbligh88ab90f2007-08-29 15:52:49 +0000370
mbligh1fc7ba12008-03-31 17:50:53 +0000371 def new_container(self, mbytes=None, cpus=None, root='', name=None):
mbligh6ca0d6a2008-03-03 16:22:13 +0000372 if not grep('cpuset', '/proc/filesystems'):
mbligh68119582008-01-25 18:16:41 +0000373 print "Containers not enabled by latest reboot"
374 return # containers weren't enabled in this kernel boot
375 pid = os.getpid()
mbligh68119582008-01-25 18:16:41 +0000376 if not name:
377 name = 'test%d' % pid # make arbitrary unique name
378 self.container = cpuset.cpuset(name, job_size=mbytes,
mbligh337bb762008-04-16 21:23:10 +0000379 job_pid=pid, cpus=cpus, root=root)
mbligh68119582008-01-25 18:16:41 +0000380 # This job's python shell is now running in the new container
381 # and all forked test processes will inherit that container
382
383
384 def release_container(self):
385 if self.container:
mbligh337bb762008-04-16 21:23:10 +0000386 self.container.release()
mbligh68119582008-01-25 18:16:41 +0000387 self.container = None
388
389
390 def cpu_count(self):
391 if self.container:
392 return len(self.container.cpus)
393 return count_cpus() # use total system count
394
395
apwce73d892007-09-25 16:53:05 +0000396 # Check the passed kernel identifier against the command line
397 # and the running kernel, abort the job on missmatch.
mbligh38a4a112008-03-19 13:11:34 +0000398 def kernel_check_ident(self, expected_when, expected_id, subdir,
399 type = 'src'):
400 print (("POST BOOT: checking booted kernel " +
401 "mark=%d identity='%s' type='%s'") %
402 (expected_when, expected_id, type))
apwce73d892007-09-25 16:53:05 +0000403
404 running_id = running_os_ident()
405
406 cmdline = read_one_line("/proc/cmdline")
407
408 find_sum = re.compile(r'.*IDENT=(\d+)')
409 m = find_sum.match(cmdline)
410 cmdline_when = -1
411 if m:
412 cmdline_when = int(m.groups()[0])
413
414 # We have all the facts, see if they indicate we
415 # booted the requested kernel or not.
416 bad = False
mblighda0311e2007-10-25 16:03:33 +0000417 if (type == 'src' and expected_id != running_id or
418 type == 'rpm' and not running_id.startswith(expected_id + '::')):
apwce73d892007-09-25 16:53:05 +0000419 print "check_kernel_ident: kernel identifier mismatch"
420 bad = True
421 if expected_when != cmdline_when:
422 print "check_kernel_ident: kernel command line mismatch"
423 bad = True
424
425 if bad:
426 print " Expected Ident: " + expected_id
427 print " Running Ident: " + running_id
428 print " Expected Mark: %d" % (expected_when)
429 print "Command Line Mark: %d" % (cmdline_when)
430 print " Command Line: " + cmdline
431
mbligh302482e2008-05-01 20:06:16 +0000432 raise error.JobError("boot failure", "reboot.verify")
apwce73d892007-09-25 16:53:05 +0000433
mblighb7fd2702008-03-25 14:57:08 +0000434 self.record('GOOD', subdir, 'reboot.verify', expected_id)
apwce73d892007-09-25 16:53:05 +0000435
436
mblighc2359852007-08-28 18:11:48 +0000437 def filesystem(self, device, mountpoint = None, loop_size = 0):
mblighd7fb4a62006-10-01 00:57:53 +0000438 if not mountpoint:
439 mountpoint = self.tmpdir
mblighc2359852007-08-28 18:11:48 +0000440 return filesystem.filesystem(self, device, mountpoint,loop_size)
mblighd7fb4a62006-10-01 00:57:53 +0000441
mblighcaa62c22008-04-07 21:51:17 +0000442
443 def enable_external_logging(self):
444 pass
445
446
447 def disable_external_logging(self):
448 pass
449
450
451 def reboot_setup(self):
452 pass
453
mblighcaa605c2006-10-02 00:37:35 +0000454
455 def reboot(self, tag='autotest'):
mblighcaa62c22008-04-07 21:51:17 +0000456 self.reboot_setup()
mbligh30270302007-11-05 20:33:52 +0000457 self.record('GOOD', None, 'reboot.start')
apwde1503a2006-10-10 08:34:21 +0000458 self.harness.run_reboot()
apw11985b72007-10-04 15:44:47 +0000459 default = self.config_get('boot.set_default')
460 if default:
461 self.bootloader.set_default(tag)
462 else:
463 self.bootloader.boot_once(tag)
mbligh302482e2008-05-01 20:06:16 +0000464 cmd = "(sleep 5; reboot) </dev/null >/dev/null 2>&1 &"
465 autotest_utils.system(cmd)
apw0778a2f2006-10-06 03:11:40 +0000466 self.quit()
mblighcaa605c2006-10-02 00:37:35 +0000467
468
apw0865f482006-03-30 18:50:19 +0000469 def noop(self, text):
470 print "job: noop: " + text
471
mblighcaa605c2006-10-02 00:37:35 +0000472
mblighc86b0b42006-07-28 17:35:28 +0000473 def parallel(self, *tasklist):
474 """Run tasks in parallel"""
apw8fef4ac2006-10-10 22:53:37 +0000475
476 pids = []
mblighd528d302007-12-19 16:19:05 +0000477 old_log_filename = self.log_filename
478 for i, task in enumerate(tasklist):
479 self.log_filename = old_log_filename + (".%d" % i)
480 task_func = lambda: task[0](*task[1:])
mbligh302482e2008-05-01 20:06:16 +0000481 pids.append(parallel.fork_start(self.resultdir,
482 task_func))
mblighd528d302007-12-19 16:19:05 +0000483
484 old_log_path = os.path.join(self.resultdir, old_log_filename)
485 old_log = open(old_log_path, "a")
mblighd509b712008-01-14 17:41:25 +0000486 exceptions = []
mblighd528d302007-12-19 16:19:05 +0000487 for i, pid in enumerate(pids):
488 # wait for the task to finish
mblighd509b712008-01-14 17:41:25 +0000489 try:
mbligh302482e2008-05-01 20:06:16 +0000490 parallel.fork_waitfor(self.resultdir, pid)
mblighd509b712008-01-14 17:41:25 +0000491 except Exception, e:
492 exceptions.append(e)
mblighd528d302007-12-19 16:19:05 +0000493 # copy the logs from the subtask into the main log
494 new_log_path = old_log_path + (".%d" % i)
495 if os.path.exists(new_log_path):
496 new_log = open(new_log_path)
497 old_log.write(new_log.read())
498 new_log.close()
499 old_log.flush()
500 os.remove(new_log_path)
501 old_log.close()
502
503 self.log_filename = old_log_filename
apw0865f482006-03-30 18:50:19 +0000504
mblighd509b712008-01-14 17:41:25 +0000505 # handle any exceptions raised by the parallel tasks
506 if exceptions:
507 msg = "%d task(s) failed" % len(exceptions)
mbligh302482e2008-05-01 20:06:16 +0000508 raise error.JobError(msg, str(exceptions), exceptions)
mblighd509b712008-01-14 17:41:25 +0000509
mblighcaa605c2006-10-02 00:37:35 +0000510
apw0865f482006-03-30 18:50:19 +0000511 def quit(self):
mblighc86b0b42006-07-28 17:35:28 +0000512 # XXX: should have a better name.
apwde1503a2006-10-10 08:34:21 +0000513 self.harness.run_pause()
mbligh302482e2008-05-01 20:06:16 +0000514 raise error.JobContinue("more to come")
apw0865f482006-03-30 18:50:19 +0000515
mblighcaa605c2006-10-02 00:37:35 +0000516
apw0865f482006-03-30 18:50:19 +0000517 def complete(self, status):
mblighc86b0b42006-07-28 17:35:28 +0000518 """Clean up and exit"""
apw0865f482006-03-30 18:50:19 +0000519 # We are about to exit 'complete' so clean up the control file.
520 try:
mbligh366ff1b2008-04-25 16:07:56 +0000521 os.unlink(self.state_file)
apw0865f482006-03-30 18:50:19 +0000522 except:
523 pass
mblighc0b10d32008-03-03 16:03:28 +0000524
mbligh61a6c1a2006-12-25 01:26:38 +0000525 self.harness.run_complete()
mblighcaa62c22008-04-07 21:51:17 +0000526 self.disable_external_logging()
apw1b021902006-04-03 17:02:56 +0000527 sys.exit(status)
apw0865f482006-03-30 18:50:19 +0000528
mblighcaa605c2006-10-02 00:37:35 +0000529
mbligh366ff1b2008-04-25 16:07:56 +0000530 def set_state(self, var, val):
531 # Deep copies make sure that the state can't be altered
532 # without it being re-written. Perf wise, deep copies
533 # are overshadowed by pickling/loading.
534 self.state[var] = copy.deepcopy(val)
535 pickle.dump(self.state, open(self.state_file, 'w'))
536
537
538 def __load_state(self):
539 assert(self.state == None)
540 try:
541 self.state = pickle.load(open(self.state_file, 'r'))
542 return True
543 except Exception:
544 print "Initializing the state engine."
545 self.state = {}
mblighf1ae0a42008-04-25 16:09:20 +0000546 self.set_state('__steps', []) # writes pickle file
mbligh366ff1b2008-04-25 16:07:56 +0000547 return False
548
549
550 def get_state(self, var, default=None):
551 if var in self.state or default == None:
552 val = self.state[var]
553 else:
554 val = default
555 return copy.deepcopy(val)
556
557
mbligh12a04cb2008-04-25 16:07:20 +0000558 def __create_step_tuple(self, fn, args, dargs):
559 # Legacy code passes in an array where the first arg is
560 # the function or its name.
561 if isinstance(fn, list):
562 assert(len(args) == 0)
563 assert(len(dargs) == 0)
564 args = fn[1:]
565 fn = fn[0]
566 # Pickling actual functions is harry, thus we have to call
567 # them by name. Unfortunately, this means only functions
568 # defined globally can be used as a next step.
569 if isinstance(fn, types.FunctionType):
570 fn = fn.__name__
571 if not isinstance(fn, types.StringTypes):
572 raise StepError("Next steps must be functions or "
573 "strings containing the function name")
574 return (fn, args, dargs)
575
576
mbligh12a04cb2008-04-25 16:07:20 +0000577 def next_step(self, fn, *args, **dargs):
mblighc86b0b42006-07-28 17:35:28 +0000578 """Define the next step"""
mblighf1ae0a42008-04-25 16:09:20 +0000579 steps = self.get_state('__steps')
mbligh366ff1b2008-04-25 16:07:56 +0000580 steps.append(self.__create_step_tuple(fn, args, dargs))
mblighf1ae0a42008-04-25 16:09:20 +0000581 self.set_state('__steps', steps)
apw0865f482006-03-30 18:50:19 +0000582
mblighcaa605c2006-10-02 00:37:35 +0000583
mbligh12a04cb2008-04-25 16:07:20 +0000584 def next_step_prepend(self, fn, *args, **dargs):
mbligh237bed32007-09-05 13:05:57 +0000585 """Insert a new step, executing first"""
mblighf1ae0a42008-04-25 16:09:20 +0000586 steps = self.get_state('__steps')
mbligh366ff1b2008-04-25 16:07:56 +0000587 steps.insert(0, self.__create_step_tuple(fn, args, dargs))
mblighf1ae0a42008-04-25 16:09:20 +0000588 self.set_state('__steps', steps)
mbligh237bed32007-09-05 13:05:57 +0000589
590
apw83f8d772006-04-27 14:12:56 +0000591 def step_engine(self):
mblighc86b0b42006-07-28 17:35:28 +0000592 """the stepping engine -- if the control file defines
593 step_init we will be using this engine to drive multiple runs.
594 """
595 """Do the next step"""
apw83f8d772006-04-27 14:12:56 +0000596
mbligh366ff1b2008-04-25 16:07:56 +0000597 # Set up the environment and then interpret the control file.
598 # Some control files will have code outside of functions,
599 # which means we need to have our state engine initialized
600 # before reading in the file.
601 state_existed = self.__load_state()
602 lcl = {'job': self}
603 exec(JOB_PREAMBLE, lcl, lcl)
apw83f8d772006-04-27 14:12:56 +0000604 execfile(self.control, lcl, lcl)
605
mbligh366ff1b2008-04-25 16:07:56 +0000606 # If we loaded in a mid-job state file, then we presumably
607 # know what steps we have yet to run.
608 if not state_existed:
apw83f8d772006-04-27 14:12:56 +0000609 if lcl.has_key('step_init'):
610 self.next_step([lcl['step_init']])
apw0865f482006-03-30 18:50:19 +0000611
mbligh366ff1b2008-04-25 16:07:56 +0000612 # Iterate through the steps. If we reboot, we'll simply
613 # continue iterating on the next step.
mblighf1ae0a42008-04-25 16:09:20 +0000614 while len(self.get_state('__steps')) > 0:
615 steps = self.get_state('__steps')
mbligh366ff1b2008-04-25 16:07:56 +0000616 (fn, args, dargs) = steps.pop(0)
mblighf1ae0a42008-04-25 16:09:20 +0000617 self.set_state('__steps', steps)
apw0865f482006-03-30 18:50:19 +0000618
mbligh12a04cb2008-04-25 16:07:20 +0000619 lcl['__args'] = args
620 lcl['__dargs'] = dargs
621 exec(fn + "(*__args, **__dargs)", lcl, lcl)
apw0865f482006-03-30 18:50:19 +0000622
mblighcaa605c2006-10-02 00:37:35 +0000623
mbligh09f288a2007-09-18 21:34:57 +0000624 def record(self, status_code, subdir, operation, status = ''):
625 """
626 Record job-level status
apw7db8d0b2006-10-09 08:10:25 +0000627
mbligh09f288a2007-09-18 21:34:57 +0000628 The intent is to make this file both machine parseable and
629 human readable. That involves a little more complexity, but
630 really isn't all that bad ;-)
631
632 Format is <status code>\t<subdir>\t<operation>\t<status>
633
634 status code: (GOOD|WARN|FAIL|ABORT)
635 or START
636 or END (GOOD|WARN|FAIL|ABORT)
637
638 subdir: MUST be a relevant subdirectory in the results,
639 or None, which will be represented as '----'
640
641 operation: description of what you ran (e.g. "dbench", or
642 "mkfs -t foobar /dev/sda9")
643
644 status: error message or "completed sucessfully"
645
646 ------------------------------------------------------------
647
648 Initial tabs indicate indent levels for grouping, and is
mbligh7dd510c2007-11-13 17:11:22 +0000649 governed by self.group_level
mbligh09f288a2007-09-18 21:34:57 +0000650
651 multiline messages have secondary lines prefaced by a double
652 space (' ')
653 """
654
mblighb0570ad2007-09-19 18:18:11 +0000655 if subdir:
656 if re.match(r'[\n\t]', subdir):
mbligh642b03e2008-01-14 16:53:15 +0000657 raise ValueError("Invalid character in subdir string")
mblighb0570ad2007-09-19 18:18:11 +0000658 substr = subdir
659 else:
660 substr = '----'
mbligh09f288a2007-09-18 21:34:57 +0000661
mbligh302482e2008-05-01 20:06:16 +0000662 if not logging.is_valid_status(status_code):
mbligh642b03e2008-01-14 16:53:15 +0000663 raise ValueError("Invalid status code supplied: %s" % status_code)
mbligh9c5ac322007-10-31 18:01:59 +0000664 if not operation:
665 operation = '----'
mbligh09f288a2007-09-18 21:34:57 +0000666 if re.match(r'[\n\t]', operation):
mbligh642b03e2008-01-14 16:53:15 +0000667 raise ValueError("Invalid character in operation string")
mbligh09f288a2007-09-18 21:34:57 +0000668 operation = operation.rstrip()
669 status = status.rstrip()
670 status = re.sub(r"\t", " ", status)
apw7db8d0b2006-10-09 08:10:25 +0000671 # Ensure any continuation lines are marked so we can
672 # detect them in the status file to ensure it is parsable.
mbligh7dd510c2007-11-13 17:11:22 +0000673 status = re.sub(r"\n", "\n" + "\t" * self.group_level + " ", status)
mbligh09f288a2007-09-18 21:34:57 +0000674
mbligh30270302007-11-05 20:33:52 +0000675 # Generate timestamps for inclusion in the logs
676 epoch_time = int(time.time()) # seconds since epoch, in UTC
677 local_time = time.localtime(epoch_time)
678 epoch_time_str = "timestamp=%d" % (epoch_time,)
679 local_time_str = time.strftime("localtime=%b %d %H:%M:%S",
680 local_time)
681
682 msg = '\t'.join(str(x) for x in (status_code, substr, operation,
683 epoch_time_str, local_time_str,
684 status))
mbligh7dd510c2007-11-13 17:11:22 +0000685 msg = '\t' * self.group_level + msg
apw7db8d0b2006-10-09 08:10:25 +0000686
mblighd528d302007-12-19 16:19:05 +0000687 msg_tag = ""
688 if "." in self.log_filename:
689 msg_tag = self.log_filename.split(".", 1)[1]
690
691 self.harness.test_status_detail(status_code, substr, operation,
692 status, msg_tag)
693 self.harness.test_status(msg, msg_tag)
694
695 # log to stdout (if enabled)
696 #if self.log_filename == self.DEFAULT_LOG_FILENAME:
apwf1a81162006-04-25 10:10:29 +0000697 print msg
mblighd528d302007-12-19 16:19:05 +0000698
699 # log to the "root" status log
700 status_file = os.path.join(self.resultdir, self.log_filename)
mbligh7dd510c2007-11-13 17:11:22 +0000701 open(status_file, "a").write(msg + "\n")
mblighd528d302007-12-19 16:19:05 +0000702
703 # log to the subdir status log (if subdir is set)
mblighb0570ad2007-09-19 18:18:11 +0000704 if subdir:
mblighadff6ca2008-01-22 16:38:25 +0000705 dir = os.path.join(self.resultdir, subdir)
706 if not os.path.exists(dir):
707 os.mkdir(dir)
708
709 status_file = os.path.join(dir,
mblighd528d302007-12-19 16:19:05 +0000710 self.DEFAULT_LOG_FILENAME)
mblighb0570ad2007-09-19 18:18:11 +0000711 open(status_file, "a").write(msg + "\n")
apwce9abe92006-04-27 14:14:04 +0000712
713
mblighcaa62c22008-04-07 21:51:17 +0000714def runjob(control, cont = False, tag = "default", harness_type = '',
715 use_external_logging = False):
mblighc86b0b42006-07-28 17:35:28 +0000716 """The main interface to this module
717
mbligh72b88fc2006-12-16 18:41:35 +0000718 control
mblighc86b0b42006-07-28 17:35:28 +0000719 The control file to use for this job.
720 cont
721 Whether this is the continuation of a previously started job
722 """
mblighb4eef242007-07-23 18:22:49 +0000723 control = os.path.abspath(control)
apwce9abe92006-04-27 14:14:04 +0000724 state = control + '.state'
725
726 # instantiate the job object ready for the control file.
727 myjob = None
728 try:
729 # Check that the control file is valid
730 if not os.path.exists(control):
mbligh302482e2008-05-01 20:06:16 +0000731 raise error.JobError(control +
732 ": control file not found")
apwce9abe92006-04-27 14:14:04 +0000733
734 # When continuing, the job is complete when there is no
735 # state file, ensure we don't try and continue.
mblighf3fef462006-09-13 16:05:05 +0000736 if cont and not os.path.exists(state):
mbligh302482e2008-05-01 20:06:16 +0000737 raise error.JobComplete("all done")
mblighf3fef462006-09-13 16:05:05 +0000738 if cont == False and os.path.exists(state):
apwce9abe92006-04-27 14:14:04 +0000739 os.unlink(state)
740
mblighcaa62c22008-04-07 21:51:17 +0000741 myjob = job(control, tag, cont, harness_type,
742 use_external_logging)
apwce9abe92006-04-27 14:14:04 +0000743
744 # Load in the users control file, may do any one of:
745 # 1) execute in toto
746 # 2) define steps, and select the first via next_step()
747 myjob.step_engine()
748
mbligh302482e2008-05-01 20:06:16 +0000749 except error.JobContinue:
apwce9abe92006-04-27 14:14:04 +0000750 sys.exit(5)
751
mbligh302482e2008-05-01 20:06:16 +0000752 except error.JobComplete:
apwb832e1b2007-11-24 20:24:38 +0000753 sys.exit(1)
754
mbligh302482e2008-05-01 20:06:16 +0000755 except error.JobError, instance:
apwce9abe92006-04-27 14:14:04 +0000756 print "JOB ERROR: " + instance.args[0]
mbligh9c5ac322007-10-31 18:01:59 +0000757 if myjob:
mbligh30270302007-11-05 20:33:52 +0000758 command = None
759 if len(instance.args) > 1:
760 command = instance.args[1]
mblighc3430162007-11-14 23:57:19 +0000761 myjob.group_level = 0
mbligh30270302007-11-05 20:33:52 +0000762 myjob.record('ABORT', None, command, instance.args[0])
mblighc3430162007-11-14 23:57:19 +0000763 myjob.record('END ABORT', None, None)
apwce9abe92006-04-27 14:14:04 +0000764 myjob.complete(1)
apwb832e1b2007-11-24 20:24:38 +0000765 else:
766 sys.exit(1)
apwce9abe92006-04-27 14:14:04 +0000767
mblighc3430162007-11-14 23:57:19 +0000768 except Exception, e:
mbligh302482e2008-05-01 20:06:16 +0000769 msg = str(e) + '\n' + traceback.format_exc()
mblighc3430162007-11-14 23:57:19 +0000770 print "JOB ERROR: " + msg
mblighfbfb77d2007-02-15 18:54:03 +0000771 if myjob:
mblighc3430162007-11-14 23:57:19 +0000772 myjob.group_level = 0
773 myjob.record('ABORT', None, None, msg)
774 myjob.record('END ABORT', None, None)
mbligh9c5ac322007-10-31 18:01:59 +0000775 myjob.complete(1)
apwb832e1b2007-11-24 20:24:38 +0000776 else:
777 sys.exit(1)
mbligh892d37f2007-03-01 17:03:25 +0000778
mbligh0144e5a2008-03-07 18:17:53 +0000779 # If we get here, then we assume the job is complete and good.
780 myjob.group_level = 0
781 myjob.record('END GOOD', None, None)
782
mbligh892d37f2007-03-01 17:03:25 +0000783 myjob.complete(0)
mblighcaa62c22008-04-07 21:51:17 +0000784
785
# site_job.py may be non-existent or empty, make sure that an appropriate
# site_job class is created nevertheless.  The from-import raises
# ImportError both when the module cannot be found and when it does not
# define a site_job name, so either case falls back to a trivial subclass
# of base_job that adds nothing.
try:
    from site_job import site_job
except ImportError:
    class site_job(base_job):
        pass
793
class job(site_job):
    """The job class instantiated by runjob().

    Defines nothing of its own; all behaviour is inherited from site_job.
    """