blob: d7b2bbaef10b6cab326084a04f83a0f97ed77fd5 [file] [log] [blame]
mblighc86b0b42006-07-28 17:35:28 +00001"""The main job wrapper
mbligha2508052006-05-28 21:29:53 +00002
mblighc86b0b42006-07-28 17:35:28 +00003This is the core infrastructure.
4"""
5
6__author__ = """Copyright Andy Whitcroft, Martin J. Bligh 2006"""
mbligha2508052006-05-28 21:29:53 +00007
mbligh8f243ec2006-10-10 05:55:49 +00008# standard stuff
mbligh7dd510c2007-11-13 17:11:22 +00009import os, sys, re, pickle, shutil, time, traceback
mbligh8f243ec2006-10-10 05:55:49 +000010# autotest stuff
mblighf4c35322006-03-13 01:01:10 +000011from autotest_utils import *
apw8fef4ac2006-10-10 22:53:37 +000012from parallel import *
mbligh9c5ac322007-10-31 18:01:59 +000013from error import *
mbligh8baa2ea2006-12-17 23:01:24 +000014import kernel, xen, test, profilers, barrier, filesystem, fd_stack, boottool
apw059e1b12006-10-12 17:18:26 +000015import harness, config
mbligh83ac9942007-11-05 18:59:37 +000016import sysinfo
mblighf4c35322006-03-13 01:01:10 +000017
18class job:
mblighc86b0b42006-07-28 17:35:28 +000019 """The actual job against which we do everything.
20
21 Properties:
mbligh72b88fc2006-12-16 18:41:35 +000022 autodir
mblighc86b0b42006-07-28 17:35:28 +000023 The top level autotest directory (/usr/local/autotest).
24 Comes from os.environ['AUTODIR'].
mbligh72b88fc2006-12-16 18:41:35 +000025 bindir
mblighc86b0b42006-07-28 17:35:28 +000026 <autodir>/bin/
mbligh72b88fc2006-12-16 18:41:35 +000027 testdir
mblighc86b0b42006-07-28 17:35:28 +000028 <autodir>/tests/
29 profdir
30 <autodir>/profilers/
31 tmpdir
32 <autodir>/tmp/
33 resultdir
34 <autodir>/results/<jobtag>
35 stdout
36 fd_stack object for stdout
37 stderr
38 fd_stack object for stderr
39 profilers
40 the profilers object for this job
apw504a7dd2006-10-12 17:18:37 +000041 harness
42 the server harness object for this job
apw059e1b12006-10-12 17:18:26 +000043 config
44 the job configuration for this job
mblighc86b0b42006-07-28 17:35:28 +000045 """
46
def __init__(self, control, jobtag, cont, harness_type=None):
    """Lay out the job directories and build the helper objects.

    control
        The control file (pathname of)
    jobtag
        The job tag string (eg "default"); names the directory
        created under <autodir>/results/
    cont
        If this is the continuation of this job.  Only a fresh
        (non-continued) job wipes and recreates the tmp, download
        and result directories and notifies the harness of a start.
    harness_type
        An alternative server harness
    """
    autodir = os.environ['AUTODIR']
    self.autodir = autodir
    self.bindir = os.path.join(autodir, 'bin')
    self.testdir = os.path.join(autodir, 'tests')
    self.profdir = os.path.join(autodir, 'profilers')
    self.tmpdir = os.path.join(autodir, 'tmp')
    self.resultdir = os.path.join(autodir, 'results', jobtag)

    fresh_start = not cont
    if fresh_start:
        # tmp may still be a mount point from an earlier run, so try
        # to unmount it (ignoring failure) before removing it.
        if os.path.exists(self.tmpdir):
            unmount = 'umount -f %s > /dev/null 2> /dev/null' % self.tmpdir
            system(unmount, ignorestatus=True)
            system('rm -rf ' + self.tmpdir)
        os.mkdir(self.tmpdir)

        results_root = os.path.join(self.autodir, 'results')
        if not os.path.exists(results_root):
            os.mkdir(results_root)

        download_dir = os.path.join(self.testdir, 'download')
        if os.path.exists(download_dir):
            system('rm -rf ' + download_dir)
        os.mkdir(download_dir)

        if os.path.exists(self.resultdir):
            system('rm -rf ' + self.resultdir)
        os.mkdir(self.resultdir)

        for leaf in ('debug', 'analysis', 'sysinfo'):
            os.mkdir(os.path.join(self.resultdir, leaf))

        # Keep a copy of the control file next to the results.
        shutil.copyfile(control, os.path.join(self.resultdir, 'control'))

    self.control = control
    self.jobtag = jobtag

    self.stdout = fd_stack.fd_stack(1, sys.stdout)
    self.stderr = fd_stack.fd_stack(2, sys.stderr)
    self.group_level = 0

    self.config = config.config(self)
    self.harness = harness.select(harness_type, self)
    self.profilers = profilers.profilers(self)

    # Best effort: if the boottool cannot be set up the job simply has
    # no self.bootloader attribute.
    try:
        boottool_path = self.config_get('boottool.executable')
        self.bootloader = boottool.boottool(boottool_path)
    except:
        pass

    # log "before each step" sysinfo
    start_dir = os.getcwd()
    try:
        os.chdir(os.path.join(self.resultdir, 'sysinfo'))
        sysinfo.before_each_step()
    finally:
        # always return to where we started
        os.chdir(start_dir)

    if fresh_start:
        self.harness.run_start()
apw357f50f2006-12-01 11:22:39 +0000120
mbligh0692e472007-08-30 16:07:53 +0000121
def relative_path(self, path):
    """\
    Return a path relative to the job results directory

    The leading len(self.resultdir) characters and the single
    separator that follows them are dropped; path is not checked
    to actually start with the results directory.
    """
    below_results = path[len(self.resultdir):]
    # remove the / inbetween
    return below_results[1:]
mbligh0692e472007-08-30 16:07:53 +0000128
129
def control_get(self):
    """Return the control file pathname stored on this job."""
    return getattr(self, 'control')
132
mblighcaa605c2006-10-02 00:37:35 +0000133
def harness_select(self, which):
    """Replace this job's harness with the one harness.select() picks.

    which
        harness name handed to harness.select()
    """
    chosen = harness.select(which, self)
    self.harness = chosen
136
137
def config_set(self, name, value):
    """Store value under name in the job configuration object."""
    store = self.config.set
    store(name, value)
140
141
def config_get(self, name):
    """Return whatever the job configuration object holds for name."""
    lookup = self.config.get
    return lookup(name)
144
def setup_dirs(self, results_dir, tmp_dir):
    """Pick (and create if needed) the build results and temp dirs.

    results_dir
        directory for build results; when empty a fresh
        <resultdir>/build, build.2, build.3, ... is chosen
    tmp_dir
        scratch directory; when empty <tmpdir>/build is used

    Returns the tuple (results_dir, tmp_dir) actually used.
    Raises ValueError if tmp_dir exists but is not a directory.
    """
    if not tmp_dir:
        tmp_dir = os.path.join(self.tmpdir, 'build')
    if not os.path.exists(tmp_dir):
        os.mkdir(tmp_dir)
    if not os.path.isdir(tmp_dir):
        # Report the path that was actually checked, and raise a real
        # exception class (string exceptions cannot be raised on
        # current interpreters).
        raise ValueError("Temp dir (%s) is not a dir - args backwards?"
                         % tmp_dir)

    # We label the first build "build" and then subsequent ones
    # as "build.2", "build.3", etc. Whilst this is a little bit
    # inconsistent, 99.9% of jobs will only have one build
    # (that's not done as kernbench, sparse, or buildtest),
    # so it works out much cleaner. One of life's compromises.
    if not results_dir:
        results_dir = os.path.join(self.resultdir, 'build')
        i = 2
        while os.path.exists(results_dir):
            results_dir = os.path.join(self.resultdir, 'build.%d' % i)
            i += 1
    if not os.path.exists(results_dir):
        os.mkdir(results_dir)

    return (results_dir, tmp_dir)
169
170
def xen(self, base_tree, results_dir = '', tmp_dir = '', leave = False, \
        kjob = None ):
    """Summon a xen object

    The results and temp directories are first resolved through
    setup_dirs(); the build directory name is always 'xen'.
    """
    resolved = self.setup_dirs(results_dir, tmp_dir)
    results_dir, tmp_dir = resolved
    return xen.xen(self, base_tree, results_dir, tmp_dir, 'xen', leave, kjob)
177
178
def kernel(self, base_tree, results_dir = '', tmp_dir = '', leave = False):
    """Summon a kernel object

    A base_tree ending in '.rpm' yields kernel.rpm_kernel; anything
    else yields a kernel.kernel built in the 'linux' build directory.
    The directories are resolved through setup_dirs() either way.
    """
    results_dir, tmp_dir = self.setup_dirs(results_dir, tmp_dir)
    wants_rpm = base_tree.endswith('.rpm')
    if not wants_rpm:
        return kernel.kernel(self, base_tree, results_dir, tmp_dir,
                             'linux', leave)
    return kernel.rpm_kernel(self, base_tree, results_dir)
mblighf4c35322006-03-13 01:01:10 +0000186
mblighcaa605c2006-10-02 00:37:35 +0000187
def barrier(self, *args):
    """Create a barrier object

    All positional arguments are forwarded unchanged to
    barrier.barrier().
    """
    make_barrier = barrier.barrier
    return make_barrier(*args)
191
mblighcaa605c2006-10-02 00:37:35 +0000192
def setup_dep(self, deps):
    """Set up the dependencies for this test.

    deps is a list of libraries required for this test.

    For each entry the working directory is changed to
    <autodir>/deps/<dep> and ./<dep>.py is run there; the working
    directory is not restored afterwards.  Any failure is reported
    as an UnhandledError naming the dependency.
    """
    for dep in deps:
        try:
            dep_dir = os.path.join(self.autodir, 'deps', dep)
            os.chdir(dep_dir)
            system(''.join(('./', dep, '.py')))
        except:
            raise UnhandledError("setting up dependency " + dep + "\n")
mbligh4b089662006-06-14 22:34:58 +0000205
206
def __runtest(self, url, tag, args, dargs):
    """Run one test through fork_start() and wait for it.

    url, tag, args, dargs
        handed unchanged to test.runtest()

    AutotestError exceptions propagate untouched; anything else is
    converted to an UnhandledError that names the test url.
    """
    try:
        run_in_child = lambda : test.runtest(self, url, tag, args, dargs)
        pid = fork_start(self.resultdir, run_in_child)
        fork_waitfor(self.resultdir, pid)
    except AutotestError:
        raise
    except:
        # Name the test that failed; self here is the job, so its
        # class name says nothing about which test was running.
        raise UnhandledError('running test ' + str(url) + "\n")
apwf1a81162006-04-25 10:10:29 +0000217
mblighcaa605c2006-10-02 00:37:35 +0000218
mblighd016ecc2006-11-25 21:41:07 +0000219 def run_test(self, url, *args, **dargs):
mblighc86b0b42006-07-28 17:35:28 +0000220 """Summon a test object and run it.
221
222 tag
223 tag to add to testname
mbligh12a7df72006-10-06 03:54:33 +0000224 url
225 url of the test to run
mblighc86b0b42006-07-28 17:35:28 +0000226 """
mbligh12a7df72006-10-06 03:54:33 +0000227
mblighd016ecc2006-11-25 21:41:07 +0000228 if not url:
229 raise "Test name is invalid. Switched arguments?"
mbligh09f288a2007-09-18 21:34:57 +0000230 (group, testname) = test.testname(url)
mbligh7dd510c2007-11-13 17:11:22 +0000231 tag = dargs.pop('tag', None)
mbligh09f288a2007-09-18 21:34:57 +0000232 subdir = testname
mbligh7dd510c2007-11-13 17:11:22 +0000233 if tag:
234 subdir += '.' + tag
235
236 def group_func():
apwf1a81162006-04-25 10:10:29 +0000237 try:
mblighd016ecc2006-11-25 21:41:07 +0000238 self.__runtest(url, tag, args, dargs)
apwf1a81162006-04-25 10:10:29 +0000239 except Exception, detail:
mbligh7dd510c2007-11-13 17:11:22 +0000240 self.record('FAIL', subdir, testname,
241 str(detail))
apwf1a81162006-04-25 10:10:29 +0000242 raise
243 else:
mbligh7dd510c2007-11-13 17:11:22 +0000244 self.record('GOOD', subdir, testname,
245 'completed successfully')
246 name = "test." + testname
247 result, exc_info = self.__rungroup(name, group_func)
248
249 if exc_info and isinstance(exc_info[1], TestError):
250 return False
251 elif exc_info:
252 raise exc_info[0], exc_info[1], exc_info[2]
apwf1a81162006-04-25 10:10:29 +0000253 else:
mbligh7dd510c2007-11-13 17:11:22 +0000254 return True
255
256
def __rungroup(self, name, function, *args, **dargs):
    """\
    Run function bracketed by START / END records in the status log.

    name:
            name of the group
    function:
            subroutine to run
    *args, **dargs:
            arguments for the function

    Returns a 2-tuple (result, exc_info) where result
    is the return value of function, and exc_info is
    the sys.exc_info() of the exception thrown by the
    function (which may be None).
    """

    result, exc_info = None, None
    try:
        self.record('START', None, name)
        self.group_level += 1
        try:
            result = function(*args, **dargs)
        finally:
            # Undo exactly the one increment made above, whether or
            # not the function raised, so the nesting level can never
            # drift if one of the record() calls itself fails.
            self.group_level -= 1
        self.record('END GOOD', None, name)
    except Exception:
        exc_info = sys.exc_info()
        self.record('END FAIL', None, name, format_error())

    return result, exc_info
apw0865f482006-03-30 18:50:19 +0000285
mblighd7fb4a62006-10-01 00:57:53 +0000286
def run_group(self, function, *args, **dargs):
    """\
    Run function as a named group in the status log.

    function:
            subroutine to run
    tag:
            (keyword argument) group name to use instead of
            function.__name__; removed before function is called
    *args, **dargs:
            arguments for the function

    Returns the return value of function.  A TestError raised by
    function has already been logged as END FAIL and is not
    propagated (the return value is then None); any other exception
    is re-raised as a TestError carrying the formatted traceback.
    """

    # Allow the tag for the group to be specified
    name = function.__name__
    tag = dargs.pop('tag', None)
    if tag:
        name = tag

    result, exc_info = self.__rungroup(name, function,
                                       *args, **dargs)

    # if there was a non-TestError exception, raise it
    if exc_info and not isinstance(exc_info[1], TestError):
        err = ''.join(traceback.format_exception(*exc_info))
        raise TestError(name + ' failed\n' + err)

    # pass back the actual return value from the function
    return result
311
mbligh88ab90f2007-08-29 15:52:49 +0000312
# Check the passed kernel identifier against the command line
# and the running kernel, abort the job on mismatch.
def kernel_check_ident(self, expected_when, expected_id, expected_cl, subdir, type = 'src'):
    """Verify that the kernel we booted is the one that was requested.

    expected_when
        mark expected as IDENT=<number> on /proc/cmdline
    expected_id
        identity compared with running_os_ident(); must be equal
        for type 'src', a prefix followed by '::' for type 'rpm'
    expected_cl
        changelist compared with the first run of 7+ digits in the
        second word of `uname -v`; skipped if either is missing
    subdir
        results subdirectory used for the GOOD record
    type
        'src' or 'rpm'

    Prints a report and raises JobError("boot failure",
    "reboot.verify") on any mismatch, otherwise records GOOD.
    """
    print("POST BOOT: checking booted kernel mark=%d identity='%s' changelist=%s type='%s'"
          % (expected_when, expected_id, expected_cl, type))

    running_id = running_os_ident()
    cmdline = read_one_line("/proc/cmdline")

    mark = re.match(r'.*IDENT=(\d+)', cmdline)
    if mark:
        cmdline_when = int(mark.group(1))
    else:
        cmdline_when = -1

    version_word = system_output('uname -v').split()[1]
    cl_found = re.search(r'\d{7,}', version_word)
    current_cl = None
    if cl_found:
        current_cl = cl_found.group()

    # We have all the facts, see if they indicate we
    # booted the requested kernel or not.
    if type == 'src':
        wrong_ident = expected_id != running_id
    elif type == 'rpm':
        wrong_ident = not running_id.startswith(expected_id + '::')
    else:
        wrong_ident = False

    bad = False
    if wrong_ident:
        print("check_kernel_ident: kernel identifier mismatch")
        bad = True
    if expected_when != cmdline_when:
        print("check_kernel_ident: kernel command line mismatch")
        bad = True
    if expected_cl and current_cl and str(expected_cl) != current_cl:
        print('check_kernel_ident: kernel changelist mismatch')
        bad = True

    if not bad:
        self.record('GOOD', subdir, 'reboot.verify')
        return

    print(" Expected Ident: " + expected_id)
    print(" Running Ident: " + running_id)
    print(" Expected Mark: %d" % (expected_when))
    print("Command Line Mark: %d" % (cmdline_when))
    print(" Expected P4 CL: %s" % expected_cl)
    print(" P4 CL: %s" % current_cl)
    print(" Command Line: " + cmdline)

    raise JobError("boot failure", "reboot.verify")
apwce73d892007-09-25 16:53:05 +0000362
363
def filesystem(self, device, mountpoint = None, loop_size = 0):
    """Summon a filesystem object for device.

    mountpoint
        where to mount it; the job tmp directory when not given
    loop_size
        passed through to filesystem.filesystem()
    """
    target = mountpoint or self.tmpdir
    return filesystem.filesystem(self, device, target, loop_size)
mblighd7fb4a62006-10-01 00:57:53 +0000368
mblighcaa605c2006-10-02 00:37:35 +0000369
def reboot(self, tag='autotest'):
    """Arrange to boot the bootloader entry tag and pause the job.

    The entry becomes the default when the 'boot.set_default'
    config value is set, otherwise it is selected for one boot
    only.  The reboot itself is launched in the background after a
    short sleep, then quit() raises to end this run of the job.
    """
    self.record('GOOD', None, 'reboot.start')
    self.harness.run_reboot()

    if self.config_get('boot.set_default'):
        arm_boot_entry = self.bootloader.set_default
    else:
        arm_boot_entry = self.bootloader.boot_once
    arm_boot_entry(tag)

    system("(sleep 5; reboot) </dev/null >/dev/null 2>&1 &")
    self.quit()
mblighcaa605c2006-10-02 00:37:35 +0000380
381
def noop(self, text):
    """Print text with a 'job: noop: ' prefix and do nothing else."""
    line = "job: noop: " + text
    print(line)
384
mblighcaa605c2006-10-02 00:37:35 +0000385
# Job control primitives.
mblighc86b0b42006-07-28 17:35:28 +0000387
def __parallel_execute(self, func, *args):
    """Call func with the given positional arguments; the result is
    discarded."""
    positional = tuple(args)
    func(*positional)
390
391
def parallel(self, *tasklist):
    """Run tasks in parallel

    Each task is a sequence whose first item is the function to
    call and whose remaining items are its arguments.  Every task
    is started through fork_start() before any of them is waited
    for with fork_waitfor().
    """
    children = [fork_start(self.resultdir,
                           lambda: self.__parallel_execute(*task))
                for task in tasklist]
    for child in children:
        fork_waitfor(self.resultdir, child)
apw0865f482006-03-30 18:50:19 +0000401
mblighcaa605c2006-10-02 00:37:35 +0000402
def quit(self):
    """Tell the harness the job is pausing, then raise JobContinue."""
    # XXX: should have a better name.
    notify_pause = self.harness.run_pause
    notify_pause()
    raise JobContinue("more to come")
apw0865f482006-03-30 18:50:19 +0000407
mblighcaa605c2006-10-02 00:37:35 +0000408
def complete(self, status):
    """Clean up and exit

    status
        process exit status handed to sys.exit()

    Removes the <control>.state file if there is one, tells the
    harness the run is complete and then exits the process.
    """
    # We are about to exit 'complete' so clean up the control file.
    state_file = self.control + '.state'
    try:
        os.unlink(state_file)
    except OSError:
        # No state file to remove (or it cannot be removed); either
        # way there is nothing more to clean up here.
        pass
    self.harness.run_complete()
    sys.exit(status)
apw0865f482006-03-30 18:50:19 +0000418
mblighcaa605c2006-10-02 00:37:35 +0000419
apw0865f482006-03-30 18:50:19 +0000420 steps = []
def next_step(self, step):
    """Define the next step

    step
        a list whose first item is the step function (or its name)
        and whose remaining items are its arguments.  A function is
        replaced in place by its __name__ so the list can be pickled.

    The step is appended to self.steps and the whole list is saved
    to <control>.state.
    """
    if not isinstance(step[0], basestring):
        step[0] = step[0].__name__
    self.steps.append(step)
    # Close the state file explicitly so the step list is on its way
    # to disk before we return; a reboot may follow shortly.
    state_file = open(self.control + '.state', 'wb')
    try:
        pickle.dump(self.steps, state_file)
    finally:
        state_file.close()
apw0865f482006-03-30 18:50:19 +0000427
mblighcaa605c2006-10-02 00:37:35 +0000428
def next_step_prepend(self, step):
    """Insert a new step, executing first

    step
        a list whose first item is the step function (or its name)
        and whose remaining items are its arguments.  A function is
        replaced in place by its __name__ so the list can be pickled.

    The step is inserted at the front of self.steps and the whole
    list is saved to <control>.state.
    """
    if not isinstance(step[0], basestring):
        step[0] = step[0].__name__
    self.steps.insert(0, step)
    # Close the state file explicitly so the step list is on its way
    # to disk before we return; a reboot may follow shortly.
    state_file = open(self.control + '.state', 'wb')
    try:
        pickle.dump(self.steps, state_file)
    finally:
        state_file.close()
435
436
def step_engine(self):
    """the stepping engine -- if the control file defines
    step_init we will be using this engine to drive multiple runs.

    The control file is executed in a namespace that holds this job
    as 'job' plus everything exported by error and autotest_utils.
    Queued steps are then run one at a time, with the remaining
    list saved to <control>.state before each step is started.
    """
    lcl = dict({'job': self})

    preamble = "\nfrom error import *\nfrom autotest_utils import *\n"
    exec(preamble, lcl, lcl)
    # NOTE: the control file is run as ordinary Python code with full
    # access to this process; it must come from a trusted source.
    execfile(self.control, lcl, lcl)

    state = self.control + '.state'
    # If there is a mid-job state file load that in and continue
    # where it indicates.  Otherwise start stepping at the passed
    # entry.
    try:
        state_file = open(state, 'rb')
        try:
            self.steps = pickle.load(state_file)
        finally:
            state_file.close()
    except Exception:
        # no (readable) state file: this is the start of the job
        if 'step_init' in lcl:
            self.next_step([lcl['step_init']])

    # Run the step list.
    while len(self.steps) > 0:
        step = self.steps.pop(0)
        # Save what is left before running the step, so a reboot
        # inside the step resumes with the following one.
        state_file = open(state, 'wb')
        try:
            pickle.dump(self.steps, state_file)
        finally:
            state_file.close()

        cmd = step.pop(0)
        lcl['__args'] = step
        exec(cmd + "(*__args)", lcl, lcl)
apw0865f482006-03-30 18:50:19 +0000469
mblighcaa605c2006-10-02 00:37:35 +0000470
mbligh09f288a2007-09-18 21:34:57 +0000471 def record(self, status_code, subdir, operation, status = ''):
472 """
473 Record job-level status
apw7db8d0b2006-10-09 08:10:25 +0000474
mbligh09f288a2007-09-18 21:34:57 +0000475 The intent is to make this file both machine parseable and
476 human readable. That involves a little more complexity, but
477 really isn't all that bad ;-)
478
479 Format is <status code>\t<subdir>\t<operation>\t<status>
480
481 status code: (GOOD|WARN|FAIL|ABORT)
482 or START
483 or END (GOOD|WARN|FAIL|ABORT)
484
485 subdir: MUST be a relevant subdirectory in the results,
486 or None, which will be represented as '----'
487
488 operation: description of what you ran (e.g. "dbench", or
489 "mkfs -t foobar /dev/sda9")
490
491 status: error message or "completed sucessfully"
492
493 ------------------------------------------------------------
494
495 Initial tabs indicate indent levels for grouping, and is
mbligh7dd510c2007-11-13 17:11:22 +0000496 governed by self.group_level
mbligh09f288a2007-09-18 21:34:57 +0000497
498 multiline messages have secondary lines prefaced by a double
499 space (' ')
500 """
501
mblighb0570ad2007-09-19 18:18:11 +0000502 if subdir:
503 if re.match(r'[\n\t]', subdir):
504 raise "Invalid character in subdir string"
505 substr = subdir
506 else:
507 substr = '----'
mbligh09f288a2007-09-18 21:34:57 +0000508
509 if not re.match(r'(START|(END )?(GOOD|WARN|FAIL|ABORT))$', \
510 status_code):
511 raise "Invalid status code supplied: %s" % status_code
mbligh9c5ac322007-10-31 18:01:59 +0000512 if not operation:
513 operation = '----'
mbligh09f288a2007-09-18 21:34:57 +0000514 if re.match(r'[\n\t]', operation):
515 raise "Invalid character in operation string"
516 operation = operation.rstrip()
517 status = status.rstrip()
518 status = re.sub(r"\t", " ", status)
apw7db8d0b2006-10-09 08:10:25 +0000519 # Ensure any continuation lines are marked so we can
520 # detect them in the status file to ensure it is parsable.
mbligh7dd510c2007-11-13 17:11:22 +0000521 status = re.sub(r"\n", "\n" + "\t" * self.group_level + " ", status)
mbligh09f288a2007-09-18 21:34:57 +0000522
mbligh30270302007-11-05 20:33:52 +0000523 # Generate timestamps for inclusion in the logs
524 epoch_time = int(time.time()) # seconds since epoch, in UTC
525 local_time = time.localtime(epoch_time)
526 epoch_time_str = "timestamp=%d" % (epoch_time,)
527 local_time_str = time.strftime("localtime=%b %d %H:%M:%S",
528 local_time)
529
530 msg = '\t'.join(str(x) for x in (status_code, substr, operation,
531 epoch_time_str, local_time_str,
532 status))
mbligh7dd510c2007-11-13 17:11:22 +0000533 msg = '\t' * self.group_level + msg
apw7db8d0b2006-10-09 08:10:25 +0000534
apw4b2e4fb2007-09-25 16:52:30 +0000535 self.harness.test_status_detail(status_code, substr,
536 operation, status)
apwde1503a2006-10-10 08:34:21 +0000537 self.harness.test_status(msg)
apwf1a81162006-04-25 10:10:29 +0000538 print msg
mbligh09f288a2007-09-18 21:34:57 +0000539 status_file = os.path.join(self.resultdir, 'status')
mbligh7dd510c2007-11-13 17:11:22 +0000540 open(status_file, "a").write(msg + "\n")
mblighb0570ad2007-09-19 18:18:11 +0000541 if subdir:
542 status_file = os.path.join(self.resultdir, subdir, 'status')
543 open(status_file, "a").write(msg + "\n")
apwce9abe92006-04-27 14:14:04 +0000544
545
def runjob(control, cont = False, tag = "default", harness_type = ''):
    """The main interface to this module

    control
        The control file to use for this job.
    cont
        Whether this is the continuation of a previously started job
    tag
        The job tag string, passed to the job object
    harness_type
        An alternative server harness, passed to the job object

    This function does not return: the process exits with status
    0 when the job completed, 5 when the job paused and expects to
    be continued (JobContinue), and 1 on any error or when asked to
    continue a job that has no state file left.
    """
    control = os.path.abspath(control)
    state = control + '.state'

    # instantiate the job object ready for the control file.
    myjob = None
    try:
        # Check that the control file is valid
        if not os.path.exists(control):
            raise JobError(control + ": control file not found")

        # When continuing, the job is complete when there is no
        # state file, ensure we don't try and continue.
        nothing_to_continue = cont and not os.path.exists(state)
        if not nothing_to_continue:
            # A fresh start must not pick up a stale state file.
            if not cont and os.path.exists(state):
                os.unlink(state)

            myjob = job(control, tag, cont, harness_type)

            # Load in the users control file, may do any one of:
            #  1) execute in toto
            #  2) define steps, and select the first via next_step()
            myjob.step_engine()

    except JobContinue:
        sys.exit(5)

    except JobError:
        instance = sys.exc_info()[1]
        print("JOB ERROR: " + instance.args[0])
        if myjob:
            command = None
            if len(instance.args) > 1:
                command = instance.args[1]
            myjob.record('ABORT', None, command, instance.args[0])
            myjob.complete(1)

    except:
        print("JOB ERROR: " + format_error())
        if myjob:
            myjob.record('ABORT', None, None, format_error())
            myjob.complete(1)

    if myjob is None:
        # Either there was nothing to continue or the job object could
        # not be created (the reason has been printed above); there is
        # no job to record against, so just report failure.
        sys.exit(1)

    # If we get here, then we assume the job is complete and good.
    myjob.record('GOOD', None, None, 'job completed sucessfully')
    myjob.complete(0)