blob: 665c4ecb8f45d359478e3ff2e8f0699ea3940069 [file] [log] [blame]
mblighf1c52842007-10-16 15:21:38 +00001"""
2The main job wrapper for the server side.
3
4This is the core infrastructure. Derived from the client side job.py
5
6Copyright Martin J. Bligh, Andy Whitcroft 2007
7"""
8
9__author__ = """
10Martin J. Bligh <mbligh@google.com>
11Andy Whitcroft <apw@shadowen.org>
12"""
13
14import os, sys, re
mbligh05269362007-10-16 16:58:11 +000015import test
mblighf1c52842007-10-16 15:21:38 +000016from utils import *
mbligh05269362007-10-16 16:58:11 +000017from error import *
mblighf1c52842007-10-16 15:21:38 +000018
mbligh3f4bced2007-11-05 17:55:53 +000019# this magic incantation should give us access to a client library
20server_dir = os.path.dirname(__file__)
21client_dir = os.path.join(server_dir, "..", "client", "bin")
22sys.path.append(client_dir)
23import fd_stack
24sys.path.pop()
25
# Source text prepended to every snippet that server_job.run() exec()s.
# It rebinds sys.stderr to the `__stderr` object that run() places in the
# exec namespace, then imports the server-side names that the control file
# and the helper snippets below refer to (hosts, autotest, parallel_simple
# via `from subcommand import *` -- presumably; confirm in subcommand.py).
preamble = """\
import os, sys
sys.stderr = __stderr

import errors, hosts, autotest, kvm
import source_kernel, rpm_kernel, deb_kernel
from subcommand import *
from utils import run, get_tmp_dir, sh_escape

"""
36
# Server-side control text used when the job was given a client-side control
# file. server_job.run() writes it to 'control.srv' and exec()s it (after
# `preamble`) with `control` (the client control text) and `machines` present
# in the exec namespace. It runs the client control on each machine over SSH,
# in parallel when there is more than one machine.
client_wrapper = """
at = autotest.Autotest()

def run_client(machine):
    host = hosts.SSHHost(machine)
    at.run(control, host=host)

if len(machines) > 1:
    parallel_simple(run_client, machines)
else:
    run_client(machines[0])
"""
49
# Snippet that calls host.get_crashdumps(test_start_time) on every machine.
# It expects `machines` and `test_start_time` in the exec namespace.
# NOTE(review): nothing in the visible part of this file exec()s this snippet
# or sets `test_start_time`; confirm where both happen before relying on it.
crashdumps = """
def crashdumps(machine):
    host = hosts.SSHHost(machine, initialize=False)
    host.get_crashdumps(test_start_time)

parallel_simple(crashdumps, machines, log=False)
"""
57
# Snippet that reboots every machine. server_job.run() exec()s it (after
# `preamble`) from its `finally` clause when called with reboot=True and a
# non-empty machine list; `machines` comes from the exec namespace.
cleanup="""\
def cleanup(machine):
    host = hosts.SSHHost(machine, initialize=False)
    host.reboot()

parallel_simple(cleanup, machines, log=False)
"""
65
# Snippet that calls host.machine_install() on every machine. server_job.run()
# exec()s it (after `preamble`) before the control file when
# install_before=True and again afterwards when install_after=True;
# `machines` comes from the exec namespace.
#
# The dispatch line must name install(): it previously passed cleanup(), which
# rebooted the machines instead of installing them (or raised NameError when
# the cleanup snippet had not been exec()d into the namespace yet).
install="""\
def install(machine):
    host = hosts.SSHHost(machine, initialize=False)
    host.machine_install()

parallel_simple(install, machines, log=False)
"""
73
class server_job:
    """The actual job against which we do everything.

    Properties:
        autodir
            The top level autotest directory (/usr/local/autotest).
        serverdir
            <autodir>/server/
        clientdir
            <autodir>/client/
        conmuxdir
            <autodir>/conmux/
        testdir
            <autodir>/server/tests/
        tmpdir
            <autodir>/server/tmp/
        control
            the text of the control file for this job
        resultdir
            directory that receives the results and status files
        status
            <resultdir>/status
        record_prefix
            tabs prepended to each line record() writes to the
            job-level status file (one per enclosing run_group)
    """

    def __init__(self, control, args, resultdir, label, user, client=False):
        """
            control
                The control file (pathname of)
            args
                args to pass to the control file
            resultdir
                where to throw the results
            label
                label for the job
            user
                Username for the job (email address)
            client
                True if a client-side control file

        Creates resultdir if it does not exist, removes any stale
        <resultdir>/status file and writes the label/user keyvals.
        """
        path = os.path.dirname(sys.modules['server_job'].__file__)
        self.autodir = os.path.abspath(os.path.join(path, '..'))
        self.serverdir = os.path.join(self.autodir, 'server')
        self.testdir = os.path.join(self.serverdir, 'tests')
        self.tmpdir = os.path.join(self.serverdir, 'tmp')
        self.conmuxdir = os.path.join(self.autodir, 'conmux')
        self.clientdir = os.path.join(self.autodir, 'client')

        # Read the control file, closing the handle explicitly, and
        # normalise CRLF line endings to LF.
        control_file = open(control, 'r')
        try:
            control_text = control_file.read()
        finally:
            control_file.close()
        self.control = control_text.replace('\r\n', '\n')

        self.resultdir = resultdir
        if not os.path.exists(resultdir):
            os.mkdir(resultdir)
        self.status = os.path.join(resultdir, 'status')
        self.label = label
        self.user = user
        self.args = args
        self.client = client
        self.record_prefix = ''

        self.stdout = fd_stack.fd_stack(1, sys.stdout)
        self.stderr = fd_stack.fd_stack(2, sys.stderr)

        # Start from a clean status file for this job.
        if os.path.exists(self.status):
            os.unlink(self.status)
        job_data = {'label': label, 'user': user}
        write_keyval(self.resultdir, job_data)


    def _write_file(self, path, data, mode='w'):
        """Write data to path (opened with mode), always closing the file."""
        handle = open(path, mode)
        try:
            handle.write(data)
        finally:
            handle.close()


    def run(self, machines, reboot = False, install_before = False,
            install_after = False, namespace = {}):
        """Execute the job's control file.

            machines
                list of machine names, exposed to the control
                file as 'machines'
            reboot
                if true, exec the cleanup snippet afterwards
            install_before
                if true, exec the install snippet first
            install_after
                if true, exec the install snippet afterwards
            namespace
                extra names to expose to the control file; it is
                copied, so the caller's dictionary is not modified

        The reboot / install_after steps run from a finally clause, so
        they happen even when the control file raises. All three
        optional steps are skipped when machines is empty.
        """
        # use a copy so changes don't affect the original dictionary
        namespace = namespace.copy()

        namespace['machines'] = machines
        namespace['args'] = self.args
        namespace['job'] = self

        # NOTE(review): the paths built from self.resultdir below are
        # only right after this chdir if resultdir is absolute -- confirm
        # against the caller.
        os.chdir(self.resultdir)

        status_log = os.path.join(self.resultdir, 'status.log')
        # Opened unbuffered and deliberately left open: the preamble
        # rebinds sys.stderr to this object and nothing restores it.
        namespace['__stderr'] = open(status_log, 'a', 0)
        try:
            if install_before and machines:
                exec(preamble + install, namespace, namespace)
            if self.client:
                # Client-side control file: keep a copy of it and drive
                # it through the generic client wrapper.
                namespace['control'] = self.control
                self._write_file('control', self.control)
                self._write_file('control.srv', client_wrapper)
                server_control = client_wrapper
            else:
                self._write_file('control.srv', self.control)
                server_control = self.control
            exec(preamble + server_control, namespace, namespace)

        finally:
            if reboot and machines:
                exec(preamble + cleanup, namespace, namespace)
            if install_after and machines:
                exec(preamble + install, namespace, namespace)


    def run_test(self, url, *args, **dargs):
        """Summon a test object and run it.

            tag
                tag to add to testname (keyword argument; removed
                from dargs before the test is run)
            url
                url of the test to run

        Records GOOD on success. Any Exception raised by the test is
        recorded as FAIL and not re-raised.
        """
        (_group, testname) = test.testname(url)
        tag = dargs.pop('tag', None)
        subdir = testname
        if tag:
            subdir += '.' + tag

        try:
            test.runtest(self, url, tag, args, dargs)
            self.record('GOOD', subdir, testname, 'completed successfully')
        except Exception:
            self.record('FAIL', subdir, testname, format_error())


    def run_group(self, function, *args, **dargs):
        """\
            function:
                subroutine to run
            *args:
                arguments for the function
            tag:
                optional keyword argument; when true it replaces
                the function's name in the status records

        Writes START / END GOOD records around the call and indents
        everything recorded in between by one tab. Returns the
        function's result.

        If the function raises, END FAIL is recorded, the exception is
        swallowed and None is returned. The outer handlers are only
        reached when recording the END FAIL line itself fails.
        """
        result = None
        name = function.__name__

        # Allow the tag for the group to be specified.
        tag = dargs.pop('tag', None)
        if tag:
            name = tag

        old_record_prefix = self.record_prefix
        try:
            try:
                self.record('START', None, name)
                self.record_prefix += '\t'
                result = function(*args, **dargs)
                self.record_prefix = old_record_prefix
                self.record('END GOOD', None, name)
            except:
                self.record_prefix = old_record_prefix
                self.record('END FAIL', None, name, format_error())
        # We don't want to raise up an error higher if it's just
        # a TestError - we want to carry on to other tests. Hence
        # this outer try/except block.
        except TestError:
            pass
        except:
            raise TestError(name + ' failed\n' + format_error())

        return result


    def record(self, status_code, subdir, operation, status = ''):
        """
        Record job-level status

        The intent is to make this file both machine parseable and
        human readable. That involves a little more complexity, but
        really isn't all that bad ;-)

        Format is <status code>\t<subdir>\t<operation>\t<status>

        status code: (GOOD|WARN|FAIL|ABORT)
                or   START
                or   END (GOOD|WARN|FAIL|ABORT)

        subdir: MUST be a relevant subdirectory in the results,
        or None, which will be represented as '----'

        operation: description of what you ran (e.g. "dbench", or
                                        "mkfs -t foobar /dev/sda9")

        status: error message or "completed successfully"

        ------------------------------------------------------------

        Initial tabs indicate indent levels for grouping, and is
        governed by self.record_prefix

        multiline messages have secondary lines prefaced by a double
        space ('  ')

        The line is written to stdout, appended (with the indent
        prefix) to <resultdir>/status and, when subdir is given,
        appended (without the prefix) to <resultdir>/<subdir>/status.

        Raises ValueError if status_code is not one of the codes above
        or if subdir / operation contain a tab or newline, since either
        would break the tab-separated format.
        """
        if subdir:
            # search, not match: the character is invalid anywhere in
            # the field, not just at its start.
            if re.search(r'[\n\t]', subdir):
                raise ValueError("Invalid character in subdir string")
            substr = subdir
        else:
            substr = '----'

        # \Z rather than $ so a trailing newline is rejected as well.
        if not re.match(r'(START|(END )?(GOOD|WARN|FAIL|ABORT))\Z',
                        status_code):
            raise ValueError("Invalid status code supplied: %s"
                             % status_code)

        # Trailing whitespace is dropped before validation so that a
        # stray trailing newline is still tolerated.
        operation = operation.rstrip()
        if re.search(r'[\n\t]', operation):
            raise ValueError("Invalid character in operation string")

        status = status.rstrip()
        status = status.replace("\t", "  ")
        # Ensure any continuation lines are marked so we can
        # detect them in the status file to ensure it is parsable.
        status = status.replace("\n", "\n" + self.record_prefix + "  ")

        msg = '%s\t%s\t%s\t%s' % (status_code, substr, operation, status)

        sys.stdout.write(msg + "\n")
        status_file = os.path.join(self.resultdir, 'status')
        self._write_file(status_file, self.record_prefix + msg + "\n", "a")
        if subdir:
            status_file = os.path.join(self.resultdir, subdir, 'status')
            self._write_file(status_file, msg + "\n", "a")