blob: 506cc15b5c3c3f2060e2a77bb410828e8c31f0b6 [file] [log] [blame]
#
# Copyright 2008 Google Inc. All Rights Reserved.

"""
The job module contains the objects and methods used to
manage jobs in Autotest.

The valid actions are:
list: lists job(s)
create: create a job
abort: abort job(s)
stat: detailed listing of job(s)

The common options are:

See topic_common.py for a High Level Design and Algorithm.
"""
18
19import getpass, os, pwd, re, socket, sys
20from autotest_lib.cli import topic_common, action_common
21
22
class job(topic_common.atest):
    """Common base for every 'atest job' action.

    Usage: atest job [create|list|stat|abort] <options>
    """
    # These attributes are presumably consumed by topic_common.atest (not
    # visible in this file) to build usage and result messages.
    usage_action = '[create|list|stat|abort]'
    topic = msg_topic = 'job'
    msg_items = '<job_ids>'


    def _convert_status(self, results):
        """Turn each result's 'status_counts' mapping into a display string.

        Every dictionary in results is modified in place: its
        'status_counts' value (a mapping of status name to count) is
        replaced by a comma separated, alphabetically sorted string of
        'status=count(percent%)' items.

        @param results: iterable of dictionaries that each have a
                'status_counts' mapping.
        """
        for result in results:
            counts = result['status_counts']
            total = sum(counts.values())
            status = []
            for key, val in counts.items():
                # A mapping whose counts are all zero would otherwise
                # divide by zero; report 0.0% in that case.
                if total:
                    percent = 100.0 * float(val) / total
                else:
                    percent = 0.0
                status.append('%s=%s(%.1f%%)' % (key, val, percent))
            status.sort()
            result['status_counts'] = ', '.join(status)
38
39
class job_help(job):
    """Placeholder action that only exists so the atest logic works.

    It adds nothing of its own; the usage is set by its parent class.
    """
44
45
class job_list_stat(action_common.atest_list, job):
    """Shared behaviour of the 'list' and 'stat' job actions.

    Jobs given by the user may be numeric ids or names; this class runs
    the requested RPC once per kind and merges the answers.
    """

    def __split_jobs_between_ids_names(self):
        """Partition self.jobs into numeric ids and names.

        @returns A (job_ids, job_names) tuple of lists; an entry is an id
                when it consists only of digits, a name otherwise.
        """
        job_ids = []
        job_names = []

        # Sort between job IDs and names
        for job_id in self.jobs:
            if job_id.isdigit():
                job_ids.append(job_id)
            else:
                job_names.append(job_id)
        return (job_ids, job_names)


    def execute_on_ids_and_names(self, op, filters=None, check_results=None,
                                 tag_id='id__in', tag_name='name__in'):
        """Run op for the requested jobs, querying ids and names separately.

        @param op: name of the operation handed to the superclass execute().
        @param filters: base filters applied to every query.  Defaults to
                no filters.  The mapping is copied before a tag is added,
                so the caller's dictionary is never modified here.
        @param check_results: passed through to the superclass execute()
                for the id and name queries.  Defaults to
                {'id__in': 'id', 'name__in': 'id'}.
        @param tag_id: filter key used for the numeric job ids.
        @param tag_name: filter key used for the job names.

        @returns The superclass result when no job was requested,
                otherwise the concatenated list of both queries' results.
        """
        # None stands in for the former mutable default arguments so that
        # no dictionary is shared between calls.
        if filters is None:
            filters = {}
        if check_results is None:
            check_results = {'id__in': 'id',
                             'name__in': 'id'}

        if not self.jobs:
            # Want everything
            return super(job_list_stat, self).execute(op=op, filters=filters)

        all_jobs = []
        (job_ids, job_names) = self.__split_jobs_between_ids_names()

        for items, tag in [(job_ids, tag_id),
                           (job_names, tag_name)]:
            if items:
                new_filters = filters.copy()
                new_filters[tag] = items
                jobs = super(job_list_stat,
                             self).execute(op=op,
                                           filters=new_filters,
                                           check_results=check_results)
                all_jobs.extend(jobs)

        return all_jobs
83
84
class job_list(job_list_stat):
    """atest job list [<jobs>] [--all] [--running] [--user <username>]"""
    def __init__(self):
        """Register the options that are specific to 'job list'."""
        super(job_list, self).__init__()
        add_option = self.parser.add_option
        add_option('-a', '--all', action='store_true', default=False,
                   help='List jobs for all users.')
        add_option('-r', '--running', action='store_true',
                   help='List only running jobs')
        add_option('-u', '--user', type='string',
                   help='List jobs for given user')


    def parse(self):
        """Parse the command line and build the query filters.

        The 'running' filter always mirrors --running.  The 'owner'
        filter is the --user value when given (which is rejected together
        with --all); otherwise it is the current user unless --all or
        explicit jobs were supplied.

        @returns The (options, leftover) tuple from parse_with_flist().
        """
        job_flist = [('jobs', '', '', True)]
        (options, leftover) = self.parse_with_flist(job_flist, None)
        self.all = options.all
        self.data['running'] = options.running

        if not options.user:
            # No explicit user: restrict to the caller's own jobs unless
            # everything, or specific jobs, were asked for.
            if not (options.all or self.jobs):
                self.data['owner'] = getpass.getuser()
        elif options.all:
            self.invalid_syntax('Only specify --all or --user, not both.')
        else:
            self.data['owner'] = options.user

        return (options, leftover)


    def execute(self):
        """Fetch the job summaries that match the parsed filters."""
        return self.execute_on_ids_and_names(filters=self.data,
                                             op='get_jobs_summary')


    def output(self, results):
        """Print the jobs; verbose mode shows three more columns."""
        keys = ['id', 'owner', 'name', 'status_counts']
        if self.verbose:
            keys += ['priority', 'control_type', 'created_on']
        # The status counts are printed as one formatted string.
        self._convert_status(results)
        super(job_list, self).output(results, keys)
124
125
126
class job_stat(job_list_stat):
    """atest job stat <job>"""
    usage_action = 'stat'

    def __init__(self):
        """Register the option that is specific to 'job stat'."""
        super(job_stat, self).__init__()
        self.parser.add_option('-f', '--control-file',
                               action='store_true', default=False,
                               help='Display the control file')


    def parse(self):
        """Parse the command line; at least one job must be named.

        @returns The (options, leftover) tuple from parse_with_flist().
        """
        job_flist = [('jobs', '', '', True)]
        (options, leftover) = self.parse_with_flist(flists=job_flist,
                                                    req_items='jobs')
        if not self.jobs:
            self.invalid_syntax('Must specify at least one job.')

        self.show_control_file = options.control_file

        return (options, leftover)


    def _merge_results(self, summary, qes):
        """Add a 'hosts_status' string to every job of the summary.

        @param summary: list of job dictionaries, each with an 'id' key.
        @param qes: host queue entries; each has 'host', 'job' and
                'status' keys.  Entries without a host are ignored.

        @returns summary, whose entries now carry a 'hosts_status' value
                of the form 'status=host1,host2, status2=host3', or ''
                for a job that has no entry with a host.
        """
        # job id -> status -> hostnames, in queue entry order
        hosts_by_job = {}
        for entry in qes:
            if not entry['host']:
                continue
            entry_job_id = entry['job']['id']
            hostname = entry['host']['hostname']
            by_status = hosts_by_job.setdefault(entry_job_id, {})
            by_status.setdefault(entry['status'], []).append(hostname)

        for job_info in summary:
            by_status = hosts_by_job.get(job_info['id'])
            if by_status is None:
                job_info['hosts_status'] = ''
                continue
            host_per_status = ['%s=%s' % (status, ','.join(hostnames))
                               for status, hostnames in by_status.items()]
            job_info['hosts_status'] = ', '.join(host_per_status)
        return summary


    def execute(self):
        """Fetch the job summaries and attach the per status hostnames."""
        summary = self.execute_on_ids_and_names(op='get_jobs_summary')

        # Get the real hostnames
        queue_entries = self.execute_on_ids_and_names(
                op='get_host_queue_entries',
                check_results={},
                tag_id='job__in',
                tag_name='job__name__in')

        self._convert_status(summary)

        return self._merge_results(summary, queue_entries)


    def output(self, results):
        """Print the jobs; verbose and --control-file add more columns."""
        keys = ['id', 'name', 'priority', 'status_counts', 'hosts_status']
        if self.verbose:
            keys.extend(['owner', 'control_type', 'synch_count',
                         'created_on', 'run_verify', 'reboot_before',
                         'reboot_after'])

        if self.show_control_file:
            keys.append('control_file')

        super(job_stat, self).output(results, keys)
198
199
class job_create(action_common.atest_create, job):
    """atest job create [--priority <low|medium|high|urgent>]
    [--synch_count] [--control-file </path/to/cfile>]
    [--server] [--test <test1,test2>] [--kernel <http://kernel>]
    [--mlist </path/to/machinelist>] [--machine <host1 host2 host3>]
    [--labels <list of labels of machines to run on>]
    [--reboot_before <option>] [--reboot_after <option>]
    [--noverify] [--timeout <timeout>] [--one-time-hosts <hosts>]
    [--email <email>] [--dependencies <labels this job is dependent on>]
    [--atomic_group <atomic group name>]
    [--clone <job_id>] [--reuse-hosts]
    job_name

    Creating a job is rather different from the other create operations,
    so it only uses the __init__() and output() from its superclass.
    """
    op_action = 'create'
    msg_items = 'job_name'

    def __init__(self):
        """Register every option understood by 'job create'."""
        super(job_create, self).__init__()
        self.hosts = []
        # Keyword arguments for the generate_control_file RPC; filled by
        # parse() and left empty when the control file is used verbatim.
        self.ctrl_file_data = {}
        self.data_item_key = 'name'
        self.parser.add_option('-p', '--priority', help='Job priority (low, '
                               'medium, high, urgent), default=medium',
                               type='choice', choices=('low', 'medium', 'high',
                               'urgent'), default='medium')
        self.parser.add_option('-y', '--synch_count', type=int,
                               help='Number of machines to use per autoserv '
                                    'execution')
        self.parser.add_option('-f', '--control-file',
                               help='use this control file', metavar='FILE')
        self.parser.add_option('-s', '--server',
                               help='This is server-side job',
                               action='store_true', default=False)
        self.parser.add_option('-t', '--test',
                               help='List of tests to run')
        self.parser.add_option('-k', '--kernel', help='Install kernel from this'
                               ' URL before beginning job')
        self.parser.add_option('-d', '--dependencies', help='Comma separated '
                               'list of labels this job is dependent on.',
                               default='')
        self.parser.add_option('-b', '--labels', help='Comma separated list of '
                               'labels to get machine list from.', default='')
        self.parser.add_option('-G', '--atomic_group', help='Name of an Atomic '
                               'Group to schedule this job on.',
                               default='')
        self.parser.add_option('-m', '--machine', help='List of machines to '
                               'run on')
        self.parser.add_option('-M', '--mlist',
                               help='File listing machines to use',
                               type='string', metavar='MACHINE_FLIST')
        self.parser.add_option('--one-time-hosts',
                               help='List of one time hosts')
        self.parser.add_option('-e', '--email', help='A comma seperated list '
                               'of email addresses to notify of job completion',
                               default='')
        self.parser.add_option('-B', '--reboot_before',
                               help='Whether or not to reboot the machine '
                                    'before the job (never/if dirty/always)',
                               type='choice',
                               choices=('never', 'if dirty', 'always'))
        self.parser.add_option('-a', '--reboot_after',
                               help='Whether or not to reboot the machine '
                                    'after the job (never/if all tests passed/'
                                    'always)',
                               type='choice',
                               choices=('never', 'if all tests passed',
                                        'always'))
        self.parser.add_option('-l', '--clone', help='Clone an existing job. '
                               'This will discard all other options except '
                               '--reuse-hosts.', default=False,
                               metavar='JOB_ID')
        self.parser.add_option('-r', '--reuse-hosts', help='Use the exact same '
                               'hosts as cloned job. Only for use with '
                               '--clone.', action='store_true', default=False)
        self.parser.add_option('-n', '--noverify',
                               help='Do not run verify for job',
                               default=False, action='store_true')
        self.parser.add_option('-o', '--timeout', help='Job timeout in hours.',
                               metavar='TIMEOUT')


    @staticmethod
    def _split_csv(text):
        """Return the non-empty, stripped items of a comma separated string."""
        return [item.strip() for item in text.split(',') if item.strip()]


    def parse(self):
        """Parse the command line into the create_job arguments (self.data).

        When --clone is given only the job name, the clone id and the
        --reuse-hosts flag are recorded; everything else is taken from the
        cloned job in execute().  Otherwise the options are validated and
        self.data and self.ctrl_file_data are filled in.

        @returns The (options, leftover) tuple from parse_with_flist().
        """
        flists = [('hosts', 'mlist', 'machine', False),
                  ('jobname', '', '', True)]
        (options, leftover) = self.parse_with_flist(flists,
                                                    req_items='jobname')
        self.data = {}
        if len(self.jobname) > 1:
            self.invalid_syntax('Too many arguments specified, only expected '
                                'to receive job name: %s' % self.jobname)
        self.jobname = self.jobname[0]

        if options.reuse_hosts and not options.clone:
            self.invalid_syntax('--reuse-hosts only to be used with --clone.')
        # If cloning skip parse, parsing is done in execute
        self.clone_id = options.clone
        if options.clone:
            self.op_action = 'clone'
            self.msg_items = 'jobid'
            self.reuse_hosts = options.reuse_hosts
            return (options, leftover)

        if (not self.hosts and not options.one_time_hosts
            and not options.labels and not options.atomic_group):
            self.invalid_syntax('Must specify at least one machine '
                                'or an atomic group '
                                '(-m, -M, -b, -G or --one-time-hosts).')
        if not options.control_file and not options.test:
            self.invalid_syntax('Must specify either --test or --control-file'
                                ' to create a job.')
        if options.control_file and options.test:
            self.invalid_syntax('Can only specify one of --control-file or '
                                '--test, not both.')
        if options.kernel:
            self.ctrl_file_data['kernel'] = options.kernel
            self.ctrl_file_data['do_push_packages'] = True
        if options.control_file:
            # NOTE(review): generic_error() is assumed to terminate the
            # command; if it returned, control_file_data would be unbound
            # below.
            try:
                control_file_f = open(options.control_file)
                try:
                    control_file_data = control_file_f.read()
                finally:
                    control_file_f.close()
            except IOError:
                self.generic_error('Unable to read from specified '
                                   'control-file: %s' % options.control_file)
            if options.kernel:
                if options.server:
                    self.invalid_syntax(
                            'A control file and a kernel may only be specified'
                            ' together on client side jobs.')
                # execute() will pass this to the AFE server to wrap this
                # control file up to include the kernel installation steps.
                self.ctrl_file_data['client_control_file'] = control_file_data
            else:
                self.data['control_file'] = control_file_data
        if options.test:
            if options.server:
                self.invalid_syntax('If you specify tests, then the '
                                    'client/server setting is implicit and '
                                    'cannot be overriden.')
            self.ctrl_file_data['tests'] = self._split_csv(options.test)

        if options.priority:
            self.data['priority'] = options.priority.capitalize()
        if options.reboot_before:
            self.data['reboot_before'] = options.reboot_before.capitalize()
        if options.reboot_after:
            self.data['reboot_after'] = options.reboot_after.capitalize()
        if options.noverify:
            self.data['run_verify'] = False
        if options.timeout:
            self.data['timeout'] = options.timeout

        if options.one_time_hosts:
            one_time_hosts = self._file_list(options, opt_list='one_time_hosts')
            self.data['one_time_hosts'] = one_time_hosts
        if options.labels:
            # Every host returned for the given labels is added to the
            # explicit host list.
            label_hosts = self.execute_rpc(
                    op='get_hosts',
                    multiple_labels=self._split_csv(options.labels))
            for host in label_hosts:
                self.hosts.append(host['hostname'])

        self.data['name'] = self.jobname

        (self.data['hosts'],
         self.data['meta_hosts']) = self.parse_hosts(self.hosts)

        if options.atomic_group:
            self.data['atomic_group_name'] = options.atomic_group

        self.data['dependencies'] = self._split_csv(options.dependencies)

        self.data['email_list'] = options.email
        if options.synch_count:
            self.data['synch_count'] = options.synch_count
        if options.server:
            self.data['control_type'] = 'Server'
        else:
            self.data['control_type'] = 'Client'

        return (options, leftover)


    def execute(self):
        """Create the job, generating or cloning its definition first.

        When parse() collected control file data, the control file is
        generated through the generate_control_file RPC.  When a clone id
        was given, the job description is rebuilt from the
        get_info_for_clone RPC.  The job is then created with create_job.

        @returns A one element list: '<job name> (id <job id>)'.
        """
        if self.ctrl_file_data:
            uploading_kernel = 'kernel' in self.ctrl_file_data
            if uploading_kernel:
                # Use the upload timeout for this RPC only; the previous
                # default is restored in the finally clause.
                default_timeout = socket.getdefaulttimeout()
                socket.setdefaulttimeout(topic_common.UPLOAD_SOCKET_TIMEOUT)
                sys.stdout.write('Uploading Kernel: this may take a while...')
                sys.stdout.flush()
            try:
                cf_info = self.execute_rpc(op='generate_control_file',
                                           item=self.jobname,
                                           **self.ctrl_file_data)
            finally:
                if uploading_kernel:
                    socket.setdefaulttimeout(default_timeout)

            if uploading_kernel:
                # Completes the progress line started above.
                print(' Done')
            self.data['control_file'] = cf_info['control_file']
            if 'synch_count' not in self.data:
                self.data['synch_count'] = cf_info['synch_count']
            if cf_info['is_server']:
                self.data['control_type'] = 'Server'
            else:
                self.data['control_type'] = 'Client'

            # Get the union of the 2 sets of dependencies
            deps = set(self.data['dependencies'])
            self.data['dependencies'] = sorted(
                    deps.union(cf_info['dependencies']))

        if 'synch_count' not in self.data:
            self.data['synch_count'] = 1

        if self.clone_id:
            clone_info = self.execute_rpc(op='get_info_for_clone',
                                          id=self.clone_id,
                                          preserve_metahosts=self.reuse_hosts)

            # Fields from clone data that cannot be reused
            unused_fields = ('name', 'created_on', 'id', 'owner')

            # Keyword args cannot be unicode strings.  A new dictionary is
            # built rather than deleting and re-adding keys of the one
            # being iterated, which could skip or revisit keys.
            self.data = dict([(str(key), val)
                              for key, val in clone_info['job'].items()
                              if key not in unused_fields])

            # Convert host list from clone info that can be used for job_create
            host_list = []
            if clone_info['meta_host_counts']:
                # Creates a dictionary of meta_hosts, e.g.
                # {u'label1': 3, u'label2': 2, u'label3': 5}
                meta_hosts = clone_info['meta_host_counts']
                # Create a list of formatted metahosts, e.g.
                # [u'3*label1', u'2*label2', u'5*label3']
                meta_host_list = ['%s*%s' % (str(val), key) for key, val in
                                  meta_hosts.items()]
                host_list.extend(meta_host_list)
            if clone_info['hosts']:
                # Creates a list of hosts, e.g. [u'host1', u'host2']
                hosts = [host['hostname'] for host in clone_info['hosts']]
                host_list.extend(hosts)

            (self.data['hosts'],
             self.data['meta_hosts']) = self.parse_hosts(host_list)
            self.data['name'] = self.jobname

        job_id = self.execute_rpc(op='create_job', **self.data)
        return ['%s (id %s)' % (self.jobname, job_id)]


    def get_items(self):
        """Return the job name as a one element list."""
        return [self.jobname]
468
469
class job_abort(job, action_common.atest_delete):
    """atest job abort <job(s)>"""
    usage_action = op_action = 'abort'
    msg_done = 'Aborted'

    def parse(self):
        """Parse the command line; the job ids to abort are required.

        @returns The (options, leftover) tuple from parse_with_flist(),
                like the parse() methods of the other job actions.
        """
        (options, leftover) = self.parse_with_flist([('jobids', '', '', True)],
                                                    req_items='jobids')
        return (options, leftover)


    def execute(self):
        """Abort the host queue entries of the requested jobs.

        Issues the abort_host_queue_entries RPC filtered on the job ids
        and prints the ids that were submitted.  Nothing is returned.
        """
        data = {'job__id__in': self.jobids}
        self.execute_rpc(op='abort_host_queue_entries', **data)
        print('Aborting jobs: %s' % ', '.join(self.jobids))


    def get_items(self):
        """Return the job ids this action operates on."""
        return self.jobids