blob: 4b88bacfb684a8e83999182fdeeb5903567dc18b [file] [log] [blame]
Aviv Keshet18308922013-02-19 17:49:49 -08001#pylint: disable-msg=C0111
mblighe8819cd2008-02-15 16:48:40 +00002"""\
3Utility functions for rpc_interface.py. We keep them in a separate file so that
4only RPC interface functions go into that file.
5"""
6
7__author__ = 'showard@google.com (Steve Howard)'
8
MK Ryu84573e12015-02-18 15:54:09 -08009import datetime
MK Ryufbb002c2015-06-08 14:13:16 -070010from functools import wraps
MK Ryu84573e12015-02-18 15:54:09 -080011import inspect
12import os
13import sys
showard3d6ae112009-05-02 00:45:48 +000014import django.http
Dan Shi07e09af2013-04-12 09:31:29 -070015from autotest_lib.frontend.afe import models, model_logic
Alex Miller4a193692013-08-21 13:59:01 -070016from autotest_lib.client.common_lib import control_data, error
Jiaxi Luo421608e2014-07-07 14:38:00 -070017from autotest_lib.client.common_lib import global_config, priorities
MK Ryu0c1a37d2015-04-30 12:00:55 -070018from autotest_lib.client.common_lib import time_utils
MK Ryu509516b2015-05-18 12:00:47 -070019from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Prashanth Balasubramanian8c98ac12014-12-23 11:26:44 -080020from autotest_lib.server import utils as server_utils
MK Ryu9651ca52015-06-08 17:48:22 -070021from autotest_lib.server.cros import provision
22from autotest_lib.server.cros.dynamic_suite import frontend_wrappers
mblighe8819cd2008-02-15 16:48:40 +000023
# Sentinel date values.  _prepare_data() compares against these by identity
# and serializes them as None.
NULL_DATETIME = datetime.datetime.max
NULL_DATE = datetime.date.max
26
def prepare_for_serialization(objects):
    """
    Convert Python objects into a form that can be returned via RPC.

    A non-empty list whose first element is a dict with an 'id' key is first
    reduced to one dict per id by gather_unique_dicts(); the result is then
    run through _prepare_data().

    @param objects: objects to be prepared.

    @returns The converted objects.
    """
    is_object_dict_list = (
            isinstance(objects, list) and len(objects) > 0 and
            isinstance(objects[0], dict) and 'id' in objects[0])
    if is_object_dict_list:
        return _prepare_data(gather_unique_dicts(objects))
    return _prepare_data(objects)
showardb8d34242008-04-25 18:11:16 +000036
37
def prepare_rows_as_nested_dicts(query, nested_dict_column_names):
    """
    Prepare a Django query to be returned via RPC as a sequence of nested
    dictionaries.

    @param query - A Django model query object with a select_related() method.
    @param nested_dict_column_names - A list of column/attribute names for the
            rows returned by query to expand into nested dictionaries using
            their get_object_dict() method when not None.

    @returns A list suitable to be returned in an RPC.
    """
    def _row_to_nested_dict(row):
        # Replace each requested non-None column value with the object dict
        # of the related object found on the row.
        nested = row.get_object_dict()
        for column in nested_dict_column_names:
            if nested[column] is not None:
                nested[column] = getattr(row, column).get_object_dict()
        return nested

    return prepare_for_serialization(
            [_row_to_nested_dict(row) for row in query.select_related()])
58
59
showardb8d34242008-04-25 18:11:16 +000060def _prepare_data(data):
jadmanski0afbb632008-06-06 21:10:57 +000061 """
62 Recursively process data structures, performing necessary type
63 conversions to values in data to allow for RPC serialization:
64 -convert datetimes to strings
showard2b9a88b2008-06-13 20:55:03 +000065 -convert tuples and sets to lists
jadmanski0afbb632008-06-06 21:10:57 +000066 """
67 if isinstance(data, dict):
68 new_data = {}
69 for key, value in data.iteritems():
70 new_data[key] = _prepare_data(value)
71 return new_data
showard2b9a88b2008-06-13 20:55:03 +000072 elif (isinstance(data, list) or isinstance(data, tuple) or
73 isinstance(data, set)):
jadmanski0afbb632008-06-06 21:10:57 +000074 return [_prepare_data(item) for item in data]
showard98659972008-07-17 17:00:07 +000075 elif isinstance(data, datetime.date):
showarda62866b2008-07-28 21:27:41 +000076 if data is NULL_DATETIME or data is NULL_DATE:
77 return None
jadmanski0afbb632008-06-06 21:10:57 +000078 return str(data)
79 else:
80 return data
mblighe8819cd2008-02-15 16:48:40 +000081
82
def fetchall_as_list_of_dicts(cursor):
    """
    Converts each row in the cursor to a dictionary so that values can be read
    by using the column name.

    @param cursor: The database cursor to read from.

    @returns: A list of each row in the cursor as a dictionary.
    """
    rows = cursor.fetchall()
    if not rows:
        # Nothing to convert; cursor.description is not consulted.
        return []
    # The column names are the same for every row, so build them once.
    column_names = [col[0] for col in cursor.description]
    return [dict(zip(column_names, row)) for row in rows]
93
94
def raw_http_response(response_data, content_type=None):
    """
    Wrap raw data in a Django HTTP response with a Content-length header.

    @param response_data: the body of the response.
    @param content_type: value for the response's content type, or None to
            use Django's default.

    @returns The django.http.HttpResponse object.
    """
    # HttpResponse's 'mimetype' keyword was removed in Django 1.7;
    # 'content_type' is accepted by old and new versions alike.
    response = django.http.HttpResponse(response_data,
                                        content_type=content_type)
    response['Content-length'] = str(len(response.content))
    return response
99
100
def gather_unique_dicts(dict_iterable):
    """\
    Return the object dicts from dict_iterable with duplicates (by 'id')
    dropped; the first dict seen for each id is kept, in original order.
    """
    seen_ids = set()
    unique = []
    for entry in dict_iterable:
        entry_id = entry['id']
        if entry_id in seen_ids:
            continue
        seen_ids.add(entry_id)
        unique.append(entry)
    return unique
showardb0dfb9f2008-06-06 18:08:02 +0000112
113
def extra_job_status_filters(not_yet_run=False, running=False, finished=False):
    """\
    Build the SQL WHERE clause that filters jobs by status and return it as
    a dict of keyword args for query.extra().  At most one of the flags may
    be true; with none set an empty dict is returned.
    * not_yet_run: all HQEs are Queued
    * finished: all HQEs are complete
    * running: everything else
    """
    chosen = [flag for flag in (not_yet_run, running, finished) if flag]
    assert len(chosen) <= 1, ('Cannot specify more than one '
                              'filter to this function')

    # Sub-selects naming the jobs with at least one HQE that is not Queued /
    # not complete.
    not_queued = ('(SELECT job_id FROM afe_host_queue_entries '
                  'WHERE status != "%s")'
                  % models.HostQueueEntry.Status.QUEUED)
    not_finished = ('(SELECT job_id FROM afe_host_queue_entries '
                    'WHERE not complete)')

    if not_yet_run:
        clause = 'id NOT IN ' + not_queued
    elif running:
        clause = '(id IN %s) AND (id IN %s)' % (not_queued, not_finished)
    elif finished:
        clause = 'id NOT IN ' + not_finished
    else:
        return {}
    return {'where': [clause]}
mblighe8819cd2008-02-15 16:48:40 +0000143
144
def extra_job_type_filters(extra_args, suite=False,
                           sub=False, standalone=False):
    """\
    Add a SQL WHERE clause for job type filtering to extra_args, a dict of
    keyword args to pass to query.extra(), and return that dict.

    @param extra_args: a dict of existing extra_args.  It is updated in
            place: the new clause is appended to its 'where' list.

    No more than one of the parameters should be passed as True:
    * suite: job which is parent of other jobs
    * sub: job with a parent job
    * standalone: job with no child or parent jobs
    With none set, extra_args is returned unchanged.
    """
    chosen = [flag for flag in (suite, sub, standalone) if flag]
    assert len(chosen) <= 1, ('Cannot specify more than one '
                              'filter to this function')

    where = extra_args.get('where', [])
    filter_common = ('(SELECT %s FROM afe_jobs '
                     'WHERE parent_job_id IS NOT NULL)')

    if suite:
        clause = 'id IN ' + filter_common % 'DISTINCT parent_job_id'
    elif sub:
        clause = 'id IN ' + filter_common % 'id'
    elif standalone:
        clause = ('NOT EXISTS (SELECT 1 from afe_jobs AS sub_query '
                  'WHERE parent_job_id IS NOT NULL'
                  ' AND (sub_query.parent_job_id=afe_jobs.id'
                  ' OR sub_query.id=afe_jobs.id))')
    else:
        clause = None

    if clause is not None:
        where.append(clause)
        extra_args['where'] = where
    return extra_args
183
184
185
def extra_host_filters(multiple_labels=()):
    """\
    Build the query.extra() arguments that match hosts carrying every label
    in multiple_labels: one WHERE clause per label, with the label ids as
    the matching params.
    """
    where_str = ('afe_hosts.id in (select host_id from afe_hosts_labels '
                 'where label_id=%s)')
    where_clauses = [where_str] * len(multiple_labels)
    label_ids = [models.Label.smart_get(label).id
                 for label in multiple_labels]
    return {'where': where_clauses, 'params': label_ids}
showard8e3aa5e2008-04-08 19:42:32 +0000198
199
def get_host_query(multiple_labels, exclude_only_if_needed_labels,
                   exclude_atomic_group_hosts, valid_only, filter_data):
    """
    Build a Host query restricted by labels and by filter_data.

    @param multiple_labels: labels passed to extra_host_filters(); hosts
            must match all of them.
    @param exclude_only_if_needed_labels: if true, leave out hosts carrying
            any valid label flagged only_if_needed.
    @param exclude_atomic_group_hosts: if true, leave out hosts carrying any
            valid label that belongs to an atomic group.
    @param valid_only: if true, start from Host.valid_objects rather than
            Host.objects.
    @param filter_data: filter dict handed to Host.query_objects().  It must
            not already contain 'extra_args'; that key is set here.

    @returns The resulting Host query, or an empty query if
            models.Label.DoesNotExist is raised while applying the filters.
    """
    if valid_only:
        host_manager = models.Host.valid_objects
    else:
        host_manager = models.Host.objects
    query = host_manager.all()

    if exclude_only_if_needed_labels:
        oin_labels = models.Label.valid_objects.filter(only_if_needed=True)
        if oin_labels.count() > 0:
            oin_ids = ','.join(
                    str(row['id']) for row in oin_labels.values('id'))
            oin_condition = ('afe_hosts_labels_exclude_OIN.label_id IN (%s)'
                             % oin_ids)
            query = models.Host.objects.add_join(
                    query, 'afe_hosts_labels', join_key='host_id',
                    join_condition=oin_condition,
                    suffix='_exclude_OIN', exclude=True)

    if exclude_atomic_group_hosts:
        ag_labels = models.Label.valid_objects.filter(
                atomic_group__isnull=False)
        if ag_labels.count() > 0:
            ag_ids = ','.join(
                    str(row['id']) for row in ag_labels.values('id'))
            ag_condition = ('afe_hosts_labels_exclude_AG.label_id IN (%s)'
                            % ag_ids)
            query = models.Host.objects.add_join(
                    query, 'afe_hosts_labels', join_key='host_id',
                    join_condition=ag_condition,
                    suffix='_exclude_AG', exclude=True)

    try:
        assert 'extra_args' not in filter_data
        filter_data['extra_args'] = extra_host_filters(multiple_labels)
        return models.Host.query_objects(filter_data, initial_query=query)
    except models.Label.DoesNotExist:
        return models.Host.objects.none()
showard43a3d262008-11-12 18:17:05 +0000239
240
class InconsistencyException(Exception):
    """Raised when a list of objects does not have a consistent value."""
showard8fd58242008-03-10 21:29:07 +0000243
244
def get_consistent_value(objects, field):
    """
    Return the value of attribute |field| shared by every item in objects.

    @param objects: sequence of objects to inspect.
    @param field: name of the attribute to compare.

    @returns The common value, or None when objects is empty.

    @raises InconsistencyException: when an object's value differs from the
            first object's; args are (first object, differing object).
    """
    if not objects:
        # An empty collection is trivially consistent.
        return None

    reference = objects[0]
    expected = getattr(reference, field)
    for candidate in objects:
        if getattr(candidate, field) != expected:
            raise InconsistencyException(reference, candidate)
    return expected
showard8fd58242008-03-10 21:29:07 +0000256
257
def afe_test_dict_to_test_object(test_dict):
    """
    Turn a test dictionary into a class whose attributes are the dict's
    entries, converting each value to int where int() accepts it.

    @param test_dict: dict describing a test.  Anything that is not a dict
            is returned unchanged.

    @returns A new class named 'TestObject' carrying the entries as class
            attributes, or test_dict itself if it is not a dict.
    """
    if not isinstance(test_dict, dict):
        return test_dict

    def _numerize(value):
        try:
            return int(value)
        except (ValueError, TypeError):
            return value

    attributes = dict((key, _numerize(value))
                      for key, value in test_dict.items())
    return type('TestObject', (object,), attributes)
270
271
def prepare_generate_control_file(tests, kernel, label, profilers,
                                  db_tests=True):
    """
    Resolve the inputs needed to generate a control file.

    @param tests: tests to run; looked up through models.Test.smart_get()
            when db_tests is true, otherwise converted with
            afe_test_dict_to_test_object().
    @param kernel: not used by this function.
    @param label: label to resolve through models.Label.smart_get(); left
            as is when falsy.
    @param profilers: profilers to look up through
            models.Profiler.smart_get().
    @param db_tests: whether tests refer to tests stored in the database.

    @returns A tuple (cf_info, test_objects, profiler_objects, label) where
            cf_info is a dict with keys is_server, synch_count and
            dependencies.

    @raises model_logic.ValidationError: if the tests do not all share the
            same test_type.
    """
    if db_tests:
        test_objects = [models.Test.smart_get(test) for test in tests]
    else:
        test_objects = [afe_test_dict_to_test_object(test) for test in tests]

    profiler_objects = [models.Profiler.smart_get(profiler)
                        for profiler in profilers]
    # ensure tests are all the same type
    try:
        test_type = get_consistent_value(test_objects, 'test_type')
    except InconsistencyException as exc:
        test1, test2 = exc.args
        raise model_logic.ValidationError(
            {'tests' : 'You cannot run both test_suites and server-side '
                       'tests together (tests %s and %s differ)' % (
                       test1.name, test2.name)})

    is_server = (test_type == control_data.CONTROL_TYPE.SERVER)
    if test_objects:
        synch_count = max(test.sync_count for test in test_objects)
    else:
        synch_count = 1
    if label:
        label = models.Label.smart_get(label)

    if db_tests:
        dependencies = set(label.name for label
                           in models.Label.objects.filter(test__in=test_objects))
    else:
        # set().union() copes with an empty test list, where reduce() with no
        # initial value would raise TypeError.
        dependencies = set().union(
                *[test.dependencies for test in test_objects])

    cf_info = dict(is_server=is_server, synch_count=synch_count,
                   dependencies=list(dependencies))
    return cf_info, test_objects, profiler_objects, label
showard989f25d2008-10-01 11:38:11 +0000309
310
def check_job_dependencies(host_objects, job_dependencies):
    """
    Check that a set of machines satisfies a job's dependencies.

    Dependencies for which provision.is_for_special_action() is true are
    not checked against the hosts' labels.

    @param host_objects: list of models.Host objects
    @param job_dependencies: list of names of labels

    @raises model_logic.ValidationError: if any host lacks one of the
            checked dependency labels.
    """
    host_ids = [host.id for host in host_objects]
    ok_hosts = models.Host.objects.filter(id__in=host_ids)
    for dependency in job_dependencies:
        if not provision.is_for_special_action(dependency):
            ok_hosts = ok_hosts.filter(labels__name=dependency)
    failing_hosts = (set(host.hostname for host in host_objects) -
                     set(host.hostname for host in ok_hosts))
    if failing_hosts:
        # Sorted so that the message is stable from one call to the next.
        raise model_logic.ValidationError(
            {'hosts' : 'Host(s) failed to meet job dependencies (' +
                       (', '.join(job_dependencies)) + '): ' +
                       (', '.join(sorted(failing_hosts)))})
331
showard989f25d2008-10-01 11:38:11 +0000332
def check_job_metahost_dependencies(metahost_objects, job_dependencies):
    """
    Check that, for every metahost, at least one host carrying the metahost
    label also satisfies the job's dependencies.

    Dependencies for which provision.is_for_special_action() is true are
    not used to narrow down the hosts.

    @param metahost_objects A list of label objects representing the metahosts.
    @param job_dependencies A list of strings of the required label names.
    @raises NoEligibleHostException If a metahost cannot run the job.
    """
    for metahost in metahost_objects:
        candidates = models.Host.objects.filter(labels=metahost)
        for label_name in job_dependencies:
            if provision.is_for_special_action(label_name):
                continue
            candidates = candidates.filter(labels__name=label_name)
        if any(candidates):
            continue
        raise error.NoEligibleHostException("No hosts within %s satisfy %s."
                % (metahost.name, ', '.join(job_dependencies)))
350
showard2bab8f42008-11-12 18:15:22 +0000351
352def _execution_key_for(host_queue_entry):
353 return (host_queue_entry.job.id, host_queue_entry.execution_subdir)
354
355
def check_abort_synchronous_jobs(host_queue_entries):
    """
    Ensure the user isn't aborting only part of a synchronous autoserv
    execution.

    @param host_queue_entries: the host queue entries about to be aborted.

    @raises model_logic.ValidationError: if, for an entry with an
            execution_subdir, fewer entries of the same execution are
            included than the job's synch_count.
    """
    entries_per_execution = {}
    for entry in host_queue_entries:
        execution = _execution_key_for(entry)
        entries_per_execution[execution] = (
                entries_per_execution.get(execution, 0) + 1)

    for entry in host_queue_entries:
        if not entry.execution_subdir:
            continue
        included = entries_per_execution[_execution_key_for(entry)]
        if included < entry.job.synch_count:
            raise model_logic.ValidationError(
                {'' : 'You cannot abort part of a synchronous job execution '
                      '(%d/%s), %d included, %d expected'
                      % (entry.job.id, entry.execution_subdir,
                         included, entry.job.synch_count)})
showard8fbae652009-01-20 23:23:10 +0000374
375
def check_atomic_group_create_job(synch_count, host_objects, metahost_objects,
                                  dependencies, atomic_group):
    """
    Attempt to reject create_job requests with an atomic group that
    will be impossible to schedule.  The checks are not perfect but
    should catch the most obvious issues.

    @param synch_count - The job's minimum synch count.
    @param host_objects - A list of models.Host instances.
    @param metahost_objects - A list of models.Label instances.
    @param dependencies - A list of job dependency label names.
    @param atomic_group - The atomic group requested for the job; its
            label_set and name are used.

    @raises model_logic.ValidationError - When an issue is found.
    """
    # With explicit hosts only, there must be enough of them to satisfy
    # the synch_count.
    minimum_required = synch_count or 1
    too_few_explicit_hosts = (host_objects and not metahost_objects and
                              len(host_objects) < minimum_required)
    if too_few_explicit_hosts:
        raise model_logic.ValidationError(
                {'hosts':
                 'only %d hosts provided for job with synch_count = %d' %
                 (len(host_objects), synch_count)})

    # Check that the atomic group has a hope of running this job given any
    # supplied metahosts and dependencies that may limit it.

    # Hostnames of every host under any label of the atomic group.
    possible_hosts = set(
            host.hostname
            for group_label in atomic_group.label_set.all()
            for host in group_label.host_set.all())

    # Keep only the hosts that carry every job dependency label.
    for dependency_label in models.Label.objects.filter(name__in=dependencies):
        possible_hosts &= set(
                host.hostname for host in dependency_label.host_set.all())

    if host_objects or metahost_objects:
        host_set = set(host.hostname for host in host_objects)
        unusable_host_set = host_set - possible_hosts
        if unusable_host_set:
            raise model_logic.ValidationError(
                {'hosts': 'Hosts "%s" are not in Atomic Group "%s"' %
                 (', '.join(sorted(unusable_host_set)), atomic_group.name)})
    else:
        # No hosts or metahosts are required to queue an atomic group Job.
        host_set = possible_hosts

    # Merge in the possible hosts that each meta host provides so that they
    # are included in the final count.
    for meta_host in metahost_objects:
        host_set.update(possible_hosts.intersection(
                host.hostname for host in meta_host.host_set.all()))

    if len(host_set) < minimum_required:
        raise model_logic.ValidationError(
                {'atomic_group_name':
                 'Insufficient hosts in Atomic Group "%s" with the'
                 ' supplied dependencies and meta_hosts.' %
                 (atomic_group.name,)})
443
444
def check_modify_host(update_data):
    """
    Sanity check modify_host* requests.

    @param update_data: A dictionary with the changes to make to a host
            or hosts.

    @raises model_logic.ValidationError: if update_data tries to change the
            host status.
    """
    if 'status' not in update_data:
        return
    # Only the scheduler (monitor_db) is allowed to modify Host status.
    # Otherwise race conditions happen as a host's state is changed out from
    # beneath tasks being run on a host.
    raise model_logic.ValidationError({
            'status': 'Host status can not be modified by the frontend.'})
458
459
def check_modify_host_locking(host, update_data):
    """
    Validate a lock/unlock request against the host's current lock state.

    Nothing is checked when update_data carries no 'locked' value.

    @param host: models.Host object to be modified
    @param update_data: A dictionary with the changes to make to the host.

    @raises model_logic.ValidationError: if the host is already in the
            requested state, or a lock is requested without a lock_reason.
    """
    locked = update_data.get('locked', None)
    lock_reason = update_data.get('lock_reason', None)
    if locked is None:
        return

    if locked:
        if host.locked:
            raise model_logic.ValidationError({
                    'locked': 'Host already locked by %s on %s.' %
                    (host.locked_by, host.lock_time)})
        if not lock_reason:
            raise model_logic.ValidationError({
                    'locked': 'Please provide a reason for locking'})
    elif not host.locked:
        raise model_logic.ValidationError({
                'locked': 'Host already unlocked.'})
showardce7c0922009-09-11 18:39:24 +0000481
482
def get_motd():
    """
    Read the message of the day from motd.txt, located two directories
    above the directory containing this file.

    @returns The contents of the file, or '' if it cannot be opened or
            read.
    """
    dirname = os.path.dirname(__file__)
    filename = os.path.join(dirname, "..", "..", "motd.txt")
    try:
        with open(filename, "r") as fp:
            return fp.read()
    except (IOError, OSError):
        # Best effort: a missing or unreadable motd file is not an error.
        # Unlike a bare except, KeyboardInterrupt/SystemExit still propagate.
        return ''
showard29f7cd22009-04-29 21:16:24 +0000497
498
499def _get_metahost_counts(metahost_objects):
500 metahost_counts = {}
501 for metahost in metahost_objects:
502 metahost_counts.setdefault(metahost, 0)
503 metahost_counts[metahost] += 1
504 return metahost_counts
505
506
def get_job_info(job, preserve_metahosts=False, queue_entry_filter_data=None):
    """
    Collect the hosts, metahosts, atomic group and dependencies of a job.

    @param job: the job whose host queue entries are examined.
    @param preserve_metahosts: if true, an entry that has a host is reported
            under its host even when it also has a meta_host.
    @param queue_entry_filter_data: optional filter data used to restrict
            the job's host queue entries via HostQueueEntry.query_objects().

    @returns A dict with keys dependencies, hosts, meta_hosts,
            meta_host_counts, one_time_hosts, atomic_group and hostless.
    """
    hosts = []
    one_time_hosts = []
    meta_hosts = []
    atomic_group = None
    hostless = False

    queue_entries = job.hostqueueentry_set.all()
    if queue_entry_filter_data:
        queue_entries = models.HostQueueEntry.query_objects(
            queue_entry_filter_data, initial_query=queue_entries)

    for queue_entry in queue_entries:
        if (queue_entry.host and (preserve_metahosts or
                                  not queue_entry.meta_host)):
            # Deleted entries are skipped entirely, including the atomic
            # group bookkeeping below.
            if queue_entry.deleted:
                continue
            # Hosts flagged invalid are reported as one-time hosts.
            if queue_entry.host.invalid:
                one_time_hosts.append(queue_entry.host)
            else:
                hosts.append(queue_entry.host)
        elif queue_entry.meta_host:
            meta_hosts.append(queue_entry.meta_host)
        else:
            hostless = True

        if atomic_group is None:
            if queue_entry.atomic_group is not None:
                atomic_group = queue_entry.atomic_group
        else:
            # Report the job's own id here, not the builtin id() function.
            assert atomic_group.name == queue_entry.atomic_group.name, (
                    'DB inconsistency.  HostQueueEntries with multiple atomic'
                    ' groups on job %s: %s != %s' % (
                        job.id, atomic_group.name,
                        queue_entry.atomic_group.name))

    meta_host_counts = _get_metahost_counts(meta_hosts)

    info = dict(dependencies=[label.name for label
                              in job.dependency_labels.all()],
                hosts=hosts,
                meta_hosts=meta_hosts,
                meta_host_counts=meta_host_counts,
                one_time_hosts=one_time_hosts,
                atomic_group=atomic_group,
                hostless=hostless)
    return info
553
554
def check_for_duplicate_hosts(host_objects):
    """
    Reject a host list in which the same host id appears more than once.

    @param host_objects: host objects to check.

    @raises model_logic.ValidationError: naming the duplicated hosts.
    """
    seen_ids = set()
    repeated_hostnames = set()
    for host in host_objects:
        if host.id in seen_ids:
            repeated_hostnames.add(host.hostname)
        else:
            seen_ids.add(host.id)

    if not repeated_hostnames:
        return
    raise model_logic.ValidationError(
            {'hosts' : 'Duplicate hosts: %s'
             % ', '.join(repeated_hostnames)})
567
568
def create_new_job(owner, options, host_objects, metahost_objects,
                   atomic_group=None):
    """
    Validate a job request, then create and queue the job.

    @param owner: owner passed through to models.Job.create().
    @param options: dict of job options.  'dependencies' (label names),
            'synch_count' and 'is_template' are read here; 'dependencies'
            is replaced in place by the matching models.Label objects
            before the job is created.
    @param host_objects: list of host objects the job targets directly.
    @param metahost_objects: list of label objects used as metahosts.
    @param atomic_group: atomic group for the job, or None.

    @returns The id of the newly created job.

    @raises model_logic.ValidationError: if the hosts, synch_count,
            dependencies or atomic group are inconsistent with each other.
    """
    all_host_objects = host_objects + metahost_objects
    dependencies = options.get('dependencies', [])
    synch_count = options.get('synch_count')

    if atomic_group:
        check_atomic_group_create_job(
                synch_count, host_objects, metahost_objects,
                dependencies, atomic_group)
    else:
        if synch_count is not None and synch_count > len(all_host_objects):
            raise model_logic.ValidationError(
                    {'hosts':
                     'only %d hosts provided for job with synch_count = %d' %
                     (len(all_host_objects), synch_count)})
        atomic_hosts = models.Host.objects.filter(
                id__in=[host.id for host in host_objects],
                labels__atomic_group=True)
        unusable_host_names = [host.hostname for host in atomic_hosts]
        if unusable_host_names:
            raise model_logic.ValidationError(
                    {'hosts':
                     'Host(s) "%s" are atomic group hosts but no '
                     'atomic group was specified for this job.' %
                     (', '.join(unusable_host_names),)})

    check_for_duplicate_hosts(host_objects)

    for label_name in dependencies:
        if provision.is_for_special_action(label_name):
            # TODO: We could save a few queries
            # if we had a bulk ensure-label-exists function, which used
            # a bulk .get() call. The win is probably very small.
            _ensure_label_exists(label_name)

    # Directly targeted hosts must each satisfy the dependencies; each
    # metahost only needs at least one host that does.
    check_job_dependencies(host_objects, dependencies)
    check_job_metahost_dependencies(metahost_objects, dependencies)

    options['dependencies'] = list(
            models.Label.objects.filter(name__in=dependencies))

    for label in metahost_objects + options['dependencies']:
        if label.atomic_group and not atomic_group:
            raise model_logic.ValidationError(
                    {'atomic_group_name':
                     'Dependency %r requires an atomic group but no '
                     'atomic_group_name or meta_host in an atomic group was '
                     'specified for this job.' % label.name})
        elif (label.atomic_group and
              label.atomic_group.name != atomic_group.name):
            raise model_logic.ValidationError(
                    {'atomic_group_name':
                     'meta_hosts or dependency %r requires atomic group '
                     '%r instead of the supplied atomic_group_name=%r.' %
                     (label.name, label.atomic_group.name, atomic_group.name)})

    job = models.Job.create(owner=owner, options=options,
                            hosts=all_host_objects)
    job.queue(all_host_objects, atomic_group=atomic_group,
              is_template=options.get('is_template', False))
    return job.id
showard0957a842009-05-11 19:25:08 +0000633
634
def _ensure_label_exists(name):
    """
    Ensure that a label called |name| exists in the Django models.

    This function is to be called from within afe rpcs only, as an
    alternative to server.cros.provision.ensure_label_exists(...).  It works
    by Django model manipulation, rather than by making another create_label
    rpc call.

    @param name: the label to check for/create.

    @returns True if a label was created, False otherwise.
    """
    try:
        models.Label.objects.get(name=name)
    except models.Label.DoesNotExist:
        # create() already saves the new object, so no extra save() is
        # needed afterwards.
        models.Label.objects.create(name=name)
        return True
    return False
656
657
def find_platform_and_atomic_group(host):
    """
    Work out the platform name and atomic group name of a host from its
    label_list.  Either value is None when the host has no such label.

    @param host: host object with hostname and label_list attributes.

    @returns (platform name, atomic group name) for the given host.

    @raises ValueError: if the host has more than one platform label.
    """
    platforms = [label.name for label in host.label_list if label.platform]
    if len(platforms) > 1:
        raise ValueError('Host %s has more than one platform: %s' %
                         (host.hostname, ', '.join(platforms)))
    platform = platforms[0] if platforms else None

    # Don't check for multiple atomic groups on a host here.  That is an
    # error but should not trip up the RPC interface.  monitor_db_cleanup
    # deals with it.  This just returns the first one found.
    atomic_group_name = next(
            (label.atomic_group.name for label in host.label_list
             if label.atomic_group),
            None)
    return platform, atomic_group_name
showardc0ac3a72009-07-08 21:14:45 +0000683
684
685# support for get_host_queue_entries_and_special_tasks()
686
MK Ryu0c1a37d2015-04-30 12:00:55 -0700687def _common_entry_to_dict(entry, type, job_dict, exec_path, status, started_on):
showardc0ac3a72009-07-08 21:14:45 +0000688 return dict(type=type,
MK Ryu0c1a37d2015-04-30 12:00:55 -0700689 host=entry['host'],
showardc0ac3a72009-07-08 21:14:45 +0000690 job=job_dict,
MK Ryu0c1a37d2015-04-30 12:00:55 -0700691 execution_path=exec_path,
692 status=status,
693 started_on=started_on,
694 id=str(entry['id']) + type,
695 oid=entry['id'])
showardc0ac3a72009-07-08 21:14:45 +0000696
697
def _special_task_to_dict(task, queue_entries):
    """Transforms a special task dictionary to another form of dictionary.

    The job detail for the task is taken from the matching entry in
    queue_entries, or fetched from the DB when no entry matches.

    @param task           Special task as a dictionary type
    @param queue_entries  Host queue entries as a list of dictionaries.

    @return Transformed dictionary for a special task.
    """
    job_dict = None
    task_queue_entry = task['queue_entry']
    if task_queue_entry:
        # Use the job detail of the first host queue entry with the same id.
        job_dict = next(
                (qentry['job'] for qentry in queue_entries
                 if task_queue_entry['id'] == qentry['id']),
                None)
        # If not found, get it from DB.
        if job_dict is None:
            job_dict = models.Job.objects.get(
                    id=task_queue_entry['job']).get_object_dict()

    requested_time = time_utils.time_string_to_datetime(
            task['time_requested'])
    exec_path = server_utils.get_special_task_exec_path(
            task['host']['hostname'], task['id'], task['task'],
            requested_time)
    status = server_utils.get_special_task_status(
            task['is_complete'], task['success'], task['is_active'])
    return _common_entry_to_dict(task, task['task'], job_dict,
                                 exec_path, status, task['time_started'])
showardc0ac3a72009-07-08 21:14:45 +0000725
726
def _queue_entry_to_dict(queue_entry):
    """Convert a host queue entry dictionary into the common entry form.

    @param queue_entry Host queue entry as a dictionary type.

    @return Transformed dictionary for a host queue entry.
    """
    job = queue_entry['job']
    job_tag = server_utils.get_job_tag(job['id'], job['owner'])
    hqe_exec_path = server_utils.get_hqe_exec_path(
            job_tag, queue_entry['execution_subdir'])
    return _common_entry_to_dict(
            queue_entry, 'Job', job, hqe_exec_path,
            queue_entry['status'], queue_entry['started_on'])
734
735
def prepare_host_queue_entries_and_special_tasks(interleaved_entries,
                                                 queue_entries):
    """
    Prepare interleaved host queue entries and special tasks for
    serialization.

    Every element of interleaved_entries is a dictionary. A special task
    dictionary only carries a job id and lacks the job detail, while a host
    queue entry dictionary has it, so queue_entries is used to look the job
    detail up.

    @param interleaved_entries Host queue entries and special tasks as a list
                               of dictionaries.
    @param queue_entries Host queue entries as a list of dictionaries.

    @return A post-processed list of dictionaries that is to be serialized.
    """
    # An entry with the key "task" is a special task; anything else is a
    # host queue entry.
    converted = [
        _special_task_to_dict(entry, queue_entries) if 'task' in entry
        else _queue_entry_to_dict(entry)
        for entry in interleaved_entries]
    return prepare_for_serialization(converted)
showardc0ac3a72009-07-08 21:14:45 +0000762
763
def _compute_next_job_for_tasks(queue_entries, special_tasks):
    """
    For each task, try to figure out the next job that ran after that task.
    This is done using two pieces of information:
    * if the task has a queue entry, we can use that entry's job ID.
    * if the task has a time_started, we can try to compare that against the
      started_on field of queue_entries. this isn't guaranteed to work perfectly
      since queue_entries may also have null started_on values.
    * if the task has neither, or if use of time_started fails, just use the
      last computed job ID.

    The result is stored in place: every task dictionary gets a 'next_job_id'
    key (possibly None). Nothing is returned.

    @param queue_entries Host queue entries as a list of dictionaries.
    @param special_tasks Special tasks as a list of dictionaries.
    """
    next_job_id = None # most recently computed next job
    hqe_index = 0 # index for scanning by started_on times
    for task in special_tasks:
        if task['queue_entry']:
            next_job_id = task['queue_entry']['job']
        elif task['time_started'] is not None:
            # Scan the not-yet-consumed queue entries; every entry that
            # started at or after the task updates next_job_id, and the scan
            # stops at the first entry that started before the task.
            for queue_entry in queue_entries[hqe_index:]:
                if queue_entry['started_on'] is None:
                    continue
                t1 = time_utils.time_string_to_datetime(
                        queue_entry['started_on'])
                t2 = time_utils.time_string_to_datetime(task['time_started'])
                if t1 < t2:
                    break
                next_job_id = queue_entry['job']['id']

        # Tasks with neither a queue entry nor a usable time_started inherit
        # the value computed for the previous task.
        task['next_job_id'] = next_job_id

        # advance hqe_index to just after next_job_id
        # NOTE(review): this presumably relies on queue_entries being ordered
        # by descending job id, as interleave_entries() requires -- confirm.
        if next_job_id is not None:
            for queue_entry in queue_entries[hqe_index:]:
                if queue_entry['job']['id'] < next_job_id:
                    break
                hqe_index += 1
802
803
def interleave_entries(queue_entries, special_tasks):
    """
    Merge host queue entries and special tasks into a single list.

    Both lists should be ordered by descending ID. Each special task gets a
    'next_job_id' key as a side effect.

    @param queue_entries Host queue entries as a list of dictionaries.
    @param special_tasks Special tasks as a list of dictionaries.

    @return A list containing all queue entries and special tasks.
    """
    _compute_next_job_for_tasks(queue_entries, special_tasks)

    merged = []
    task_pos = 0
    task_count = len(special_tasks)

    # Tasks that have run since the last job come first.
    while (task_pos < task_count and
           special_tasks[task_pos]['next_job_id'] is None):
        merged.append(special_tasks[task_pos])
        task_pos += 1

    # Each queue entry is followed by the tasks that ran between its job and
    # the previous one.
    for hqe in queue_entries:
        merged.append(hqe)
        while (task_pos < task_count and
               not (special_tasks[task_pos]['next_job_id'] <
                    hqe['job']['id'])):
            merged.append(special_tasks[task_pos])
            task_pos += 1

    return merged
jamesren4a41e012010-07-16 22:33:48 +0000829
830
def bucket_hosts_by_shard(host_objs, rpc_hostnames=False):
    """Group the hostnames of the given hosts by the shard they are on.

    Hosts without a shard are left out of the result.

    @param host_objs: A list of host objects.
    @param rpc_hostnames: If True, the rpc_hostnames of a shard are returned
        instead of the 'real' shard hostnames. This only matters for testing
        environments.

    @return: A map of shard hostname: list of hosts on the shard.
    """
    hosts_by_shard = {}
    for host_obj in host_objs:
        if not host_obj.shard:
            continue
        if rpc_hostnames:
            shard_key = host_obj.shard.rpc_hostname()
        else:
            shard_key = host_obj.shard.hostname
        if shard_key not in hosts_by_shard:
            hosts_by_shard[shard_key] = []
        hosts_by_shard[shard_key].append(host_obj.hostname)
    return hosts_by_shard
848
849
def get_create_job_common_args(local_args):
    """
    Pick out the arguments that create_job_common() accepts.

    Note that local_args['priority'] is overwritten in place with the default
    priority when it is a string.

    @param local_args: Dictionary of argument names to values; it must
            contain a 'priority' key.

    @returns A new dict holding only the entries of local_args whose names
            are parameters of create_job_common().
    """
    # This code is only here to not kill suites scheduling tests when priority
    # becomes an int instead of a string.
    if isinstance(local_args['priority'], str):
        local_args['priority'] = priorities.Priority.DEFAULT
    # </migration hack>
    accepted_names = inspect.getargspec(create_job_common)[0]
    return dict((arg_name, arg_value)
                for arg_name, arg_value in local_args.iteritems()
                if arg_name in accepted_names)
864
865
def create_job_common(name, priority, control_type, control_file=None,
                      hosts=(), meta_hosts=(), one_time_hosts=(),
                      atomic_group_name=None, synch_count=None,
                      is_template=False, timeout=None, timeout_mins=None,
                      max_runtime_mins=None, run_verify=True, email_list='',
                      dependencies=(), reboot_before=None, reboot_after=None,
                      parse_failed_repair=None, hostless=False, keyvals=None,
                      drone_set=None, parameterized_job=None,
                      parent_job_id=None, test_retry=0, run_reset=True,
                      require_ssp=None):
    #pylint: disable-msg=C0111
    """
    Common code between creating "standard" jobs and creating parameterized jobs

    Validates the host-related arguments, resolves hosts, meta hosts and the
    atomic group into objects, and hands everything to create_new_job() with
    the current user as owner.

    @param hosts: Hosts to run on; resolved with models.Host.smart_get_bulk.
    @param meta_hosts: Label names. A name that is not a label but matches an
            atomic group name selects that atomic group instead.
    @param one_time_hosts: Hosts created via
            models.Host.create_one_time_host; cannot be combined with an
            atomic group.
    @param atomic_group_name: Explicit atomic group name. If empty it may be
            derived from the meta host labels.
    @param synch_count: If set, must not exceed the atomic group's
            max_number_of_machines.
    @param hostless: If True, no hosts of any kind may be given and
            control_type must be the server control type. It is only used
            for validation here and is not part of the job options.

    All remaining parameters are passed through unchanged as job options.

    @raises model_logic.ValidationError: if the arguments are inconsistent.
    @raises ValueError: when called on the master (not a shard) with hosts
            that span several shards, or one shard and the master.

    @returns The return value of create_new_job().
    """
    user = models.User.current_user()
    owner = user.login

    # input validation
    if not (hosts or meta_hosts or one_time_hosts or atomic_group_name
            or hostless):
        raise model_logic.ValidationError({
            'arguments' : "You must pass at least one of 'hosts', "
                          "'meta_hosts', 'one_time_hosts', "
                          "'atomic_group_name', or 'hostless'"
            })

    if hostless:
        if hosts or meta_hosts or one_time_hosts or atomic_group_name:
            raise model_logic.ValidationError({
                    'hostless': 'Hostless jobs cannot include any hosts!'})
        server_type = control_data.CONTROL_TYPE_NAMES.SERVER
        if control_type != server_type:
            raise model_logic.ValidationError({
                    'control_type': 'Hostless jobs cannot use client-side '
                                    'control files'})

    # Load all atomic groups and the labels named in meta_hosts up front so
    # the per-name lookups below are plain dictionary lookups.
    atomic_groups_by_name = dict((ag.name, ag)
                                 for ag in models.AtomicGroup.objects.all())
    label_objects = list(models.Label.objects.filter(name__in=meta_hosts))

    # Schedule on an atomic group automagically if one of the labels given
    # is an atomic group label and no explicit atomic_group_name was supplied.
    if not atomic_group_name:
        for label in label_objects:
            if label and label.atomic_group:
                atomic_group_name = label.atomic_group.name
                break
    # convert hostnames & meta hosts to host/label objects
    host_objects = models.Host.smart_get_bulk(hosts)
    if not server_utils.is_shard():
        shard_host_map = bucket_hosts_by_shard(host_objects)
        num_shards = len(shard_host_map)
        if (num_shards > 1 or (num_shards == 1 and
                len(shard_host_map.values()[0]) != len(host_objects))):
            # We disallow the following jobs on master:
            #   num_shards > 1: this is a job spanning across multiple shards.
            #   num_shards == 1 but number of hosts on shard is less
            #   than total number of hosts: this is a job that spans across
            #   one shard and the master.
            raise ValueError(
                    'The following hosts are on shard(s), please create '
                    'seperate jobs for hosts on each shard: %s ' %
                    shard_host_map)
    metahost_objects = []
    meta_host_labels_by_name = {label.name: label for label in label_objects}
    for label_name in meta_hosts or []:
        if label_name in meta_host_labels_by_name:
            metahost_objects.append(meta_host_labels_by_name[label_name])
        elif label_name in atomic_groups_by_name:
            # If given a metahost name that isn't a Label, check to
            # see if the user was specifying an Atomic Group instead.
            atomic_group = atomic_groups_by_name[label_name]
            if atomic_group_name and atomic_group_name != atomic_group.name:
                raise model_logic.ValidationError({
                        'meta_hosts': (
                                'Label "%s" not found.  If assumed to be an '
                                'atomic group it would conflict with the '
                                'supplied atomic group "%s".' % (
                                        label_name, atomic_group_name))})
            atomic_group_name = atomic_group.name
        else:
            raise model_logic.ValidationError(
                {'meta_hosts' : 'Label "%s" not found' % label_name})

    # Create and sanity check an AtomicGroup object if requested.
    if atomic_group_name:
        if one_time_hosts:
            raise model_logic.ValidationError(
                    {'one_time_hosts':
                     'One time hosts cannot be used with an Atomic Group.'})
        atomic_group = models.AtomicGroup.smart_get(atomic_group_name)
        if synch_count and synch_count > atomic_group.max_number_of_machines:
            raise model_logic.ValidationError(
                    {'atomic_group_name' :
                     'You have requested a synch_count (%d) greater than the '
                     'maximum machines in the requested Atomic Group (%d).' %
                     (synch_count, atomic_group.max_number_of_machines)})
    else:
        atomic_group = None

    # One time hosts are created here and scheduled like regular hosts.
    for host in one_time_hosts or []:
        this_host = models.Host.create_one_time_host(host)
        host_objects.append(this_host)

    options = dict(name=name,
                   priority=priority,
                   control_file=control_file,
                   control_type=control_type,
                   is_template=is_template,
                   timeout=timeout,
                   timeout_mins=timeout_mins,
                   max_runtime_mins=max_runtime_mins,
                   synch_count=synch_count,
                   run_verify=run_verify,
                   email_list=email_list,
                   dependencies=dependencies,
                   reboot_before=reboot_before,
                   reboot_after=reboot_after,
                   parse_failed_repair=parse_failed_repair,
                   keyvals=keyvals,
                   drone_set=drone_set,
                   parameterized_job=parameterized_job,
                   parent_job_id=parent_job_id,
                   test_retry=test_retry,
                   run_reset=run_reset,
                   require_ssp=require_ssp)
    return create_new_job(owner=owner,
                          options=options,
                          host_objects=host_objects,
                          metahost_objects=metahost_objects,
                          atomic_group=atomic_group)
Simran Basib6ec8ae2014-04-23 12:05:08 -0700997
998
def encode_ascii(control_file):
    """Force a control file to only contain ascii characters.

    @param control_file: Control file to encode.

    @returns the control file in an ascii encoding.

    @raises error.ControlFileMalformed: if encoding fails.
    """
    try:
        return control_file.encode('ascii')
    except UnicodeError as e:
        # A byte string with non-ascii bytes fails with UnicodeDecodeError
        # (implicit decode), while a unicode string with non-ascii characters
        # fails with UnicodeEncodeError. UnicodeError covers both.
        raise error.ControlFileMalformed(str(e))
1012
1013
def get_wmatrix_url():
    """Look up the wmatrix url in the global configuration.

    @returns the 'wmatrix_url' value of the AUTOTEST_WEB section, or an
            empty string when it is not configured.
    """
    config = global_config.global_config
    return config.get_config_value('AUTOTEST_WEB', 'wmatrix_url', default='')
Jiaxi Luo57bc1952014-07-22 15:27:30 -07001022
1023
def inject_times_to_filter(start_time_key=None, end_time_key=None,
                           start_time_value=None, end_time_value=None,
                           **filter_data):
    """Add start and end time entries to the filter when values are given.

    A time entry is only added when its value is truthy.

    @param start_time_key: A string represents the filter key of start_time.
    @param end_time_key: A string represents the filter key of end_time.
    @param start_time_value: Start_time value.
    @param end_time_value: End_time value.
    @param filter_data: The remaining filter key/value pairs.

    @returns the injected filter_data.
    """
    time_entries = ((start_time_key, start_time_value),
                    (end_time_key, end_time_value))
    for time_key, time_value in time_entries:
        if time_value:
            filter_data[time_key] = time_value
    return filter_data
1041
1042
def inject_times_to_hqe_special_tasks_filters(filter_data_common,
                                              start_time, end_time):
    """Build the hqe and special task filters with start and end time added.

    Host queue entries are filtered on 'started_on', special tasks on
    'time_started'.

    @param filter_data_common: Common filter for hqe and special tasks.
    @param start_time: Start time value, or a false value to skip it.
    @param end_time: End time value, or a false value to skip it.

    @returns a pair of hqe and special tasks filters.
    """
    special_tasks_base = filter_data_common.copy()
    hqe_filter = inject_times_to_filter(
            'started_on__gte', 'started_on__lte', start_time, end_time,
            **filter_data_common)
    special_tasks_filter = inject_times_to_filter(
            'time_started__gte', 'time_started__lte', start_time, end_time,
            **special_tasks_base)
    return (hqe_filter, special_tasks_filter)
1059
1060
def retrieve_shard(shard_hostname):
    """
    Look up the shard with the given hostname in the database.

    The lookup is timed under 'shard_heartbeat.retrieve_shard'.

    @param shard_hostname: Hostname of the shard to retrieve

    @raises models.Shard.DoesNotExist, if no shard with this hostname was found.

    @returns: Shard object
    """
    with autotest_stats.Timer('shard_heartbeat.retrieve_shard'):
        shard = models.Shard.smart_get(shard_hostname)
        return shard
Jakob Juelich59cfe542014-09-02 16:37:46 -07001074
1075
def find_records_for_shard(shard, known_job_ids, known_host_ids):
    """Collect the records that should be sent to a shard.

    Each lookup is timed separately under the 'shard_heartbeat' timer.

    @param shard: Shard to find records for.
    @param known_job_ids: List of ids of jobs the shard already has.
    @param known_host_ids: List of ids of hosts the shard already has.

    @returns: Tuple of three lists for hosts, jobs, and suite job keyvals:
              (hosts, jobs, suite_job_keyvals).
    """
    heartbeat_timer = autotest_stats.Timer('shard_heartbeat')
    with heartbeat_timer.get_client('find_hosts'):
        hosts = models.Host.assign_to_shard(shard, known_host_ids)
    with heartbeat_timer.get_client('find_jobs'):
        jobs = models.Job.assign_to_shard(shard, known_job_ids)
    with heartbeat_timer.get_client('find_suite_job_keyvals'):
        # Keyvals are looked up for the parent jobs of the assigned jobs.
        suite_job_keyvals = models.JobKeyval.objects.filter(
                job_id__in=[job.parent_job_id for job in jobs])
    return (hosts, jobs, suite_job_keyvals)
Jakob Juelicha94efe62014-09-18 16:02:49 -07001096
1097
def _persist_records_with_type_sent_from_shard(
        shard, records, record_type, *args, **kwargs):
    """
    Check and apply records of one type that a shard sent to the master.

    Every record must already exist on the master. It is sanity checked and
    then updated from its serialized form.

    @param shard: The shard the records were sent from.
    @param records: The records sent in their serialized format.
    @param record_type: Type of the objects represented by records.
    @param args: Additional arguments that will be passed on to the sanity
                 checks.
    @param kwargs: Additional arguments that will be passed on to the sanity
                   checks.

    @raises error.UnallowedRecordsSentToMaster if any of the sanity checks fail.

    @returns: List of primary keys of the processed records.
    """
    processed_pks = []
    for record_data in records:
        record_pk = record_data['id']
        try:
            existing = record_type.objects.get(pk=record_pk)
        except record_type.DoesNotExist:
            message = ('Object with pk %s of type %s does not exist on '
                       'master.' % (record_pk, record_type))
            raise error.UnallowedRecordsSentToMaster(message)

        existing.sanity_check_update_from_shard(
                shard, record_data, *args, **kwargs)
        existing.update_from_serialized(record_data)
        processed_pks.append(record_pk)
    return processed_pks
1131
1132
def persist_records_sent_from_shard(shard, jobs, hqes):
    """
    Sanity check and save the serialized records a shard sent to the master.

    During heartbeats shards upload jobs and host queue entries. They are
    sanity checked and the existing records for those entries are then
    updated with the versions from the heartbeat.

    The sanity checks include:
    - Checking if the objects sent already exist on the master.
    - Checking if the objects sent were assigned to this shard.
    - Host queue entries must be sent together with their jobs.

    @param shard: The shard the records were sent from.
    @param jobs: The jobs the shard sent.
    @param hqes: The host queue entries the shard sent.

    @raises error.UnallowedRecordsSentToMaster if any of the sanity checks fail.
    """
    heartbeat_timer = autotest_stats.Timer('shard_heartbeat')

    # Jobs go first: their ids are needed to check the host queue entries.
    with heartbeat_timer.get_client('persist_jobs'):
        sent_job_ids = _persist_records_with_type_sent_from_shard(
                shard, jobs, models.Job)

    with heartbeat_timer.get_client('persist_hqes'):
        _persist_records_with_type_sent_from_shard(
                shard, hqes, models.HostQueueEntry,
                job_ids_sent=sent_job_ids)
Jakob Juelich50e91f72014-10-01 12:43:23 -07001160
1161
def forward_single_host_rpc_to_shard(func):
    """This decorator forwards rpc calls that modify a host to a shard.

    If a host is assigned to a shard, rpcs that change its attributes should
    be forwarded to the shard. The rpc is forwarded first and then also
    executed locally.

    This assumes the decorated function is called with keyword arguments only
    and that the keyword argument 'id' identifies the host.

    @param func: The function to decorate

    @returns: The function to replace func with.
    """
    # wraps() keeps the name and docstring of the rpc on the replacement, so
    # another decorator stacked on top still sees the real rpc name.
    @wraps(func)
    def replacement(**kwargs):
        # Only keyword arguments can be accepted here, as we need the argument
        # names to send the rpc. serviceHandler always provides arguments with
        # their keywords, so this is not a problem.
        host = models.Host.smart_get(kwargs['id'])
        if host.shard and not server_utils.is_shard():
            run_rpc_on_multiple_hostnames(func.func_name,
                                          [host.shard.rpc_hostname()],
                                          **kwargs)
        return func(**kwargs)

    return replacement
1186
1187
def forward_multi_host_rpc_to_shards(func):
    """This decorator forwards rpc calls that modify multiple hosts.

    If a host is assigned to a shard, rpcs that change its attributes should
    be forwarded to the shard. Some calls however, take a list of hosts and a
    single id to modify, eg: label_add_hosts. This wrapper will sift through
    the list of hosts, find each of their shards, and forward the rpc for
    those hosts to that shard before calling the local version of the given rpc.

    This assumes:
        1. The rpc call uses `smart_get` to retrieve host objects, not the
           stock django `get` call. This is true for most, if not all rpcs in
           the rpc_interface.
        2. The kwargs to the function contain either a list of host ids or
           hostnames, keyed under 'hosts'. This is true for all the rpc
           functions that use 'smart_get'.

    @param func: The function to decorate

    @returns: The function to replace func with.
    """
    # wraps() keeps the name and docstring of the rpc on the replacement, so
    # another decorator stacked on top still sees the real rpc name.
    @wraps(func)
    def replacement(**kwargs):
        fanout_rpc(
                models.Host.smart_get_bulk(kwargs['hosts']),
                func.func_name, **kwargs)
        return func(**kwargs)

    return replacement
1216
1217
MK Ryufb5e3a82015-07-01 12:21:20 -07001218def fanout_rpc(host_objs, rpc_name, include_hostnames=True, **kwargs):
1219 """Fanout the given rpc to shards of given hosts.
1220
1221 @param host_objs: Host objects for the rpc.
1222 @param rpc_name: The name of the rpc.
1223 @param include_hostnames: If True, include the hostnames in the kwargs.
1224 Hostnames are not always necessary, this functions is designed to
1225 send rpcs to the shard a host is on, the rpcs themselves could be
1226 related to labels, acls etc.
1227 @param kwargs: The kwargs for the rpc.
1228 """
1229 # Figure out which hosts are on which shards.
1230 shard_host_map = bucket_hosts_by_shard(
1231 host_objs, rpc_hostnames=True)
1232
1233 # Execute the rpc against the appropriate shards.
1234 for shard, hostnames in shard_host_map.iteritems():
1235 if include_hostnames:
1236 kwargs['hosts'] = hostnames
1237 try:
1238 run_rpc_on_multiple_hostnames(rpc_name, [shard], **kwargs)
1239 except:
1240 ei = sys.exc_info()
1241 new_exc = error.RPCException('RPC %s failed on shard %s due to '
1242 '%s: %s' % (rpc_name, shard, ei[0].__name__, ei[1]))
1243 raise new_exc.__class__, new_exc, ei[2]
1244
1245
def run_rpc_on_multiple_hostnames(rpc_call, shard_hostnames, **kwargs):
    """Run the same rpc against several AFEs, one after another.

    This is used, for example, to propagate changes made to hosts after they
    are assigned to a shard.

    @param rpc_call: Name of the rpc endpoint to call.
    @param shard_hostnames: List of hostnames to run the rpcs on.
    @param **kwargs: Keyword arguments to pass in the rpcs.
    """
    # Make sure this function is not called on shards but only on master.
    assert not server_utils.is_shard()
    for target_hostname in shard_hostnames:
        frontend_wrappers.RetryingAFE(server=target_hostname).run(
                rpc_call, **kwargs)
MK Ryu9c5fbbe2015-02-11 15:46:22 -08001261
1262
def get_label(name):
    """Gets a label object using a given name.

    @param name: Label name.
    @return: a label object matching the given name, or None when there is
             no label matching the given name.
    """
    try:
        return models.Label.smart_get(name)
    except models.Label.DoesNotExist:
        return None
1276
1277
def get_global_afe_hostname():
    """Return the 'global_afe_hostname' value of the SHARD config section."""
    config = global_config.global_config
    return config.get_config_value('SHARD', 'global_afe_hostname')
1282
1283
def route_rpc_to_master(func):
    """Route RPC to master AFE.

    On a shard the call is sent to the global AFE under the name of func and
    its result is returned; otherwise func is called locally. In both cases
    the arguments are passed as keyword arguments.

    @param func: The function to decorate

    @returns: The function to replace func with.
    """
    @wraps(func)
    def replacement(*args, **kwargs):
        # Bind positional arguments to their names, as the rpc can only be
        # sent with keyword arguments.
        call_args = inspect.getcallargs(func, *args, **kwargs)
        if not server_utils.is_shard():
            return func(**call_args)
        master_afe = frontend_wrappers.RetryingAFE(
                server=get_global_afe_hostname())
        return master_afe.run(func.func_name, **call_args)
    return replacement