"""\
Utility functions for rpc_interface.py. We keep them in a separate file so that
only RPC interface functions go into that file.
"""
5
6__author__ = 'showard@google.com (Steve Howard)'
7
showard14374b12009-01-31 00:11:54 +00008import datetime, os
showard3d6ae112009-05-02 00:45:48 +00009import django.http
mblighec5546d2008-06-16 16:51:28 +000010from frontend.afe import models, model_logic
mblighe8819cd2008-02-15 16:48:40 +000011
# Sentinel objects standing in for "no date"; _prepare_data() serializes
# exactly these objects (compared by identity) as None.
NULL_DATETIME = datetime.datetime.max
NULL_DATE = datetime.date.max
14
def prepare_for_serialization(objects):
    """
    Prepare Python objects to be returned via RPC.

    A non-empty list whose first element is a dict containing an 'id' key is
    first reduced to one dict per distinct id (see gather_unique_dicts());
    whatever results is then converted by _prepare_data().

    @param objects - The value to prepare.

    @returns The converted value.
    """
    looks_like_object_dicts = (isinstance(objects, list) and len(objects) and
                               isinstance(objects[0], dict) and
                               'id' in objects[0])
    if looks_like_object_dicts:
        return _prepare_data(gather_unique_dicts(objects))
    return _prepare_data(objects)
showardb8d34242008-04-25 18:11:16 +000023
24
def prepare_rows_as_nested_dicts(query, nested_dict_column_names):
    """
    Prepare a Django query to be returned via RPC as a sequence of nested
    dictionaries.

    @param query - A Django model query object with a select_related() method.
    @param nested_dict_column_names - A list of column/attribute names for the
            rows returned by query to expand into nested dictionaries using
            their get_object_dict() method when not None.

    @returns A list suitable to be returned in an RPC.
    """
    def expand(row):
        # Start from the row's flat dict, then swap each non-None nested
        # column for the dict of the related object.
        as_dict = row.get_object_dict()
        for name in nested_dict_column_names:
            if as_dict[name] is None:
                continue
            as_dict[name] = getattr(row, name).get_object_dict()
        return as_dict

    return prepare_for_serialization(
        [expand(row) for row in query.select_related()])
45
46
def _prepare_data(data):
    """
    Recursively process data structures, performing necessary type
    conversions to values in data to allow for RPC serialization:
    -convert dates and datetimes to strings (the NULL_DATETIME and NULL_DATE
     sentinel objects become None)
    -convert tuples, sets and frozensets to lists

    @param data - The value to convert.  Dict values are converted, dict keys
            are left as they are.

    @returns A new structure with the conversions applied; values of any
            other type are returned unchanged.
    """
    if isinstance(data, dict):
        # items() rather than iteritems() so this works on Python 2 and 3.
        return dict((key, _prepare_data(value))
                    for key, value in data.items())
    if isinstance(data, (list, tuple, set, frozenset)):
        return [_prepare_data(item) for item in data]
    if isinstance(data, datetime.date):
        # datetime.datetime is a subclass of datetime.date, so both land here.
        # The sentinels are matched by identity, not by value.
        if data is NULL_DATETIME or data is NULL_DATE:
            return None
        return str(data)
    return data
mblighe8819cd2008-02-15 16:48:40 +000068
69
def raw_http_response(response_data, content_type=None):
    """
    Wrap response_data in a Django HttpResponse with an explicit length.

    @param response_data - The body, handed to django.http.HttpResponse.
    @param content_type - Passed as HttpResponse's mimetype argument.

    @returns The HttpResponse, with its Content-length header set to the
            length of the response's content.
    """
    http_response = django.http.HttpResponse(response_data,
                                             mimetype=content_type)
    content_length = len(http_response.content)
    http_response['Content-length'] = str(content_length)
    return http_response
74
75
def gather_unique_dicts(dict_iterable):
    """
    Pick out unique objects (by ID) from an iterable of object dicts.

    @param dict_iterable - An iterable of dicts, each with an 'id' key.

    @returns A list holding, in input order, the first dict seen for each
            distinct 'id' value.
    """
    seen_ids = set()
    unique = []
    for entry in dict_iterable:
        entry_id = entry['id']
        if entry_id in seen_ids:
            continue
        seen_ids.add(entry_id)
        unique.append(entry)
    return unique
showardb0dfb9f2008-06-06 18:08:02 +000087
88
def extra_job_filters(not_yet_run=False, running=False, finished=False):
    """
    Generate a SQL WHERE clause for job status filtering, and return it in
    a dict of keyword args to pass to query.extra().  No more than one of
    the parameters should be passed as True.

    @param not_yet_run - Select jobs with no active or complete queue entry.
    @param running - Select jobs with at least one active or complete queue
            entry and at least one incomplete or active queue entry.
    @param finished - Select jobs with no incomplete or active queue entry.

    @returns {'where': [clause]} for the selected filter, or {} when no
            filter is selected.
    """
    selected = [flag for flag in (not_yet_run, running, finished) if flag]
    assert len(selected) <= 1, ('Cannot specify more than one '
                                'filter to this function')

    if not_yet_run:
        return {'where': ['id NOT IN (SELECT job_id FROM host_queue_entries '
                          'WHERE active OR complete)']}
    if running:
        return {'where': ['(id IN (SELECT job_id FROM host_queue_entries '
                          'WHERE active OR complete)) AND '
                          '(id IN (SELECT job_id FROM host_queue_entries '
                          'WHERE not complete OR active))']}
    if finished:
        return {'where': ['id NOT IN (SELECT job_id FROM host_queue_entries '
                          'WHERE not complete OR active)']}
    return {}
mblighe8819cd2008-02-15 16:48:40 +0000113
114
def extra_host_filters(multiple_labels=()):
    """
    Generate SQL WHERE clauses for matching hosts in an intersection of
    labels.

    @param multiple_labels - Label identifiers, each resolved with
            models.Label.smart_get().  Defaults to no labels.

    @returns A dict with 'where' (one clause per label) and 'params' (the
            matching label ids), suitable as keyword args for query.extra().
    """
    where_str = ('hosts.id in (select host_id from hosts_labels '
                 'where label_id=%s)')
    # Resolve the ids first so the clause count always matches the params.
    label_ids = [models.Label.smart_get(label).id
                 for label in multiple_labels]
    return {'where': [where_str] * len(label_ids), 'params': label_ids}
showard8e3aa5e2008-04-08 19:42:32 +0000127
128
def get_host_query(multiple_labels, exclude_only_if_needed_labels, filter_data):
    """
    Build the query for valid hosts matching the given labels and filters.

    @param multiple_labels - Labels passed on to extra_host_filters().
    @param exclude_only_if_needed_labels - When true, and at least one valid
            label has only_if_needed set, an excluding join on hosts_labels
            restricted to those label ids is added to the query.
    @param filter_data - Filter dict handed to models.Host.query_objects().
            Its 'extra_args' entry is overwritten in place.

    @returns The result of models.Host.query_objects().
    """
    host_query = models.Host.valid_objects.all()
    if exclude_only_if_needed_labels:
        excluded_labels = models.Label.valid_objects.filter(
            only_if_needed=True)
        # Skip the join entirely when there is nothing to put in the IN list.
        if excluded_labels.count() > 0:
            id_strings = [str(row['id'])
                          for row in excluded_labels.values('id')]
            condition = ('hosts_labels_exclude.label_id IN (%s)'
                         % ','.join(id_strings))
            host_query = models.Host.objects.add_join(
                host_query, 'hosts_labels', join_key='host_id',
                join_condition=condition,
                suffix='_exclude', exclude=True)
    filter_data['extra_args'] = extra_host_filters(multiple_labels)
    return models.Host.query_objects(filter_data, initial_query=host_query)
144
145
class InconsistencyException(Exception):
    """
    Raised when a list of objects does not have a consistent value.

    get_consistent_value() raises it with two arguments: the first object of
    the list and the first object whose field value differs from it.
    """
showard8fd58242008-03-10 21:29:07 +0000148
149
def get_consistent_value(objects, field):
    """
    Return the value of an attribute that all of the given objects share.

    @param objects - An indexable sequence of objects.
    @param field - Name of the attribute to compare.

    @returns The common attribute value, or None when objects is empty.

    @raises InconsistencyException - With (first object, differing object)
            as arguments when some object's value differs from the first's.
    """
    if not objects:
        # well a list of nothing is consistent
        return None

    reference = getattr(objects[0], field)
    for candidate in objects:
        if getattr(candidate, field) != reference:
            raise InconsistencyException(objects[0], candidate)
    return reference
showard8fd58242008-03-10 21:29:07 +0000161
162
def prepare_generate_control_file(tests, kernel, label, profilers):
    """
    Resolve the inputs needed to generate a control file.

    @param tests - Test identifiers, each resolved with
            models.Test.smart_get().
    @param kernel - Not used by this function.
    @param label - Label identifier resolved with models.Label.smart_get()
            when true; otherwise returned as given.
    @param profilers - Profiler identifiers, each resolved with
            models.Profiler.smart_get().

    @returns A tuple (cf_info, test_objects, profiler_objects, label) where
            cf_info is a dict with keys is_server, synch_count and
            dependencies.

    @raises model_logic.ValidationError - When the tests do not all share the
            same test_type.
    """
    test_objects = [models.Test.smart_get(test) for test in tests]
    profiler_objects = [models.Profiler.smart_get(profiler)
                        for profiler in profilers]
    # ensure tests are all the same type
    try:
        test_type = get_consistent_value(test_objects, 'test_type')
    except InconsistencyException as exc:
        test1, test2 = exc.args
        raise model_logic.ValidationError(
            {'tests' : 'You cannot run both server- and client-side '
                       'tests together (tests %s and %s differ)' % (
                           test1.name, test2.name)})

    is_server = (test_type == models.Test.Types.SERVER)
    if test_objects:
        synch_count = max(test.sync_count for test in test_objects)
    else:
        synch_count = 1
    if label:
        label = models.Label.smart_get(label)

    # Names of every label attached to any of the tests.  The loop variable
    # is deliberately not called "label" so it cannot be confused with the
    # parameter returned below.
    dependencies = set(
        dependency_label.name for dependency_label
        in models.Label.objects.filter(test__in=test_objects))

    cf_info = dict(is_server=is_server, synch_count=synch_count,
                   dependencies=list(dependencies))
    return cf_info, test_objects, profiler_objects, label
showard989f25d2008-10-01 11:38:11 +0000191
192
def check_job_dependencies(host_objects, job_dependencies):
    """
    Check that a set of machines satisfies a job's dependencies.

    @param host_objects - list of models.Host objects
    @param job_dependencies - list of names of labels

    @raises model_logic.ValidationError - Listing, in sorted order, the
            hostnames of the given hosts that lack one or more of the
            dependency labels.
    """
    # check that hosts satisfy dependencies
    host_ids = [host.id for host in host_objects]
    ok_hosts = models.Host.objects.filter(id__in=host_ids)
    # Narrow the query once per dependency; each join gets its own suffix.
    for index, dependency in enumerate(job_dependencies):
        ok_hosts &= models.Host.objects.filter_custom_join(
            '_label%d' % index, labels__name=dependency)
    failing_hosts = (set(host.hostname for host in host_objects) -
                     set(host.hostname for host in ok_hosts))
    if failing_hosts:
        # Sorted so the message is deterministic rather than in set order.
        raise model_logic.ValidationError(
            {'hosts' : 'Host(s) failed to meet job dependencies: ' +
                       ', '.join(sorted(failing_hosts))})
212
showard2bab8f42008-11-12 18:15:22 +0000213
def _execution_key_for(host_queue_entry):
    """
    Build the key identifying the execution a queue entry belongs to.

    @param host_queue_entry - An object with job.id and execution_subdir.

    @returns The tuple (job id, execution subdir).
    """
    job_id = host_queue_entry.job.id
    subdir = host_queue_entry.execution_subdir
    return (job_id, subdir)
216
217
def check_abort_synchronous_jobs(host_queue_entries):
    """
    Ensure the user isn't aborting part of a synchronous autoserv execution.

    @param host_queue_entries - The queue entries about to be aborted.  They
            are iterated twice.

    @raises model_logic.ValidationError - When, for some entry with an
            execution_subdir, fewer entries of the same (job, subdir)
            execution are included than the job's synch_count.
    """
    # How many of the given entries belong to each execution.
    entries_per_execution = {}
    for entry in host_queue_entries:
        execution = _execution_key_for(entry)
        entries_per_execution[execution] = (
            entries_per_execution.get(execution, 0) + 1)

    for entry in host_queue_entries:
        if entry.execution_subdir:
            included = entries_per_execution[_execution_key_for(entry)]
            expected = entry.job.synch_count
            if included < expected:
                raise model_logic.ValidationError(
                    {'' : 'You cannot abort part of a synchronous job execution '
                          '(%d/%s), %d included, %d expected'
                          % (entry.job.id, entry.execution_subdir,
                             included, expected)})
showard8fbae652009-01-20 23:23:10 +0000236
237
def check_atomic_group_create_job(synch_count, host_objects, metahost_objects,
                                  dependencies, atomic_group, labels_by_name):
    """
    Attempt to reject create_job requests with an atomic group that
    will be impossible to schedule.  The checks are not perfect but
    should catch the most obvious issues.

    @param synch_count - The job's minimum synch count.
    @param host_objects - A list of models.Host instances.
    @param metahost_objects - A list of models.Label instances.
    @param dependencies - A list of job dependency label names.
    @param atomic_group - The models.AtomicGroup instance.
    @param labels_by_name - A dictionary mapping label names to models.Label
            instance.  Used to look up instances for dependencies.

    @raises model_logic.ValidationError - When an issue is found.
    """
    # If specific host objects were supplied with an atomic group, verify
    # that there are enough to satisfy the synch_count.
    minimum_required = synch_count or 1
    if host_objects and not metahost_objects:
        if len(host_objects) < minimum_required:
            raise model_logic.ValidationError(
                {'hosts':
                 'only %d hosts provided for job with synch_count = %d' %
                 (len(host_objects), synch_count)})

    # Check that the atomic group has a hope of running this job
    # given any supplied metahosts and dependencies that may limit.

    # Hostnames of every host under any label of the atomic group.
    possible_hosts = set()
    for group_label in atomic_group.label_set.all():
        for host in group_label.host_set.all():
            possible_hosts.add(host.hostname)

    # Keep only the hosts that carry every job dependency label.
    for dependency_name in set(dependencies):
        dependency_hosts = labels_by_name[dependency_name].host_set.all()
        possible_hosts &= set(host.hostname for host in dependency_hosts)

    if host_objects or metahost_objects:
        host_set = set(host.hostname for host in host_objects)
        unusable_host_set = host_set - possible_hosts
        if unusable_host_set:
            raise model_logic.ValidationError(
                {'hosts': 'Hosts "%s" are not in Atomic Group "%s"' %
                 (', '.join(sorted(unusable_host_set)), atomic_group.name)})
    else:
        # No hosts or metahosts are required to queue an atomic group Job.
        # However, if they are given, we respect them above and below.
        host_set = possible_hosts

    # Merge in the usable hosts that each meta host can provide, for the
    # final count.
    for meta_host in metahost_objects:
        meta_host_names = set(h.hostname for h in meta_host.host_set.all())
        host_set |= possible_hosts & meta_host_names

    if len(host_set) < minimum_required:
        raise model_logic.ValidationError(
            {'atomic_group_name':
             'Insufficient hosts in Atomic Group "%s" with the'
             ' supplied dependencies and meta_hosts.' %
             (atomic_group.name,)})
307
308
def get_motd():
    """
    Read the message of the day from motd.txt, located two directories above
    the directory containing this file.

    @returns The contents of the file, or '' when it cannot be opened or
            read.
    """
    dirname = os.path.dirname(__file__)
    filename = os.path.join(dirname, "..", "..", "motd.txt")
    text = ''
    try:
        fp = open(filename, "r")
        try:
            text = fp.read()
        finally:
            fp.close()
    except (IOError, OSError):
        # The motd is best effort: a missing or unreadable file just means
        # no message.  Anything else (e.g. KeyboardInterrupt) propagates.
        pass

    return text
showard29f7cd22009-04-29 21:16:24 +0000323
324
def _get_metahost_counts(metahost_objects):
    """
    Count how many times each metahost appears.

    @param metahost_objects - An iterable of hashable metahost objects.

    @returns A dict mapping each distinct metahost to its occurrence count.
    """
    counts = {}
    for metahost in metahost_objects:
        counts[metahost] = counts.get(metahost, 0) + 1
    return counts
331
332
def get_job_info(job, preserve_metahosts=False, queue_entry_filter_data=None):
    """
    Summarize the hosts, metahosts, dependencies and atomic group of a job.

    @param job - The job whose host queue entries are examined.
    @param preserve_metahosts - When true, an entry that has a host is
            reported by that host even if it also has a meta_host.  When
            false, such an entry is reported by its meta_host instead.
    @param queue_entry_filter_data - Optional filter data passed to
            models.HostQueueEntry.query_objects() to restrict which of the
            job's queue entries are considered.

    @returns A dict with keys dependencies (label names), hosts,
            meta_hosts, meta_host_counts, one_time_hosts (hosts flagged
            invalid) and atomic_group.
    """
    hosts = []
    one_time_hosts = []
    meta_hosts = []
    atomic_group = None

    queue_entries = job.hostqueueentry_set.all()
    if queue_entry_filter_data:
        queue_entries = models.HostQueueEntry.query_objects(
            queue_entry_filter_data, initial_query=queue_entries)

    for queue_entry in queue_entries:
        if (queue_entry.host and (preserve_metahosts or
                                  not queue_entry.meta_host)):
            if queue_entry.deleted:
                # Deleted entries are skipped entirely, including the
                # atomic group check below.
                continue
            if queue_entry.host.invalid:
                one_time_hosts.append(queue_entry.host)
            else:
                hosts.append(queue_entry.host)
        else:
            # NOTE(review): an entry with neither host nor meta_host appends
            # None here -- confirm that is intended.
            meta_hosts.append(queue_entry.meta_host)
        if atomic_group is None:
            if queue_entry.atomic_group is not None:
                atomic_group = queue_entry.atomic_group
        else:
            # NOTE(review): once a group has been seen, a later entry with
            # atomic_group None raises AttributeError here -- confirm whether
            # such a mix can occur.
            assert atomic_group.name == queue_entry.atomic_group.name, (
                'DB inconsistency. HostQueueEntries with multiple atomic'
                ' groups on job %s: %s != %s' % (
                    job.id, atomic_group.name,
                    queue_entry.atomic_group.name))

    meta_host_counts = _get_metahost_counts(meta_hosts)

    info = dict(dependencies=[label.name for label
                              in job.dependency_labels.all()],
                hosts=hosts,
                meta_hosts=meta_hosts,
                meta_host_counts=meta_host_counts,
                one_time_hosts=one_time_hosts,
                atomic_group=atomic_group)
    return info
374
375
def create_new_job(owner, options, host_objects, metahost_objects,
                   atomic_group=None):
    """
    Validate a job request, then create and queue the job.

    @param owner - Passed to models.Job.create() as the job owner.
    @param options - Dict of job options.  'dependencies' (label names),
            'synch_count' and 'is_template' are read here; 'dependencies' is
            replaced in place by the corresponding Label objects.
    @param host_objects - A list of models.Host instances.
    @param metahost_objects - A list of models.Label instances.
    @param atomic_group - Optional atomic group for the job.

    @returns The id of the newly created job.

    @raises model_logic.ValidationError - When the request fails one of the
            host count, dependency or atomic group checks.
    """
    labels_by_name = {}
    for known_label in models.Label.objects.all():
        labels_by_name[known_label.name] = known_label
    all_host_objects = host_objects + metahost_objects
    requested_per_label = _get_metahost_counts(metahost_objects)
    dependencies = options.get('dependencies', [])
    synch_count = options.get('synch_count')

    # check that each metahost request has enough hosts under the label
    for label, requested_count in requested_per_label.items():
        available_count = label.host_set.count()
        if requested_count > available_count:
            error = ("You have requested %d %s's, but there are only %d."
                     % (requested_count, label.name, available_count))
            raise model_logic.ValidationError({'meta_hosts' : error})

    if not atomic_group:
        provided_count = len(all_host_objects)
        if synch_count is not None and synch_count > provided_count:
            raise model_logic.ValidationError(
                {'hosts':
                 'only %d hosts provided for job with synch_count = %d' %
                 (provided_count, synch_count)})
        # Explicitly requested hosts must not belong to an atomic group when
        # the job itself has none.
        atomic_hosts = models.Host.objects.filter(
            id__in=[host.id for host in host_objects],
            labels__atomic_group=True)
        unusable_host_names = [host.hostname for host in atomic_hosts]
        if unusable_host_names:
            raise model_logic.ValidationError(
                {'hosts':
                 'Host(s) "%s" are atomic group hosts but no '
                 'atomic group was specified for this job.' %
                 (', '.join(unusable_host_names),)})
    else:
        check_atomic_group_create_job(
            synch_count, host_objects, metahost_objects,
            dependencies, atomic_group, labels_by_name)

    check_job_dependencies(host_objects, dependencies)
    options['dependencies'] = [labels_by_name[label_name]
                               for label_name in dependencies]

    # Every metahost or dependency label tied to an atomic group must agree
    # with the atomic group requested for the job.
    for label in metahost_objects + options['dependencies']:
        required_group = label.atomic_group
        if not required_group:
            continue
        if not atomic_group:
            raise model_logic.ValidationError(
                {'atomic_group_name':
                 'Dependency %r requires an atomic group but no '
                 'atomic_group_name or meta_host in an atomic group was '
                 'specified for this job.' % label.name})
        if required_group.name != atomic_group.name:
            raise model_logic.ValidationError(
                {'atomic_group_name':
                 'meta_hosts or dependency %r requires atomic group '
                 '%r instead of the supplied atomic_group_name=%r.' %
                 (label.name, required_group.name, atomic_group.name)})

    job = models.Job.create(owner=owner, options=options,
                            hosts=all_host_objects)
    job.queue(all_host_objects, atomic_group=atomic_group,
              is_template=options.get('is_template', False))
    return job.id
showard0957a842009-05-11 19:25:08 +0000439
440
def find_platform_and_atomic_group(host):
    """
    Figure out the platform name and atomic group name for the given host
    object.  If none, the return value for either will be None.

    @param host - An object with hostname and label_list attributes.

    @returns (platform name, atomic group name) for the given host.

    @raises ValueError - When the host has more than one platform label.
    """
    platform_names = [label.name for label in host.label_list
                      if label.platform]
    if len(platform_names) > 1:
        raise ValueError('Host %s has more than one platform: %s' %
                         (host.hostname, ', '.join(platform_names)))
    platform = None
    if platform_names:
        platform = platform_names[0]

    # Don't check for multiple atomic groups on a host here.  That is an
    # error but should not trip up the RPC interface.  monitor_db_cleanup
    # deals with it.  This just returns the first one found.
    atomic_group_name = None
    for label in host.label_list:
        if label.atomic_group:
            atomic_group_name = label.atomic_group.name
            break
    return platform, atomic_group_name
465 return platform, atomic_group_name