blob: 72fbfae47261427fed482709d369c74b004c064f [file] [log] [blame]
Dan Shi4df39252013-03-19 13:19:45 -07001# pylint: disable-msg=C0111
2
Chris Masone859fdec2012-01-30 08:38:09 -08003# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
4# Use of this source code is governed by a BSD-style license that can be
5# found in the LICENSE file.
6
7__author__ = 'cmasone@chromium.org (Chris Masone)'
8
Michael Tang9afc74b2016-03-21 10:19:23 -07009# The boto module is only available/used in Moblab for validation of cloud
10# storage access. The module is not available in the test lab environment,
11# and the import error is handled.
12try:
13 import boto
14except ImportError:
15 boto = None
Chris Masone859fdec2012-01-30 08:38:09 -080016import common
Simran Basi773a86e2015-05-13 19:15:42 -070017import ConfigParser
Chris Masonea8066a92012-05-01 16:52:31 -070018import datetime
Chris Masone859fdec2012-01-30 08:38:09 -080019import logging
Simran Basi71206ef2014-08-13 13:51:18 -070020import os
Michael Tang9afc74b2016-03-21 10:19:23 -070021import re
Simran Basi71206ef2014-08-13 13:51:18 -070022import shutil
Michael Tang9afc74b2016-03-21 10:19:23 -070023import socket
Aviv Keshetd83ef442013-01-16 16:19:35 -080024
Jakob Juelich82b7d1c2014-09-15 16:10:57 -070025from autotest_lib.frontend.afe import models
Matthew Sartorid96fb9b2015-05-19 18:04:58 -070026from autotest_lib.client.common_lib import control_data
Aviv Keshetd83ef442013-01-16 16:19:35 -080027from autotest_lib.client.common_lib import error
Simran Basi71206ef2014-08-13 13:51:18 -070028from autotest_lib.client.common_lib import global_config
Alex Miller7d658cf2013-09-04 16:00:35 -070029from autotest_lib.client.common_lib import priorities
Dan Shidfea3682014-08-10 23:38:40 -070030from autotest_lib.client.common_lib import time_utils
Chris Masone859fdec2012-01-30 08:38:09 -080031from autotest_lib.client.common_lib.cros import dev_server
Gabe Black1e1c41b2015-02-04 23:55:15 -080032from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Jakob Juelich9fffe4f2014-08-14 18:07:05 -070033from autotest_lib.frontend.afe import rpc_utils
Simran Basib6ec8ae2014-04-23 12:05:08 -070034from autotest_lib.server import utils
Dan Shi36cfd832014-10-10 13:38:51 -070035from autotest_lib.server.cros import provision
Chris Masone44e4d6c2012-08-15 14:25:53 -070036from autotest_lib.server.cros.dynamic_suite import constants
Chris Masoneb4935552012-08-14 12:05:54 -070037from autotest_lib.server.cros.dynamic_suite import control_file_getter
Chris Masone44e4d6c2012-08-15 14:25:53 -070038from autotest_lib.server.cros.dynamic_suite import tools
Dan Shi36cfd832014-10-10 13:38:51 -070039from autotest_lib.server.cros.dynamic_suite.suite import Suite
Simran Basi71206ef2014-08-13 13:51:18 -070040from autotest_lib.server.hosts import moblab_host
Dan Shidfea3682014-08-10 23:38:40 -070041from autotest_lib.site_utils import host_history
Dan Shi193905e2014-07-25 23:33:09 -070042from autotest_lib.site_utils import job_history
Dan Shid7bb4f12015-01-06 10:53:50 -080043from autotest_lib.site_utils import server_manager_utils
Dan Shi6964fa52014-12-18 11:04:27 -080044from autotest_lib.site_utils import stable_version_utils
Simran Basi71206ef2014-08-13 13:51:18 -070045
46
# Shared handle on the parsed global/shadow configuration.
_CONFIG = global_config.global_config
# Location of the boto credentials file on a Moblab device.
MOBLAB_BOTO_LOCATION = '/home/moblab/.boto'

# Google Cloud Storage bucket url regex pattern. The pattern is used to extract
# the bucket name from the bucket URL. For example, "gs://image_bucket/google"
# should result in a bucket name "image_bucket".
GOOGLE_STORAGE_BUCKET_URL_PATTERN = re.compile(
        r'gs://(?P<bucket>[a-zA-Z][a-zA-Z0-9-_]*)/?.*')

# Constants used in JSON RPC field names.
_USE_EXISTING_BOTO_FILE = 'use_existing_boto_file'
_GS_ACCESS_KEY_ID = 'gs_access_key_id'
_GS_SECRETE_ACCESS_KEY = 'gs_secret_access_key'
_IMAGE_STORAGE_SERVER = 'image_storage_server'
_RESULT_STORAGE_SERVER = 'results_storage_server'
62
63
Chris Masonef8b53062012-05-08 22:14:18 -070064# Relevant CrosDynamicSuiteExceptions are defined in client/common_lib/error.py.
Chris Masone859fdec2012-01-30 08:38:09 -080065
66
def canonicalize_suite_name(suite_name):
    """Return the control file path used for a suite.

    @param suite_name: short suite name, e.g. 'bvt'.

    @return: the string 'test_suites/control.<suite_name>'.
    """
    # Do not change this naming convention without updating
    # site_utils.parse_job_name.
    return 'test_suites/control.%s' % suite_name
71
72
def formatted_now():
    """Return the current local time formatted with time_utils.TIME_FMT."""
    return datetime.datetime.now().strftime(time_utils.TIME_FMT)
Chris Masoneaa10f8e2012-05-15 13:34:21 -070075
76
def _get_control_file_contents_by_name(build, ds, suite_name):
    """Return control file contents for |suite_name|.

    Query the dev server at |ds| for the control file |suite_name|, included
    in |build|.

    @param build: unique name by which to refer to the image from now on.
    @param ds: a dev_server.DevServer instance to fetch control file with.
    @param suite_name: canonicalized suite name, e.g. test_suites/control.bvt.
    @raises ControlFileNotFound if a unique suite control file doesn't exist.
    @raises NoControlFileList if we can't list the control files at all.
    @raises ControlFileEmpty if the control file exists on the server, but
                             can't be read.
    @raises ControlFileMalformed if the control file contains non-ascii
                                 characters.

    @return the contents of the desired control file.
    """
    getter = control_file_getter.DevServerGetter.create(build, ds)
    # Stat key is built from the devserver name (dots replaced so they do not
    # split the key) and the text after the last '.' of the suite name.
    server_name = ds.get_server_name(ds.url()).replace('.', '_')
    timer = autotest_stats.Timer('control_files.parse.%s.%s' %
                                 (server_name, suite_name.rsplit('.')[-1]))
    # Get the control file for the suite.
    try:
        with timer:
            control_file_in = getter.get_control_file_contents_by_name(
                    suite_name)
    except error.CrosDynamicSuiteException as e:
        # Re-raise the same exception type with the build appended for context.
        raise type(e)("%s while testing %s." % (e, build))
    if not control_file_in:
        raise error.ControlFileEmpty(
                "Fetching %s returned no data." % suite_name)
    # Force control files to only contain ascii characters.
    try:
        control_file_in.encode('ascii')
    except UnicodeError as e:
        # UnicodeError covers both UnicodeDecodeError (byte strings holding
        # non-ascii data) and UnicodeEncodeError (unicode strings).
        raise error.ControlFileMalformed(str(e))

    return control_file_in
115
116
def _stage_build_artifacts(build):
    """
    Ensure components of |build| necessary for installing images are staged.

    @param build image we want to stage.

    @raises StageControlFileFailure: if the dev server throws 500 while staging
        suite control files.

    @return: a tuple (ds, timings) where ds is the dev_server instance
             resolved for this build and timings is a dictionary containing
             the staging start/end times.
    """
    timings = {}
    # Only the 'test_suites' artifact is staged here; it carries the suite
    # control files needed to create the suite job.
    ds = dev_server.resolve(build)
    timings[constants.DOWNLOAD_STARTED_TIME] = formatted_now()
    timer = autotest_stats.Timer('control_files.stage.%s' % (
            ds.get_server_name(ds.url()).replace('.', '_')))
    try:
        with timer:
            ds.stage_artifacts(image=build, artifacts=['test_suites'])
    except dev_server.DevServerException as e:
        raise error.StageControlFileFailure(
                "Failed to stage %s: %s" % (build, e))
    timings[constants.PAYLOAD_FINISHED_TIME] = formatted_now()
    return (ds, timings)
145
146
@rpc_utils.route_rpc_to_master
def create_suite_job(name='', board='', build='', pool='', control_file='',
                     check_hosts=True, num=None, file_bugs=False, timeout=24,
                     timeout_mins=None, priority=priorities.Priority.DEFAULT,
                     suite_args=None, wait_for_results=True, job_retry=False,
                     max_retries=None, max_runtime_mins=None, suite_min_duts=0,
                     offload_failures_only=False, builds=None,
                     test_source_build=None, run_prod_code=False,
                     delay_minutes=0, **kwargs):
    """
    Create a job to run a test suite on the given device with the given image.

    When the timeout specified in the control file is reached, the
    job is guaranteed to have completed and results will be available.

    @param name: The test name if control_file is supplied, otherwise the name
                 of the test suite to run, e.g. 'bvt'.
    @param board: the kind of device to run the tests on.
    @param build: unique name by which to refer to the image from now on.
    @param builds: the builds to install e.g.
                   {'cros-version:': 'x86-alex-release/R18-1655.0.0',
                    'fw-version:':  'x86-alex-firmware/R36-5771.50.0',
                    'fwro-version:':  'x86-alex-firmware/R36-5771.49.0'}
                   If builds is given a value, it overrides argument build.
                   None (the default) is treated as an empty dictionary.
    @param test_source_build: Build that contains the server-side test code.
    @param pool: Specify the pool of machines to use for scheduling
            purposes.
    @param check_hosts: require appropriate live hosts to exist in the lab.
    @param num: Specify the number of machines to schedule across (integer).
                Leave unspecified or use None to use default sharding factor.
    @param file_bugs: File a bug on each test failure in this suite.
    @param timeout: The max lifetime of this suite, in hours.
    @param timeout_mins: The max lifetime of this suite, in minutes. Takes
                         priority over timeout.
    @param priority: Integer denoting priority. Higher is more important.
    @param suite_args: Optional arguments which will be parsed by the suite
                       control file. Used by control.test_that_wrapper to
                       determine which tests to run.
    @param wait_for_results: Set to False to run the suite job without waiting
                             for test jobs to finish. Default is True.
    @param job_retry: Set to True to enable job-level retry. Default is False.
    @param max_retries: Integer, maximum job retries allowed at suite level.
                        None for no max.
    @param max_runtime_mins: Maximum amount of time a job can be running in
                             minutes.
    @param suite_min_duts: Integer. Scheduler will prioritize getting the
                           minimum number of machines for the suite when it is
                           competing with another suite that has a higher
                           priority but already got minimum machines it needs.
    @param offload_failures_only: Only enable gs_offloading for failed jobs.
    @param run_prod_code: If True, the suite will run the test code that
                          lives in prod aka the test code currently on the
                          lab servers. If False, the control files and test
                          code for this suite run will be retrieved from the
                          build artifacts.
    @param delay_minutes: Delay the creation of test jobs for a given number of
                          minutes.
    @param kwargs: extra keyword args. NOT USED.

    @raises SuiteArgumentException: if num is neither an integer nor None.
    @raises ControlFileNotFound: if a unique suite control file doesn't exist.
    @raises NoControlFileList: if we can't list the control files at all.
    @raises StageControlFileFailure: If the dev server throws 500 while
                                     staging test_suites.
    @raises ControlFileEmpty: if the control file exists on the server, but
                              can't be read.

    @return: the job ID of the suite, as returned by
             rpc_utils.create_job_common.
    """
    if type(num) is not int and num is not None:
        raise error.SuiteArgumentException('Ill specified num argument %r. '
                                           'Must be an integer or None.' % num)
    if num == 0:
        logging.warning("Can't run on 0 hosts; using default.")
        num = None

    # A fresh dictionary per call; avoids sharing one mutable default object
    # across RPC invocations.
    if builds is None:
        builds = {}

    # TODO(dshi): crbug.com/496782 Remove argument build and its reference after
    # R45 falls out of stable channel.
    if build and not builds:
        builds = {provision.CROS_VERSION_PREFIX: build}

    # Default test source build to CrOS build if it's not specified and
    # run_prod_code is set to False.
    if not run_prod_code:
        test_source_build = Suite.get_test_source_build(
                builds, test_source_build=test_source_build)

    suite_name = canonicalize_suite_name(name)
    if run_prod_code:
        # Prod code: read the suite control file from the local drone
        # installation instead of staging build artifacts.
        ds = dev_server.resolve(build)
        keyvals = {}
        getter = control_file_getter.FileSystemGetter(
                [_CONFIG.get_config_value('SCHEDULER',
                                          'drone_installation_directory')])
        control_file = getter.get_control_file_contents_by_name(suite_name)
    else:
        (ds, keyvals) = _stage_build_artifacts(test_source_build)
    keyvals[constants.SUITE_MIN_DUTS_KEY] = suite_min_duts

    if not control_file:
        # No control file was supplied so look it up from the build artifacts.
        control_file = _get_control_file_contents_by_name(test_source_build,
                                                          ds, suite_name)
    # Do not change this naming convention without updating
    # site_utils.parse_job_name.
    if not run_prod_code:
        name = '%s-%s' % (test_source_build, suite_name)
    else:
        # If run_prod_code is True, test_source_build is not set, use the
        # first build in the builds list for the suite job name.
        name = '%s-%s' % (builds.values()[0], suite_name)

    # The hour-based timeout is the fallback for both minute-based limits.
    timeout_mins = timeout_mins or timeout * 60
    max_runtime_mins = max_runtime_mins or timeout * 60

    if not board:
        board = utils.ParseBuildName(builds[provision.CROS_VERSION_PREFIX])[0]

    # TODO(dshi): crbug.com/496782 Remove argument build and its reference after
    # R45 falls out of stable channel.
    # Prepend build and board to the control file.
    inject_dict = {'board': board,
                   'build': builds.get(provision.CROS_VERSION_PREFIX),
                   'builds': builds,
                   'check_hosts': check_hosts,
                   'pool': pool,
                   'num': num,
                   'file_bugs': file_bugs,
                   'timeout': timeout,
                   'timeout_mins': timeout_mins,
                   'devserver_url': ds.url(),
                   'priority': priority,
                   'suite_args' : suite_args,
                   'wait_for_results': wait_for_results,
                   'job_retry': job_retry,
                   'max_retries': max_retries,
                   'max_runtime_mins': max_runtime_mins,
                   'offload_failures_only': offload_failures_only,
                   'test_source_build': test_source_build,
                   'run_prod_code': run_prod_code,
                   'delay_minutes': delay_minutes,
                   }

    control_file = tools.inject_vars(inject_dict, control_file)

    return rpc_utils.create_job_common(name,
                                       priority=priority,
                                       timeout_mins=timeout_mins,
                                       max_runtime_mins=max_runtime_mins,
                                       control_type='Server',
                                       control_file=control_file,
                                       hostless=True,
                                       keyvals=keyvals)
Simran Basi71206ef2014-08-13 13:51:18 -0700300
301
302# TODO: hide the following rpcs under is_moblab
def moblab_only(func):
    """Ensure moblab specific functions only run on Moblab devices.

    @param func: the RPC function to guard.

    @return: a wrapper that raises error.RPCException unless
             utils.is_moblab() is true, and otherwise calls func.
    """
    import functools

    @functools.wraps(func)
    def verify(*args, **kwargs):
        if not utils.is_moblab():
            # Format the message here; passing the name as a second exception
            # argument would leave the '%s' placeholder unexpanded.
            raise error.RPCException(
                    'RPC: %s can only run on Moblab Systems!' % func.__name__)
        return func(*args, **kwargs)
    return verify
311
312
@moblab_only
def get_config_values():
    """Returns all config values parsed from global and shadow configs.

    Config values are grouped by sections, and each section is composed of
    a list of name value pairs.

    @return: a dictionary mapping section name to its list of
             (name, value) pairs, prepared for serialization.
    """
    config_values = {}
    for section in _CONFIG.get_sections():
        config_values[section] = _CONFIG.config.items(section)
    return rpc_utils.prepare_for_serialization(config_values)
Simran Basi71206ef2014-08-13 13:51:18 -0700325
326
def _write_config_file(config_file, config_values, overwrite=False):
    """Writes out a configuration file.

    Nothing is written when config_values is falsy.

    @param config_file: The name of the configuration file.
    @param config_values: The ConfigParser object.
    @param overwrite: Flag on if overwriting is allowed.

    @raises RPCException: if config_file is empty, or if the file already
                          exists and overwrite is False.
    """
    if not config_file:
        raise error.RPCException('Empty config file name.')
    if not overwrite and os.path.exists(config_file):
        raise error.RPCException('Config file already exists.')

    if config_values:
        # Use a separate name for the handle so the path argument is not
        # shadowed.
        with open(config_file, 'w') as config_handle:
            config_values.write(config_handle)
342
343
def _read_original_config():
    """Reads the original configuration without shadow.

    @return: A configuration object, see global_config_class.
    """
    original_config = global_config.global_config_class()
    # An empty shadow file name leaves the shadow overrides out.
    original_config.set_config_files(shadow_file='')
    return original_config
352
353
def _read_raw_config(config_file):
    """Reads the raw configuration from a configuration file.

    @param: config_file: The path of the configuration file.

    @return: A ConfigParser object.
    """
    shadow_config = ConfigParser.RawConfigParser()
    shadow_config.read(config_file)
    return shadow_config
364
365
def _get_shadow_config_from_partial_update(config_values):
    """Finds out the new shadow configuration based on a partial update.

    Since the input is only a partial config, we should not lose the config
    data inside the existing shadow config file. We also need to distinguish
    if the input config info overrides with a new value or reverts back to
    an original value.

    @param config_values: See get_moblab_settings().

    @return: The new shadow configuration as ConfigParser object.
    """
    original_config = _read_original_config()
    existing_shadow = _read_raw_config(_CONFIG.shadow_file)
    for section, config_value_list in config_values.iteritems():
        for key, value in config_value_list:
            original_value = original_config.get_config_value(
                    section, key, default='', allow_blank=True)
            if original_value != value:
                # The value differs from the original: record an override.
                if not existing_shadow.has_section(section):
                    existing_shadow.add_section(section)
                existing_shadow.set(section, key, value)
            elif existing_shadow.has_option(section, key):
                # The value reverts to the original: drop the stale override.
                existing_shadow.remove_option(section, key)
    return existing_shadow
391
392
def _update_partial_config(config_values):
    """Updates the shadow configuration file with a partial config update.

    @param config_values: See get_moblab_settings().
    """
    existing_config = _get_shadow_config_from_partial_update(config_values)
    _write_config_file(_CONFIG.shadow_file, existing_config, True)
400
401
@moblab_only
def update_config_handler(config_values):
    """Update config values and override shadow config.

    Builds a new shadow configuration holding only the values that differ
    from the original configuration, writes it over the shadow config file
    and reboots the machine.

    @param config_values: See get_moblab_settings().

    @raises RPCException: if the shadow config file does not exist.
    """
    original_config = _read_original_config()
    new_shadow = ConfigParser.RawConfigParser()
    for section, config_value_list in config_values.iteritems():
        for key, value in config_value_list:
            original_value = original_config.get_config_value(
                    section, key, default='', allow_blank=True)
            if original_value != value:
                if not new_shadow.has_section(section):
                    new_shadow.add_section(section)
                new_shadow.set(section, key, value)

    if not _CONFIG.shadow_file or not os.path.exists(_CONFIG.shadow_file):
        raise error.RPCException('Shadow config file does not exist.')
    _write_config_file(_CONFIG.shadow_file, new_shadow, True)

    # TODO (sbasi) crbug.com/403916 - Remove the reboot command and
    # instead restart the services that rely on the config values.
    os.system('sudo reboot')
426
427
@moblab_only
def reset_config_settings():
    """Empty the shadow config file and reboot the machine."""
    # Opening for write truncates the file; nothing is written back.
    with open(_CONFIG.shadow_file, 'w'):
        pass
    os.system('sudo reboot')
433
434
@moblab_only
def set_boto_key(boto_key):
    """Update the boto_key file.

    @param boto_key: File name of boto_key uploaded through handle_file_upload.

    @raises RPCException: if boto_key does not exist.
    """
    if not os.path.exists(boto_key):
        raise error.RPCException('Boto key: %s does not exist!' % boto_key)
    shutil.copyfile(boto_key, moblab_host.MOBLAB_BOTO_LOCATION)
Dan Shi193905e2014-07-25 23:33:09 -0700444
445
@moblab_only
def set_launch_control_key(launch_control_key):
    """Update the launch_control_key file.

    @param launch_control_key: File name of launch_control_key uploaded through
            handle_file_upload.

    @raises RPCException: if launch_control_key does not exist.
    """
    if not os.path.exists(launch_control_key):
        raise error.RPCException('Launch Control key: %s does not exist!' %
                                 launch_control_key)
    shutil.copyfile(launch_control_key,
                    moblab_host.MOBLAB_LAUNCH_CONTROL_KEY_LOCATION)
    # Restart the devserver service.
    os.system('sudo restart moblab-devserver-init')
460
461
Michael Tang9afc74b2016-03-21 10:19:23 -0700462###########Moblab Config Wizard RPCs #######################
def _get_public_ip_address(socket_handle):
    """Gets the public IP address.

    Connects the given socket to 8.8.8.8 port 53 with a one second timeout
    and reads the local address the socket was bound to.

    @param: socket_handle: a socket object; it is not closed here.

    @return: public ip address as string, or None if the connection failed
             or no socket name was available.
    """
    try:
        socket_handle.settimeout(1)
        socket_handle.connect(('8.8.8.8', 53))
        socket_name = socket_handle.getsockname()
        if socket_name is not None:
            logging.info('Got socket name from UDP socket.')
            return socket_name[0]
        logging.warning('Created UDP socket but with no socket_name.')
    except socket.error:
        logging.warning('Could not get socket name from UDP socket.')
    return None
484
485
def _get_network_info():
    """Gets the network information.

    TCP socket is used to test the connectivity. If there is no connectivity,
    try to get the public IP with UDP socket. Both sockets are closed before
    returning.

    @return: a tuple as (public_ip_address, connected_to_internet).
    """
    tcp_socket = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
    try:
        ip = _get_public_ip_address(tcp_socket)
    finally:
        tcp_socket.close()
    if ip is not None:
        logging.info('Established TCP connection with well known server.')
        return (ip, True)

    udp_socket = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)
    try:
        return (_get_public_ip_address(udp_socket), False)
    finally:
        udp_socket.close()
501
502
@moblab_only
def get_network_info():
    """Returns the server ip addresses, and the server connectivity.

    The server ip addresses are returned as an array of strings under
    'server_ips' (omitted when no address was found), and the connectivity
    as a flag under 'is_connected'.

    @return: the network information prepared for serialization.
    """
    network_info = {}
    ip_address, is_connected = _get_network_info()
    if ip_address is not None:
        network_info['server_ips'] = [ip_address]
    network_info['is_connected'] = is_connected

    return rpc_utils.prepare_for_serialization(network_info)
517
518
# Gets the boto configuration.
def _get_boto_config():
    """Reads the boto configuration from the boto file.

    @return: Boto configuration as ConfigParser object.
    """
    boto_config = ConfigParser.ConfigParser()
    boto_config.read(MOBLAB_BOTO_LOCATION)
    return boto_config
528
529
@moblab_only
def get_cloud_storage_info():
    """RPC handler to get the cloud storage access information.

    Reports the image and result storage servers from the CROS config
    section, whether the boto file has any section, and the access key id
    and secret from its 'Credentials' section when present.

    @return: the cloud storage information prepared for serialization.
    """
    cloud_storage_info = {}
    for field in (_IMAGE_STORAGE_SERVER, _RESULT_STORAGE_SERVER):
        value = _CONFIG.get_config_value('CROS', field)
        if value is not None:
            cloud_storage_info[field] = value

    boto_config = _get_boto_config()
    sections = boto_config.sections()

    # Any section at all counts as an existing, usable boto file.
    cloud_storage_info[_USE_EXISTING_BOTO_FILE] = bool(sections)

    if 'Credentials' in sections:
        options = boto_config.options('Credentials')
        for field in (_GS_ACCESS_KEY_ID, _GS_SECRETE_ACCESS_KEY):
            if field in options:
                cloud_storage_info[field] = boto_config.get('Credentials',
                                                            field)

    return rpc_utils.prepare_for_serialization(cloud_storage_info)
559
560
def _get_bucket_name_from_url(bucket_url):
    """Gets the bucket name from a bucket url.

    @param: bucket_url: the bucket url string.

    @return: the bucket name matched by GOOGLE_STORAGE_BUCKET_URL_PATTERN,
             or None if the url is empty or does not match.
    """
    if not bucket_url:
        return None
    match = GOOGLE_STORAGE_BUCKET_URL_PATTERN.match(bucket_url)
    if match:
        return match.group('bucket')
    return None
571
572
def _is_valid_boto_key(key_id, key_secret):
    """Checks if the boto key is valid.

    The key is considered valid when listing all buckets with it succeeds.

    @param: key_id: The boto key id string.
    @param: key_secret: The boto key string.

    @return: A tuple as (valid_boolean, details_string).
    """
    if not key_id or not key_secret:
        return (False, "Empty key id or secret.")
    conn = boto.connect_gs(key_id, key_secret)
    try:
        # Only success or failure matters; the bucket list itself is unused.
        conn.get_all_buckets()
        return (True, None)
    except boto.exception.GSResponseError:
        details = "The boto access key is not valid"
        return (False, details)
    finally:
        conn.close()
592
593
def _is_valid_bucket(key_id, key_secret, bucket_name):
    """Checks if a bucket is valid and accessible.

    @param: key_id: The boto key id string.
    @param: key_secret: The boto key string.
    @param: bucket name string.

    @return: A tuple as (valid_boolean, details_string).
    """
    if not key_id or not key_secret or not bucket_name:
        return (False, "Server error: invalid argument")
    conn = boto.connect_gs(key_id, key_secret)
    try:
        bucket = conn.lookup(bucket_name)
    finally:
        # Close the connection even if the lookup raises.
        conn.close()
    if bucket:
        return (True, None)
    return (False, "Bucket %s does not exist." % bucket_name)
611
612
def _is_valid_bucket_url(key_id, key_secret, bucket_url):
    """Validates the bucket url is accessible.

    @param: key_id: The boto key id string.
    @param: key_secret: The boto key string.
    @param: bucket url string.

    @return: A tuple as (valid_boolean, details_string).
    """
    bucket_name = _get_bucket_name_from_url(bucket_url)
    if not bucket_name:
        return (False, "Bucket url %s is not valid" % bucket_url)
    return _is_valid_bucket(key_id, key_secret, bucket_name)
626
627
def _validate_cloud_storage_info(cloud_storage_info):
    """Checks if the cloud storage information is valid.

    When the existing boto file is used, nothing is checked and the
    information is reported as valid. Otherwise the supplied key is checked
    first, then the image and result storage bucket urls; checking stops at
    the first failure.

    @param: cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: A tuple as (valid_boolean, details_string).
    """
    valid = True
    details = None
    if not cloud_storage_info[_USE_EXISTING_BOTO_FILE]:
        key_id = cloud_storage_info[_GS_ACCESS_KEY_ID]
        key_secret = cloud_storage_info[_GS_SECRETE_ACCESS_KEY]
        valid, details = _is_valid_boto_key(key_id, key_secret)

        # The bucket checks need key_id/key_secret, which are only bound in
        # this branch.
        if valid:
            valid, details = _is_valid_bucket_url(
                    key_id, key_secret,
                    cloud_storage_info[_IMAGE_STORAGE_SERVER])

        if valid:
            valid, details = _is_valid_bucket_url(
                    key_id, key_secret,
                    cloud_storage_info[_RESULT_STORAGE_SERVER])
    return (valid, details)
650
651
def _create_operation_status_response(is_ok, details):
    """Helper method to create an operation status response.

    @param: is_ok: Boolean for if the operation is ok.
    @param: details: A detailed string; left out of the response when empty.

    @return: A serialized JSON RPC object.
    """
    status_response = {'status_ok': is_ok}
    if details:
        status_response['status_details'] = details
    return rpc_utils.prepare_for_serialization(status_response)
664
665
@moblab_only
def validate_cloud_storage_info(cloud_storage_info):
    """RPC handler to check if the cloud storage info is valid.

    @param cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: An operation status response with the validation result.
    """
    valid, details = _validate_cloud_storage_info(cloud_storage_info)
    return _create_operation_status_response(valid, details)
672
673
@moblab_only
def submit_wizard_config_info(cloud_storage_info):
    """RPC handler to submit the cloud storage info.

    The info is validated first; on failure the failing status is returned
    and nothing is written. Otherwise the image and result storage servers
    are stored in the 'CROS' config section, the boto credentials file is
    rewritten unless the existing boto file should be kept, and the global
    config is re-parsed.

    @param cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: A serialized operation status response.
    """
    is_valid, message = _validate_cloud_storage_info(cloud_storage_info)
    if not is_valid:
        return _create_operation_status_response(is_valid, message)

    storage_settings = [
            (key, cloud_storage_info[key])
            for key in (_IMAGE_STORAGE_SERVER, _RESULT_STORAGE_SERVER)]
    _update_partial_config({'CROS': storage_settings})

    if not cloud_storage_info[_USE_EXISTING_BOTO_FILE]:
        credentials = ConfigParser.RawConfigParser()
        credentials.add_section('Credentials')
        for option in (_GS_ACCESS_KEY_ID, _GS_SECRETE_ACCESS_KEY):
            credentials.set('Credentials', option, cloud_storage_info[option])
        # NOTE(review): the meaning of the trailing True is defined by
        # _write_config_file, which is not visible here -- confirm.
        _write_config_file(MOBLAB_BOTO_LOCATION, credentials, True)

    # Reload the config after the updates above.
    _CONFIG.parse_config_file()

    return _create_operation_status_response(True, None)
700
701
def get_job_history(**filter_data):
    """Get history of the job, including the special tasks executed for it.

    @param filter_data: filter for the call, should at least include
                        {'job_id': [job id]}
    @returns: JSON string of the job's history, including the information such
              as the hosts run the job and the special tasks executed before
              and after the job.
    @raises KeyError: If filter_data has no 'job_id' entry.
    """
    history = job_history.get_job_info(filter_data['job_id']).get_history()
    return rpc_utils.prepare_for_serialization(history)
714
715
def get_host_history(start_time, end_time, hosts=None, board=None, pool=None):
    """Get history of a list of hosts.

    The return is a JSON string of host history for each host, for example,
    {'172.22.33.51': [{'status': 'Resetting'
                       'start_time': '2014-08-07 10:02:16',
                       'end_time': '2014-08-07 10:03:16',
                       'log_url': 'http://autotest/reset-546546/debug',
                       'dbg_str': 'Task: Special Task 19441991 (host ...)'},
                      {'status': 'Running'
                       'start_time': '2014-08-07 10:03:18',
                       'end_time': '2014-08-07 10:13:00',
                       'log_url': 'http://autotest/reset-546546/debug',
                       'dbg_str': 'HQE: 15305005, for job: 14995562'}
                     ]
    }

    The lookup is delegated to host_history.get_history_details with a
    process pool size of 4.

    @param start_time: start time to search for history, can be string value or
                       epoch time.
    @param end_time: end time to search for history, can be string value or
                     epoch time.
    @param hosts: A list of hosts to search for history. Default is None.
    @param board: board type of hosts. Default is None.
    @param pool: pool type of hosts. Default is None.
    @returns: JSON string of the host history.
    """
    history = host_history.get_history_details(
            start_time=start_time, end_time=end_time,
            hosts=hosts, board=board, pool=pool,
            process_pool_size=4)
    return rpc_utils.prepare_for_serialization(history)
Jakob Juelich59cfe542014-09-02 16:37:46 -0700746
747
def shard_heartbeat(shard_hostname, jobs=(), hqes=(), known_job_ids=(),
                    known_host_ids=(), known_host_statuses=()):
    """Receive updates for job statuses from shards and assign hosts and jobs.

    The records uploaded by the shard are persisted, the status of every host
    the shard reports is synced into the local Host rows, and the records the
    shard does not know yet are looked up and returned. The whole exchange is
    timed under the 'shard_heartbeat' stat.

    @param shard_hostname: Hostname of the calling shard
    @param jobs: Jobs in serialized form that should be updated with newer
                 status from a shard.
    @param hqes: Hostqueueentries in serialized form that should be updated with
                 newer status from a shard. Note that for every hostqueueentry
                 the corresponding job must be in jobs.
    @param known_job_ids: List of ids of jobs the shard already has.
    @param known_host_ids: List of ids of hosts the shard already has.
    @param known_host_statuses: List of statuses of hosts the shard already has.
                                Must have the same length as known_host_ids;
                                entries are matched by position.

    @returns: Serialized representations of hosts, jobs, suite job keyvals
              and their dependencies to be inserted into a shard's database.
    """
    # The following alternatives to sending host and job ids in every heartbeat
    # have been considered:
    # 1. Sending the highest known job and host ids. This would work for jobs:
    #    Newer jobs always have larger ids. Also, if a job is not assigned to a
    #    particular shard during a heartbeat, it never will be assigned to this
    #    shard later.
    #    This is not true for hosts though: A host that is leased won't be sent
    #    to the shard now, but might be sent in a future heartbeat. This means
    #    sometimes hosts should be transferred that have a lower id than the
    #    maximum host id the shard knows.
    # 2. Send the number of jobs/hosts the shard knows to the master in each
    #    heartbeat. Compare these to the number of records that already have
    #    the shard_id set to this shard. In the normal case, they should match.
    #    In case they don't, resend all entities of that type.
    #    This would work well for hosts, because there aren't that many.
    #    Resending all jobs is quite a big overhead though.
    #    Also, this approach might run into edge cases when entities are
    #    ever deleted.
    # 3. Mixtures of the above: Use 1 for jobs and 2 for hosts.
    #    Using two different approaches isn't consistent and might cause
    #    confusion. Also the issues with the case of deletions might still
    #    occur.
    #
    # The overhead of sending all job and host ids in every heartbeat is low:
    # At peaks one board has about 1200 created but unfinished jobs.
    # See the numbers here: http://goo.gl/gQCGWH
    # Assuming that job id's have 6 digits and that json serialization takes a
    # comma and a space as overhead, the traffic per id sent is about 8 bytes.
    # If 5000 ids need to be sent, this means 40 kilobytes of traffic.
    # A NOT IN query with 5000 ids took about 30ms in tests made.
    # These numbers seem low enough to outweigh the disadvantages of the
    # solutions described above.
    with autotest_stats.Timer('shard_heartbeat'):
        shard_obj = rpc_utils.retrieve_shard(shard_hostname=shard_hostname)
        rpc_utils.persist_records_sent_from_shard(shard_obj, jobs, hqes)

        # Host ids and statuses are parallel sequences.
        assert len(known_host_ids) == len(known_host_statuses)
        for host_id, reported_status in zip(known_host_ids,
                                            known_host_statuses):
            host = models.Host.objects.get(pk=host_id)
            if host.status == reported_status:
                continue
            # Only write to the database when the status actually changed.
            host.status = reported_status
            host.save()

        new_hosts, new_jobs, new_keyvals = rpc_utils.find_records_for_shard(
                shard_obj, known_job_ids=known_job_ids,
                known_host_ids=known_host_ids)
        return {
            'hosts': [host.serialize() for host in new_hosts],
            'jobs': [job.serialize() for job in new_jobs],
            'suite_keyvals': [kv.serialize() for kv in new_keyvals],
        }
Jakob Juelich82b7d1c2014-09-15 16:10:57 -0700816
817
def get_shards(**filter_data):
    """Return the shards matching the given filter.

    Each shard is serialized as a nested dictionary and extended with a
    'labels' entry listing the names of the labels attached to the shard.

    @param filter_data: Filters passed to models.Shard.query_objects.

    @returns A sequence of nested dictionaries of shard information.
    """
    shards = models.Shard.query_objects(filter_data)
    rows = rpc_utils.prepare_rows_as_nested_dicts(shards, ())
    for row, shard in zip(rows, shards):
        row['labels'] = [label.name for label in shard.labels.all()]
    return rows
829
830
def add_shard(hostname, labels):
    """Add a shard and start running jobs on it.

    @param hostname: The hostname of the shard to be added; needs to be unique.
    @param labels: Board labels separated by a comma. Jobs of one of the labels
                   will be assigned to the shard.

    @raises error.RPCException: If label provided doesn't start with `board:`
    @raises model_logic.ValidationError: If a shard with the given hostname
            already exists.
    @raises models.Label.DoesNotExist: If the label specified doesn't exist.

    @returns: The id of the newly created shard.
    """
    label_models = []
    for label_name in labels.split(','):
        if not label_name.startswith('board:'):
            raise error.RPCException('Sharding only supports for `board:.*` '
                                     'labels.')
        # Resolve every label before the shard is created, so that no shard is
        # left behind when a label doesn't exist.
        label_models.append(models.Label.smart_get(label_name))

    shard = models.Shard.add_object(hostname=hostname)
    for label_model in label_models:
        shard.labels.add(label_model)
    return shard.id
856
857
def delete_shard(hostname):
    """Delete a shard and reclaim all resources from it.

    This claims back all assigned hosts from the shard. To ensure all DUTs are
    in a sane state, a Reboot task with highest priority is scheduled for them.
    This reboots the DUTs and then all left tasks continue to run in drone of
    the master.

    The procedure for deleting a shard:
        * Lock all unlocked hosts on that shard.
        * Remove shard information.
        * Assign a reboot task with highest priority to these hosts.
        * Unlock these hosts, then, the reboot tasks run in front of all other
        tasks.

    The status of jobs that haven't been reported to be finished yet, will be
    lost. The master scheduler will pick up the jobs and execute them.

    @param hostname: Hostname of the shard to delete.
    """
    shard = rpc_utils.retrieve_shard(shard_hostname=hostname)
    unlocked_hosts = models.Host.objects.filter(shard=shard, locked=False)
    hostnames_to_lock = [host.hostname for host in unlocked_hosts]

    # TODO(beeps): Power off shard
    # For ChromeOS hosts, a reboot test with the highest priority is added to
    # the DUT. After a reboot it should be guaranteed that no processes from
    # prior tests that were run by a shard are still running on.

    # Lock all unlocked hosts.
    lock_fields = {'locked': True, 'lock_time': datetime.datetime.now()}
    models.Host.objects.filter(
            hostname__in=hostnames_to_lock).update(**lock_fields)

    # Remove shard information.
    models.Host.objects.filter(shard=shard).update(shard=None)
    models.Job.objects.filter(shard=shard).update(shard=None)
    shard.labels.clear()
    shard.delete()

    # Assign a reboot task with highest priority: Super.
    # NOTE(review): the test lookup and control file read happen even when
    # there are no hosts to reboot -- confirm this is intended.
    reboot_test = models.Test.objects.get(name='platform_BootPerfServer:shard')
    reboot_control_file = utils.read_file(
            os.path.join(common.autotest_dir, reboot_test.path))
    if hostnames_to_lock:
        rpc_utils.create_job_common(
                'reboot_dut_for_shard_deletion',
                priority=priorities.Priority.SUPER,
                control_type='Server',
                control_file=reboot_control_file, hosts=hostnames_to_lock)

    # Unlock these shard-related hosts.
    unlock_fields = {'locked': False, 'lock_time': None}
    models.Host.objects.filter(
            hostname__in=hostnames_to_lock).update(**unlock_fields)
910
Dan Shi6964fa52014-12-18 11:04:27 -0800911
def get_servers(hostname=None, role=None, status=None):
    """Get the details of servers with matching hostname, role and status.

    @param hostname: FQDN of the server.
    @param role: Name of the server role, e.g., drone, scheduler. Default to
                 None to match any role.
    @param status: Status of the server, e.g., primary, backup, repair_required.
                   Default to None to match any server status.

    @raises error.RPCException: If server database is not used.
    @return: A list with the result of get_details() for each matching server.
    """
    if server_manager_utils.use_server_db():
        matching_servers = server_manager_utils.get_servers(
                hostname=hostname, role=role, status=status)
        return [server.get_details() for server in matching_servers]

    raise error.RPCException('Server database is not enabled. Please try '
                             'retrieve servers from global config.')
930
931
@rpc_utils.route_rpc_to_master
def get_stable_version(board=stable_version_utils.DEFAULT, android=False):
    """Get stable version for the given board.

    The lookup is delegated to stable_version_utils.get.

    @param board: Name of the board.
    @param android: If True, the given board is an Android-based device. If
                    False, assume it's a Chrome OS-based device.

    @return: Stable version of the given board. Return global configure value
             of CROS.stable_cros_version if stable_versions table does not have
             entry of board DEFAULT.
    """
    stable_version = stable_version_utils.get(board=board, android=android)
    return stable_version
Dan Shi25e1fd42014-12-19 14:36:42 -0800945
946
@rpc_utils.route_rpc_to_master
def get_all_stable_versions():
    """Get stable versions for all boards.

    The lookup is delegated to stable_version_utils.get_all.

    @return: A dictionary of board:version.
    """
    versions_by_board = stable_version_utils.get_all()
    return versions_by_board
954
955
@rpc_utils.route_rpc_to_master
def set_stable_version(version, board=stable_version_utils.DEFAULT):
    """Set the stable version for the given board.

    The update is delegated to stable_version_utils.set; nothing is returned.

    @param version: The new value of stable version for given board.
    @param board: Name of the board, default to value `DEFAULT`.
    """
    stable_version_utils.set(board=board, version=version)
964
965
@rpc_utils.route_rpc_to_master
def delete_stable_version(board):
    """Delete the stable version entry for the given board.

    Delete a stable version entry in afe_stable_versions table for a given
    board, so default stable version will be used. The deletion is delegated
    to stable_version_utils.delete; nothing is returned.

    @param board: Name of the board.
    """
    stable_version_utils.delete(board=board)
Matthew Sartorid96fb9b2015-05-19 18:04:58 -0700976
977
def get_tests_by_build(build):
    """Get the tests that are available for the specified build.

    The build is resolved to a devserver, its 'test_suites' artifacts are
    staged, and every control file of the build is parsed into a dictionary
    using the key names the AFE expects.

    @param build: unique name by which to refer to the image.

    @raises ValueError: If the build cannot be resolved on a devserver.
    @raises error.StageControlFileFailure: If staging the test artifacts fails.

    @return: A sorted list of all tests that are in the build specified.
    """
    # Attributes of the parsed control object that are required by the AFE.
    afe_keys = ['author', 'doc', 'name', 'time', 'test_type', 'experimental',
                'test_category', 'test_class', 'dependencies', 'run_verify',
                'sync_count', 'job_retries', 'retries', 'path']

    # Stage the test artifacts.
    try:
        ds = dev_server.ImageServer.resolve(build)
        build = ds.translate(build)
    except dev_server.DevServerException as e:
        raise ValueError('Could not resolve build %s: %s' % (build, e))

    try:
        ds.stage_artifacts(image=build, artifacts=['test_suites'])
    except dev_server.DevServerException as e:
        raise error.StageControlFileFailure(
                'Failed to stage %s: %s' % (build, e))

    # Collect the control files specified in this build.
    cfile_getter = control_file_getter.DevServerGetter.create(build, ds)

    test_objects = []
    for index, path in enumerate(cfile_getter.get_control_file_list()):
        # Read and parse the control file.
        contents = cfile_getter.get_control_file_contents(path)
        control_obj = control_data.parse_control_string(contents)

        # Attributes missing from the control object become empty strings.
        test_object = {}
        for key in afe_keys:
            if hasattr(control_obj, key):
                test_object[key] = getattr(control_obj, key)
            else:
                test_object[key] = ''

        # Unfortunately, the AFE expects different key-names for certain
        # values, these must be corrected to avoid the risk of tests
        # being omitted by the AFE.
        # The 'id' is an additional value used in the AFE.
        # The control_data parsing does not reference 'run_reset', but it
        # is also used in the AFE and defaults to True.
        test_object['id'] = index
        test_object['run_reset'] = True
        test_object['description'] = test_object['doc']
        test_object['test_time'] = test_object['time']
        test_object['test_retry'] = test_object['retries']

        # Fix the test name to be consistent with the current presentation
        # of test names in the AFE: the name of the directory holding the
        # control file, followed by the dot-separated parts of the file name
        # after the first one, joined with ':'.
        test_dir, control_name = os.path.split(path)
        display_name = os.path.basename(test_dir)
        name_suffix = control_name.split('.')[1:]
        if name_suffix:
            display_name = '%s:%s' % (display_name, ':'.join(name_suffix))
        test_object['name'] = display_name

        # Correct the test path as parse_control_string sets an empty string.
        test_object['path'] = path

        test_objects.append(test_object)

    test_objects.sort(key=lambda test: test['name'])
    return rpc_utils.prepare_for_serialization(test_objects)
Matthew Sartorid96fb9b2015-05-19 18:04:58 -07001051 return rpc_utils.prepare_for_serialization(test_objects)