blob: 60773263e0e80522801ea089772f1c38eabd794c [file] [log] [blame]
Dan Shi4df39252013-03-19 13:19:45 -07001# pylint: disable-msg=C0111
2
Chris Masone859fdec2012-01-30 08:38:09 -08003# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
4# Use of this source code is governed by a BSD-style license that can be
5# found in the LICENSE file.
6
7__author__ = 'cmasone@chromium.org (Chris Masone)'
8
Michael Tang9afc74b2016-03-21 10:19:23 -07009# The boto module is only available/used in Moblab for validation of cloud
10# storage access. The module is not available in the test lab environment,
11# and the import error is handled.
12try:
13 import boto
14except ImportError:
15 boto = None
Chris Masone859fdec2012-01-30 08:38:09 -080016import common
Simran Basi773a86e2015-05-13 19:15:42 -070017import ConfigParser
Chris Masonea8066a92012-05-01 16:52:31 -070018import datetime
Chris Masone859fdec2012-01-30 08:38:09 -080019import logging
Simran Basi71206ef2014-08-13 13:51:18 -070020import os
Michael Tang9afc74b2016-03-21 10:19:23 -070021import re
Simran Basi71206ef2014-08-13 13:51:18 -070022import shutil
Michael Tang9afc74b2016-03-21 10:19:23 -070023import socket
Aviv Keshetd83ef442013-01-16 16:19:35 -080024
Jakob Juelich82b7d1c2014-09-15 16:10:57 -070025from autotest_lib.frontend.afe import models
Matthew Sartorid96fb9b2015-05-19 18:04:58 -070026from autotest_lib.client.common_lib import control_data
Aviv Keshetd83ef442013-01-16 16:19:35 -080027from autotest_lib.client.common_lib import error
Simran Basi71206ef2014-08-13 13:51:18 -070028from autotest_lib.client.common_lib import global_config
Alex Miller7d658cf2013-09-04 16:00:35 -070029from autotest_lib.client.common_lib import priorities
Dan Shidfea3682014-08-10 23:38:40 -070030from autotest_lib.client.common_lib import time_utils
Chris Masone859fdec2012-01-30 08:38:09 -080031from autotest_lib.client.common_lib.cros import dev_server
Gabe Black1e1c41b2015-02-04 23:55:15 -080032from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Jakob Juelich9fffe4f2014-08-14 18:07:05 -070033from autotest_lib.frontend.afe import rpc_utils
Simran Basib6ec8ae2014-04-23 12:05:08 -070034from autotest_lib.server import utils
Dan Shi36cfd832014-10-10 13:38:51 -070035from autotest_lib.server.cros import provision
Chris Masone44e4d6c2012-08-15 14:25:53 -070036from autotest_lib.server.cros.dynamic_suite import constants
Chris Masoneb4935552012-08-14 12:05:54 -070037from autotest_lib.server.cros.dynamic_suite import control_file_getter
Chris Masone44e4d6c2012-08-15 14:25:53 -070038from autotest_lib.server.cros.dynamic_suite import tools
xixuan0f7755d2016-04-18 14:49:12 -070039from autotest_lib.server.cros.dynamic_suite import suite as SuiteBase
Dan Shi36cfd832014-10-10 13:38:51 -070040from autotest_lib.server.cros.dynamic_suite.suite import Suite
Simran Basi71206ef2014-08-13 13:51:18 -070041from autotest_lib.server.hosts import moblab_host
Dan Shidfea3682014-08-10 23:38:40 -070042from autotest_lib.site_utils import host_history
Dan Shi193905e2014-07-25 23:33:09 -070043from autotest_lib.site_utils import job_history
Dan Shid7bb4f12015-01-06 10:53:50 -080044from autotest_lib.site_utils import server_manager_utils
Dan Shi6964fa52014-12-18 11:04:27 -080045from autotest_lib.site_utils import stable_version_utils
Simran Basi71206ef2014-08-13 13:51:18 -070046
47
# Shared configuration object; the RPCs below use it to read config values
# and to locate the shadow config file.
_CONFIG = global_config.global_config
# Path of the boto file parsed by _get_boto_config().
MOBLAB_BOTO_LOCATION = '/home/moblab/.boto'

# Google Cloud Storage bucket url regex pattern. The pattern is used to extract
# the bucket name from the bucket URL. For example, "gs://image_bucket/google"
# should result in a bucket name "image_bucket".
# NOTE(review): the pattern only accepts bucket names that start with an ASCII
# letter and consist of letters, digits, '-' and '_' -- confirm this is the
# intended set of bucket names.
GOOGLE_STORAGE_BUCKET_URL_PATTERN = re.compile(
        r'gs://(?P<bucket>[a-zA-Z][a-zA-Z0-9-_]*)/?.*')

# Constants used in JSON RPC field names. The two key constants are also used
# as option names in the 'Credentials' section of the boto file.
_USE_EXISTING_BOTO_FILE = 'use_existing_boto_file'
_GS_ACCESS_KEY_ID = 'gs_access_key_id'
# NOTE: the identifier is spelled "SECRETE"; the field name itself is
# 'gs_secret_access_key'.
_GS_SECRETE_ACCESS_KEY = 'gs_secret_access_key'
_IMAGE_STORAGE_SERVER = 'image_storage_server'
_RESULT_STORAGE_SERVER = 'results_storage_server'
Chris Masonef8b53062012-05-08 22:14:18 -070063# Relevant CrosDynamicSuiteExceptions are defined in client/common_lib/error.py.
Chris Masone859fdec2012-01-30 08:38:09 -080064
65
def canonicalize_suite_name(suite_name):
    """Map a short suite name to the path of its suite control file.

    @param suite_name: short name of the suite, e.g. 'bvt'.

    @return: a string of the form 'test_suites/control.<suite_name>'.
    """
    # Do not change this naming convention without updating
    # site_utils.parse_job_name.
    control_file_path = 'test_suites/control.%s' % suite_name
    return control_file_path
70
71
def formatted_now():
    """Return the current local time formatted with time_utils.TIME_FMT.

    @return: the formatted timestamp string.
    """
    current_time = datetime.datetime.now()
    return current_time.strftime(time_utils.TIME_FMT)
Chris Masoneaa10f8e2012-05-15 13:34:21 -070074
75
def _get_control_file_contents_by_name(build, ds, suite_name):
    """Return control file contents for |suite_name|.

    Query the dev server at |ds| for the control file |suite_name| included
    in |build|.

    @param build: unique name by which to refer to the image from now on.
    @param ds: a dev_server.DevServer instance to fetch control file with.
    @param suite_name: canonicalized suite name, e.g. test_suites/control.bvt.
    @raises ControlFileNotFound if a unique suite control file doesn't exist.
    @raises NoControlFileList if we can't list the control files at all.
    @raises ControlFileEmpty if the control file exists on the server, but
                             can't be read.
    @raises ControlFileMalformed if the control file contains non-ascii
                                 characters.

    @return the contents of the desired control file.
    """
    getter = control_file_getter.DevServerGetter.create(build, ds)
    server_name = ds.get_server_name(ds.url()).replace('.', '_')
    timer = autotest_stats.Timer('control_files.parse.%s.%s' %
                                 (server_name, suite_name.rsplit('.')[-1]))
    # Get the control file for the suite.
    try:
        with timer:
            control_file_in = getter.get_control_file_contents_by_name(
                    suite_name)
    except error.CrosDynamicSuiteException as e:
        # Re-raise the same exception type with the build added for context.
        raise type(e)("%s while testing %s." % (e, build))
    if not control_file_in:
        raise error.ControlFileEmpty(
                "Fetching %s returned no data." % suite_name)
    # Force control files to only contain ascii characters.
    try:
        control_file_in.encode('ascii')
    except UnicodeError as e:
        # UnicodeError covers both failure modes: a byte string raises
        # UnicodeDecodeError (implicit decode before encoding), a unicode
        # string raises UnicodeEncodeError.
        raise error.ControlFileMalformed(str(e))

    return control_file_in
114
115
def _stage_build_artifacts(build, hostname=None):
    """
    Stage the test_suites artifact of |build| on a dev server.

    @param build: image we want to stage.
    @param hostname: hostname of a dut that may run the test; it is handed to
                     dev_server.resolve to help locate a devserver closer to
                     the duts. Default is None.

    @raises StageControlFileFailure: if staging raises a
                                     dev_server.DevServerException.

    @return: a (ds, timings) tuple: the dev server returned by
             dev_server.resolve for this build, and a dictionary holding the
             staging start/end times.
    """
    image_server = dev_server.resolve(build, hostname=hostname)
    timings = {constants.DOWNLOAD_STARTED_TIME: formatted_now()}
    server_tag = image_server.get_server_name(image_server.url())
    stage_timer = autotest_stats.Timer(
            'control_files.stage.%s' % server_tag.replace('.', '_'))
    try:
        with stage_timer:
            image_server.stage_artifacts(image=build,
                                         artifacts=['test_suites'])
    except dev_server.DevServerException as e:
        raise error.StageControlFileFailure(
                "Failed to stage %s: %s" % (build, e))
    timings[constants.PAYLOAD_FINISHED_TIME] = formatted_now()
    return (image_server, timings)
146
147
@rpc_utils.route_rpc_to_master
def create_suite_job(name='', board='', pool='', control_file='',
                     check_hosts=True, num=None, file_bugs=False, timeout=24,
                     timeout_mins=None, priority=priorities.Priority.DEFAULT,
                     suite_args=None, wait_for_results=True, job_retry=False,
                     max_retries=None, max_runtime_mins=None, suite_min_duts=0,
                     offload_failures_only=False, builds=None,
                     test_source_build=None, run_prod_code=False,
                     delay_minutes=0, is_cloning=False, **kwargs):
    """
    Create a job to run a test suite on the given device with the given image.

    When the timeout specified in the control file is reached, the
    job is guaranteed to have completed and results will be available.

    @param name: The test name if control_file is supplied, otherwise the name
                 of the test suite to run, e.g. 'bvt'.
    @param board: the kind of device to run the tests on. If empty, it is
                  parsed from the CrOS build in |builds|.
    @param builds: the builds to install e.g.
                   {'cros-version:': 'x86-alex-release/R18-1655.0.0',
                    'fwrw-version:': 'x86-alex-firmware/R36-5771.50.0',
                    'fwro-version:': 'x86-alex-firmware/R36-5771.49.0'}
                   None (the default) is treated as an empty dictionary.
    @param test_source_build: Build that contains the server-side test code.
    @param pool: Specify the pool of machines to use for scheduling
            purposes.
    @param control_file: the control file of the job. If empty, the suite
                         control file is looked up by name.
    @param check_hosts: require appropriate live hosts to exist in the lab.
    @param num: Specify the number of machines to schedule across (integer).
                Leave unspecified or use None to use default sharding factor.
    @param file_bugs: File a bug on each test failure in this suite.
    @param timeout: The max lifetime of this suite, in hours.
    @param timeout_mins: The max lifetime of this suite, in minutes. Takes
                         priority over timeout.
    @param priority: Integer denoting priority. Higher is more important.
    @param suite_args: Optional arguments which will be parsed by the suite
                       control file. Used by control.test_that_wrapper to
                       determine which tests to run.
    @param wait_for_results: Set to False to run the suite job without waiting
                             for test jobs to finish. Default is True.
    @param job_retry: Set to True to enable job-level retry. Default is False.
    @param max_retries: Integer, maximum job retries allowed at suite level.
                        None for no max.
    @param max_runtime_mins: Maximum amount of time a job can be running in
                             minutes.
    @param suite_min_duts: Integer. Scheduler will prioritize getting the
                           minimum number of machines for the suite when it is
                           competing with another suite that has a higher
                           priority but already got minimum machines it needs.
    @param offload_failures_only: Only enable gs_offloading for failed jobs.
    @param run_prod_code: If True, the suite will run the test code that
                          lives in prod aka the test code currently on the
                          lab servers. If False, the control files and test
                          code for this suite run will be retrieved from the
                          build artifacts.
    @param delay_minutes: Delay the creation of test jobs for a given number of
                          minutes.
    @param is_cloning: True if creating a cloning job.
    @param kwargs: extra keyword args. NOT USED.

    @raises SuiteArgumentException: if num is neither an int nor None.
    @raises ControlFileNotFound: if a unique suite control file doesn't exist.
    @raises NoControlFileList: if we can't list the control files at all.
    @raises StageControlFileFailure: If the dev server throws 500 while
                                     staging test_suites.
    @raises ControlFileEmpty: if the control file exists on the server, but
                              can't be read.

    @return: the result of rpc_utils.create_job_common for the suite job (the
             job ID of the suite).
    """
    # A fresh dictionary per call; a mutable default would be shared by every
    # invocation of this RPC.
    if builds is None:
        builds = {}

    # Exact type check on purpose: only plain ints and None are accepted.
    if type(num) is not int and num is not None:
        raise error.SuiteArgumentException('Ill specified num argument %r. '
                                           'Must be an integer or None.' % num)
    if num == 0:
        logging.warning("Can't run on 0 hosts; using default.")
        num = None

    # Default test source build to CrOS build if it's not specified and
    # run_prod_code is set to False.
    if not run_prod_code:
        test_source_build = Suite.get_test_source_build(
                builds, test_source_build=test_source_build)

    # If 'prefer_local_devserver' is True in global setting, and both board
    # and pool are specified, pick a dut in the given board and pool, and
    # use that to help to pick a devserver in the same subnet of the duts
    # to be used to run tests.
    if dev_server.PREFER_LOCAL_DEVSERVER and pool and board:
        sample_dut = rpc_utils.get_sample_dut(board, pool)
    else:
        sample_dut = None

    suite_name = canonicalize_suite_name(name)
    if run_prod_code:
        ds = dev_server.resolve(test_source_build, hostname=sample_dut)
        keyvals = {}
        # Read the suite control file from the local installation instead of
        # the build artifacts.
        getter = control_file_getter.FileSystemGetter(
                [_CONFIG.get_config_value('SCHEDULER',
                                          'drone_installation_directory')])
        control_file = getter.get_control_file_contents_by_name(suite_name)
    else:
        (ds, keyvals) = _stage_build_artifacts(
                test_source_build, hostname=sample_dut)
    keyvals[constants.SUITE_MIN_DUTS_KEY] = suite_min_duts

    if not control_file:
        # No control file was supplied so look it up from the build artifacts.
        control_file = _get_control_file_contents_by_name(test_source_build,
                                                          ds, suite_name)
    # Do not change this naming convention without updating
    # site_utils.parse_job_name.
    if not run_prod_code:
        name = '%s-%s' % (test_source_build, suite_name)
    else:
        # If run_prod_code is True, test_source_build is not set, use the
        # first build in the builds list for the suite job name.
        name = '%s-%s' % (list(builds.values())[0], suite_name)

    timeout_mins = timeout_mins or timeout * 60
    max_runtime_mins = max_runtime_mins or timeout * 60

    if not board:
        board = utils.ParseBuildName(builds[provision.CROS_VERSION_PREFIX])[0]

    # Prepend builds and board to the control file.
    inject_dict = {'board': board,
                   # `build` is needed for suites like AU to stage image inside
                   # suite control file.
                   'build': test_source_build,
                   'builds': builds,
                   'check_hosts': check_hosts,
                   'pool': pool,
                   'num': num,
                   'file_bugs': file_bugs,
                   'timeout': timeout,
                   'timeout_mins': timeout_mins,
                   'devserver_url': ds.url(),
                   'priority': priority,
                   'suite_args' : suite_args,
                   'wait_for_results': wait_for_results,
                   'job_retry': job_retry,
                   'max_retries': max_retries,
                   'max_runtime_mins': max_runtime_mins,
                   'offload_failures_only': offload_failures_only,
                   'test_source_build': test_source_build,
                   'run_prod_code': run_prod_code,
                   'delay_minutes': delay_minutes,
                   }

    if is_cloning:
        # Strip the previous injection before injecting the new variables.
        control_file = tools.remove_injection(control_file)
    control_file = tools.inject_vars(inject_dict, control_file)

    return rpc_utils.create_job_common(name,
                                       priority=priority,
                                       timeout_mins=timeout_mins,
                                       max_runtime_mins=max_runtime_mins,
                                       control_type='Server',
                                       control_file=control_file,
                                       hostless=True,
                                       keyvals=keyvals)
Simran Basi71206ef2014-08-13 13:51:18 -0700308
309
310# TODO: hide the following rpcs under is_moblab
def moblab_only(func):
    """Ensure moblab specific functions only run on Moblab devices.

    @param func: the function to guard.

    @return: a wrapper with the name and docstring of |func| that raises
             error.RPCException when utils.is_moblab() is false and calls
             |func| otherwise.
    """
    # Local import: only this decorator needs functools.
    import functools

    @functools.wraps(func)
    def verify(*args, **kwargs):
        if not utils.is_moblab():
            raise error.RPCException(
                    'RPC: %s can only run on Moblab Systems!' % func.__name__)
        return func(*args, **kwargs)
    return verify
319
320
@moblab_only
def get_config_values():
    """Return every config value parsed from the global and shadow configs.

    The values are grouped by section; each section maps to its list of
    (name, value) pairs.

    @return: the section dictionary, prepared for serialization.
    """
    config_values = dict(
            (section, _CONFIG.config.items(section))
            for section in _CONFIG.get_sections())
    return rpc_utils.prepare_for_serialization(config_values)
Simran Basi71206ef2014-08-13 13:51:18 -0700333
334
def _write_config_file(config_file, config_values, overwrite=False):
    """Write a configuration object out to a file.

    @param config_file: The name of the configuration file.
    @param config_values: The ConfigParser object. Nothing is written when it
                          is falsy.
    @param overwrite: Flag on if overwriting an existing file is allowed.

    @raises RPCException: if the file name is empty, or if the file already
                          exists and overwriting is not allowed.
    """
    if not config_file:
        raise error.RPCException('Empty config file name.')
    if not overwrite:
        if os.path.exists(config_file):
            raise error.RPCException('Config file already exists.')

    if not config_values:
        return
    with open(config_file, 'w') as output:
        config_values.write(output)
350
351
def _read_original_config():
    """Read the original configuration, without the shadow config.

    @return: A configuration object, see global_config_class.
    """
    config_without_shadow = global_config.global_config_class()
    # An empty shadow file name leaves only the original config in effect.
    config_without_shadow.set_config_files(shadow_file='')
    return config_without_shadow
360
361
def _read_raw_config(config_file):
    """Parse a configuration file into a raw parser object.

    @param config_file: The path of the configuration file.

    @return: A ConfigParser.RawConfigParser object holding the file content.
    """
    parser = ConfigParser.RawConfigParser()
    parser.read(config_file)
    return parser
372
373
def _get_shadow_config_from_partial_update(config_values):
    """Work out the new shadow configuration for a partial update.

    The input only covers part of the config, so entries already present in
    the shadow config file are kept. For each supplied entry, a value that
    differs from the original config becomes an override, while a value equal
    to the original removes any existing override.

    @param config_values: See get_moblab_settings().

    @return: The new shadow configuration as ConfigParser object.
    """
    baseline = _read_original_config()
    shadow = _read_raw_config(_CONFIG.shadow_file)
    for section, pairs in config_values.items():
        for key, value in pairs:
            baseline_value = baseline.get_config_value(
                    section, key, default='', allow_blank=True)
            if baseline_value == value:
                # Back to the original value: drop the override, if any.
                if shadow.has_option(section, key):
                    shadow.remove_option(section, key)
                continue
            if not shadow.has_section(section):
                shadow.add_section(section)
            shadow.set(section, key, value)
    return shadow
399
400
def _update_partial_config(config_values):
    """Apply a partial config update to the shadow configuration file.

    @param config_values: See get_moblab_settings().
    """
    merged_shadow = _get_shadow_config_from_partial_update(config_values)
    _write_config_file(_CONFIG.shadow_file, merged_shadow, overwrite=True)
408
409
@moblab_only
def update_config_handler(config_values):
    """Replace the shadow config with the given values and reboot.

    Only values that differ from the original (non-shadow) config are written
    to the shadow config file.

    @param config_values: See get_moblab_settings().

    @raises RPCException: if the shadow config file does not exist.
    """
    baseline = _read_original_config()
    shadow = ConfigParser.RawConfigParser()
    for section, pairs in config_values.items():
        for key, value in pairs:
            baseline_value = baseline.get_config_value(
                    section, key, default='', allow_blank=True)
            if baseline_value == value:
                continue
            if not shadow.has_section(section):
                shadow.add_section(section)
            shadow.set(section, key, value)

    if not (_CONFIG.shadow_file and os.path.exists(_CONFIG.shadow_file)):
        raise error.RPCException('Shadow config file does not exist.')
    _write_config_file(_CONFIG.shadow_file, shadow, True)

    # TODO (sbasi) crbug.com/403916 - Remove the reboot command and
    # instead restart the services that rely on the config values.
    os.system('sudo reboot')
434
435
@moblab_only
def reset_config_settings():
    """Empty the shadow config file and reboot the device."""
    # Opening the file for writing truncates it; nothing is written.
    open(_CONFIG.shadow_file, 'w').close()
    os.system('sudo reboot')
441
442
@moblab_only
def reboot_moblab():
    """Simply reboot the device.

    Runs 'sudo reboot' through os.system; the exit status of the command is
    not checked.
    """
    os.system('sudo reboot')
447
@moblab_only
def set_boto_key(boto_key):
    """Install an uploaded file as the boto key file.

    @param boto_key: File name of boto_key uploaded through handle_file_upload.

    @raises RPCException: if |boto_key| does not exist.
    """
    key_is_present = os.path.exists(boto_key)
    if not key_is_present:
        raise error.RPCException('Boto key: %s does not exist!' % boto_key)
    destination = moblab_host.MOBLAB_BOTO_LOCATION
    shutil.copyfile(boto_key, destination)
Dan Shi193905e2014-07-25 23:33:09 -0700457
458
@moblab_only
def set_launch_control_key(launch_control_key):
    """Install an uploaded file as the launch control key file.

    The devserver service is restarted after the key is copied.

    @param launch_control_key: File name of launch_control_key uploaded through
            handle_file_upload.

    @raises RPCException: if |launch_control_key| does not exist.
    """
    if not os.path.exists(launch_control_key):
        message = ('Launch Control key: %s does not exist!' %
                   launch_control_key)
        raise error.RPCException(message)
    destination = moblab_host.MOBLAB_LAUNCH_CONTROL_KEY_LOCATION
    shutil.copyfile(launch_control_key, destination)
    # Restart the devserver service.
    os.system('sudo restart moblab-devserver-init')
473
474
Michael Tang9afc74b2016-03-21 10:19:23 -0700475###########Moblab Config Wizard RPCs #######################
def _get_public_ip_address(socket_handle):
    """Gets the public IP address.

    Connects |socket_handle| to the Google DNS server (8.8.8.8, port 53) with
    a one second timeout and reads the local address the socket ended up
    using. The socket is not closed here; that is left to the caller.

    @param socket_handle: a socket object that is not connected yet.

    @return: the ip address as a string, or None if the connection failed or
             no socket name is available.
    """
    try:
        socket_handle.settimeout(1)
        socket_handle.connect(('8.8.8.8', 53))
        socket_name = socket_handle.getsockname()
        if socket_name is not None:
            logging.info('Got socket name from UDP socket.')
            return socket_name[0]
        logging.warning('Created UDP socket but with no socket_name.')
    except socket.error:
        logging.warning('Could not get socket name from UDP socket.')
    return None
497
498
def _get_network_info():
    """Gets the network information.

    A TCP socket is used to test the connectivity. If there is no
    connectivity, try to get the public IP with a UDP socket. Both sockets are
    closed before returning.

    @return: a tuple as (public_ip_address, connected_to_internet).
    """
    tcp_socket = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
    try:
        ip = _get_public_ip_address(tcp_socket)
    finally:
        # Always release the descriptor; this runs inside a long-lived server.
        tcp_socket.close()
    if ip is not None:
        logging.info('Established TCP connection with well known server.')
        return (ip, True)

    udp_socket = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)
    try:
        return (_get_public_ip_address(udp_socket), False)
    finally:
        udp_socket.close()
514
515
@moblab_only
def get_network_info():
    """Return the server ip addresses and the server connectivity.

    The result holds 'server_ips', a list of ip address strings that is only
    present when an address was found, and 'is_connected', the connectivity
    flag.

    @return: the network information, prepared for serialization.
    """
    ip_address, is_connected = _get_network_info()
    network_info = {}
    if ip_address is not None:
        network_info['server_ips'] = [ip_address]
    network_info['is_connected'] = is_connected

    return rpc_utils.prepare_for_serialization(network_info)
530
531
def _get_boto_config():
    """Parse the boto file at MOBLAB_BOTO_LOCATION.

    @return: Boto configuration as ConfigParser object.
    """
    parser = ConfigParser.ConfigParser()
    parser.read(MOBLAB_BOTO_LOCATION)
    return parser
541
542
@moblab_only
def get_cloud_storage_info():
    """RPC handler to get the cloud storage access information.

    Collects the image and result storage servers from the 'CROS' config
    section, whether the boto file has any section, and the access key id and
    secret found in the 'Credentials' section of the boto file.

    @return: the cloud storage information, prepared for serialization.
    """
    cloud_storage_info = {}
    for server_key in (_IMAGE_STORAGE_SERVER, _RESULT_STORAGE_SERVER):
        server_url = _CONFIG.get_config_value('CROS', server_key)
        if server_url is not None:
            cloud_storage_info[server_key] = server_url

    boto_config = _get_boto_config()
    sections = boto_config.sections()

    # Any section at all counts as an existing boto file.
    cloud_storage_info[_USE_EXISTING_BOTO_FILE] = bool(sections)
    if 'Credentials' in sections:
        options = boto_config.options('Credentials')
        for credential_key in (_GS_ACCESS_KEY_ID, _GS_SECRETE_ACCESS_KEY):
            if credential_key in options:
                cloud_storage_info[credential_key] = boto_config.get(
                        'Credentials', credential_key)

    return rpc_utils.prepare_for_serialization(cloud_storage_info)
572
573
def _get_bucket_name_from_url(bucket_url):
    """Extract the bucket name from a bucket url.

    @param bucket_url: the bucket url string.

    @return: the bucket name, or None if the url is empty or does not match
             GOOGLE_STORAGE_BUCKET_URL_PATTERN.
    """
    if not bucket_url:
        return None
    match = GOOGLE_STORAGE_BUCKET_URL_PATTERN.match(bucket_url)
    return match.group('bucket') if match else None
584
585
def _is_valid_boto_key(key_id, key_secret):
    """Checks if the boto key is valid.

    The key is considered valid when listing all buckets with it succeeds.

    @param key_id: The boto key id string.
    @param key_secret: The boto key string.

    @return: A tuple as (valid_boolean, details_string).
    """
    if not key_id or not key_secret:
        return (False, "Empty key id or secret.")
    if boto is None:
        # The boto import at the top of the file is optional; report its
        # absence as a status instead of failing with an AttributeError.
        return (False, "Server error: boto module is not available.")
    conn = boto.connect_gs(key_id, key_secret)
    try:
        conn.get_all_buckets()
        return (True, None)
    except boto.exception.GSResponseError:
        details = "The boto access key is not valid"
        return (False, details)
    finally:
        conn.close()
605
606
def _is_valid_bucket(key_id, key_secret, bucket_name):
    """Checks if a bucket is valid and accessible.

    @param key_id: The boto key id string.
    @param key_secret: The boto key string.
    @param bucket_name: The bucket name string.

    @return: A tuple as (valid_boolean, details_string).
    """
    if not key_id or not key_secret or not bucket_name:
        return (False, "Server error: invalid argument")
    if boto is None:
        # The boto import at the top of the file is optional; report its
        # absence as a status instead of failing with an AttributeError.
        return (False, "Server error: boto module is not available.")
    conn = boto.connect_gs(key_id, key_secret)
    try:
        bucket = conn.lookup(bucket_name)
    finally:
        # Close the connection even when the lookup raises.
        conn.close()
    if bucket:
        return (True, None)
    return (False, "Bucket %s does not exist." % bucket_name)
623 return (False, "Bucket %s does not exist." % bucket_name)
624
625
def _is_valid_bucket_url(key_id, key_secret, bucket_url):
    """Check that the bucket named by a bucket url is accessible.

    @param key_id: The boto key id string.
    @param key_secret: The boto key string.
    @param bucket_url: The bucket url string.

    @return: A tuple as (valid_boolean, details_string).
    """
    bucket_name = _get_bucket_name_from_url(bucket_url)
    if not bucket_name:
        return (False, "Bucket url %s is not valid" % bucket_url)
    return _is_valid_bucket(key_id, key_secret, bucket_name)
639
640
def _validate_cloud_storage_info(cloud_storage_info):
    """Checks if the cloud storage information is valid.

    When the existing boto file is to be used, no key is supplied and nothing
    is validated. Otherwise the boto key is checked first, then the image
    storage bucket url, then the result storage bucket url; validation stops
    at the first failure.

    @param cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: A tuple as (valid_boolean, details_string).
    """
    if cloud_storage_info[_USE_EXISTING_BOTO_FILE]:
        return (True, None)

    key_id = cloud_storage_info[_GS_ACCESS_KEY_ID]
    key_secret = cloud_storage_info[_GS_SECRETE_ACCESS_KEY]
    valid, details = _is_valid_boto_key(key_id, key_secret)

    for server_key in (_IMAGE_STORAGE_SERVER, _RESULT_STORAGE_SERVER):
        if not valid:
            break
        valid, details = _is_valid_bucket_url(
                key_id, key_secret, cloud_storage_info[server_key])
    return (valid, details)
663
664
def _create_operation_status_response(is_ok, details):
    """Helper method to create an operation status response.

    @param is_ok: Boolean for if the operation is ok.
    @param details: A detailed string; omitted from the response when falsy.

    @return: A serialized JSON RPC object.
    """
    response = dict(status_ok=is_ok)
    if details:
        response.update(status_details=details)
    return rpc_utils.prepare_for_serialization(response)
677
678
@moblab_only
def validate_cloud_storage_info(cloud_storage_info):
    """RPC handler to check if the cloud storage info is valid.

    @param cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: A serialized operation status response.
    """
    is_valid, reason = _validate_cloud_storage_info(cloud_storage_info)
    return _create_operation_status_response(is_valid, reason)
685
686
@moblab_only
def submit_wizard_config_info(cloud_storage_info):
    """RPC handler to submit the cloud storage info.

    Validates the info, stores the storage server settings in the CROS config
    section, writes the boto credentials file unless the existing one is to be
    reused, re-parses the config and then reboots the machine.

    @param cloud_storage_info: The JSON RPC object for cloud storage info.

    @return: A serialized operation status response.
    """
    is_valid, reason = _validate_cloud_storage_info(cloud_storage_info)
    if not is_valid:
        return _create_operation_status_response(is_valid, reason)

    cros_settings = [
        (_IMAGE_STORAGE_SERVER, cloud_storage_info[_IMAGE_STORAGE_SERVER]),
        (_RESULT_STORAGE_SERVER, cloud_storage_info[_RESULT_STORAGE_SERVER]),
    ]
    _update_partial_config({'CROS': cros_settings})

    if not cloud_storage_info[_USE_EXISTING_BOTO_FILE]:
        credentials = ConfigParser.RawConfigParser()
        credentials.add_section('Credentials')
        for option in (_GS_ACCESS_KEY_ID, _GS_SECRETE_ACCESS_KEY):
            credentials.set('Credentials', option, cloud_storage_info[option])
        _write_config_file(MOBLAB_BOTO_LOCATION, credentials, True)

    _CONFIG.parse_config_file()

    # TODO(ntang): replace reboot with less intrusive reloading.
    os.system('sudo reboot')

    return _create_operation_status_response(True, None)
716
717
def get_job_history(**filter_data):
    """Get history of the job, including the special tasks executed for it.

    @param filter_data: filter for the call, should at least include
                        {'job_id': [job id]}
    @returns: JSON string of the job's history, including the information such
              as the hosts run the job and the special tasks executed before
              and after the job.
    """
    info = job_history.get_job_info(filter_data['job_id'])
    history = info.get_history()
    return rpc_utils.prepare_for_serialization(history)
730
731
def get_host_history(start_time, end_time, hosts=None, board=None, pool=None):
    """Get history of a list of hosts.

    The return is a JSON string of host history for each host, for example,
    {'172.22.33.51': [{'status': 'Resetting'
                       'start_time': '2014-08-07 10:02:16',
                       'end_time': '2014-08-07 10:03:16',
                       'log_url': 'http://autotest/reset-546546/debug',
                       'dbg_str': 'Task: Special Task 19441991 (host ...)'},
                      {'status': 'Running'
                       'start_time': '2014-08-07 10:03:18',
                       'end_time': '2014-08-07 10:13:00',
                       'log_url': 'http://autotest/reset-546546/debug',
                       'dbg_str': 'HQE: 15305005, for job: 14995562'}
                     ]
    }

    @param start_time: start time to search for history, can be string value or
                       epoch time.
    @param end_time: end time to search for history, can be string value or
                     epoch time.
    @param hosts: A list of hosts to search for history. Default is None.
    @param board: board type of hosts. Default is None.
    @param pool: pool type of hosts. Default is None.
    @returns: JSON string of the host history.
    """
    # The lookup is always run with a process pool of size 4.
    details = host_history.get_history_details(
            start_time=start_time, end_time=end_time,
            hosts=hosts, board=board, pool=pool,
            process_pool_size=4)
    return rpc_utils.prepare_for_serialization(details)
Jakob Juelich59cfe542014-09-02 16:37:46 -0700762
763
def shard_heartbeat(shard_hostname, jobs=(), hqes=(), known_job_ids=(),
                    known_host_ids=(), known_host_statuses=()):
    """Receive updates for job statuses from shards and assign hosts and jobs.

    @param shard_hostname: Hostname of the calling shard
    @param jobs: Jobs in serialized form that should be updated with newer
                 status from a shard.
    @param hqes: Hostqueueentries in serialized form that should be updated with
                 newer status from a shard. Note that for every hostqueueentry
                 the corresponding job must be in jobs.
    @param known_job_ids: List of ids of jobs the shard already has.
    @param known_host_ids: List of ids of hosts the shard already has.
    @param known_host_statuses: List of statuses of hosts the shard already
                                has; must line up one-to-one with
                                known_host_ids.

    @returns: Serialized representations of hosts, jobs, suite job keyvals
              and their dependencies to be inserted into a shard's database.
    """
    # The following alternatives to sending host and job ids in every heartbeat
    # have been considered:
    # 1. Sending the highest known job and host ids. This would work for jobs:
    #    Newer jobs always have larger ids. Also, if a job is not assigned to a
    #    particular shard during a heartbeat, it never will be assigned to this
    #    shard later.
    #    This is not true for hosts though: A host that is leased won't be sent
    #    to the shard now, but might be sent in a future heartbeat. This means
    #    sometimes hosts should be transferred that have a lower id than the
    #    maximum host id the shard knows.
    # 2. Send the number of jobs/hosts the shard knows to the master in each
    #    heartbeat. Compare these to the number of records that already have
    #    the shard_id set to this shard. In the normal case, they should match.
    #    In case they don't, resend all entities of that type.
    #    This would work well for hosts, because there aren't that many.
    #    Resending all jobs is quite a big overhead though.
    #    Also, this approach might run into edge cases when entities are
    #    ever deleted.
    # 3. Mixtures of the above: Use 1 for jobs and 2 for hosts.
    #    Using two different approaches isn't consistent and might cause
    #    confusion. Also the issues with the case of deletions might still
    #    occur.
    #
    # The overhead of sending all job and host ids in every heartbeat is low:
    # At peaks one board has about 1200 created but unfinished jobs.
    # See the numbers here: http://goo.gl/gQCGWH
    # Assuming that job id's have 6 digits and that json serialization takes a
    # comma and a space as overhead, the traffic per id sent is about 8 bytes.
    # If 5000 ids need to be sent, this means 40 kilobytes of traffic.
    # A NOT IN query with 5000 ids took about 30ms in tests made.
    # These numbers seem low enough to outweigh the disadvantages of the
    # solutions described above.
    with autotest_stats.Timer('shard_heartbeat'):
        shard_obj = rpc_utils.retrieve_shard(shard_hostname=shard_hostname)
        rpc_utils.persist_records_sent_from_shard(shard_obj, jobs, hqes)

        # Bring the master's view of host statuses in line with the shard's,
        # saving only the hosts whose status actually differs.
        assert len(known_host_ids) == len(known_host_statuses)
        for host_id, shard_status in zip(known_host_ids, known_host_statuses):
            host_model = models.Host.objects.get(pk=host_id)
            if host_model.status == shard_status:
                continue
            host_model.status = shard_status
            host_model.save()

        new_hosts, new_jobs, new_keyvals = rpc_utils.find_records_for_shard(
                shard_obj, known_job_ids=known_job_ids,
                known_host_ids=known_host_ids)
        return {
            'hosts': [host.serialize() for host in new_hosts],
            'jobs': [job.serialize() for job in new_jobs],
            'suite_keyvals': [kv.serialize() for kv in new_keyvals],
        }
Jakob Juelich82b7d1c2014-09-15 16:10:57 -0700832
833
def get_shards(**filter_data):
    """Return a list of all shards matching the given filter.

    @param filter_data: Filter passed through to the Shard query.

    @returns A sequence of nested dictionaries of shard information, each
             extended with a 'labels' list of the shard's label names.
    """
    shard_models = models.Shard.query_objects(filter_data)
    shard_dicts = rpc_utils.prepare_rows_as_nested_dicts(shard_models, ())
    for shard_dict, shard_model in zip(shard_dicts, shard_models):
        label_names = []
        for label in shard_model.labels.all():
            label_names.append(label.name)
        shard_dict['labels'] = label_names

    return shard_dicts
845
846
def add_shard(hostname, labels):
    """Add a shard and start running jobs on it.

    @param hostname: The hostname of the shard to be added; needs to be unique.
    @param labels: Board labels separated by a comma. Jobs of one of the labels
                   will be assigned to the shard.

    @raises error.RPCException: If label provided doesn't start with `board:`
    @raises model_logic.ValidationError: If a shard with the given hostname
            already exists.
    @raises models.Label.DoesNotExist: If the label specified doesn't exist.

    @returns: The id of the newly created shard.
    """
    board_labels = []
    for label_name in labels.split(','):
        if label_name.startswith('board:'):
            # Resolve every label up front, so the shard isn't created when a
            # label doesn't exist.
            board_labels.append(models.Label.smart_get(label_name))
            continue
        raise error.RPCException('Sharding only supports for `board:.*` '
                                 'labels.')

    new_shard = models.Shard.add_object(hostname=hostname)
    for board_label in board_labels:
        new_shard.labels.add(board_label)
    return new_shard.id
872
873
def delete_shard(hostname):
    """Delete a shard and reclaim all resources from it.

    This claims back all assigned hosts from the shard. To ensure all DUTs are
    in a sane state, a Reboot task with highest priority is scheduled for them.
    This reboots the DUTs and then all left tasks continue to run in drone of
    the master.

    The procedure for deleting a shard:
        * Lock all unlocked hosts on that shard.
        * Remove shard information.
        * Assign a reboot task with highest priority to these hosts.
        * Unlock these hosts, then, the reboot tasks run in front of all other
          tasks.

    The status of jobs that haven't been reported to be finished yet, will be
    lost. The master scheduler will pick up the jobs and execute them.

    @param hostname: Hostname of the shard to delete.
    """
    shard = rpc_utils.retrieve_shard(shard_hostname=hostname)
    unlocked_hosts = models.Host.objects.filter(shard=shard, locked=False)
    hostnames_to_lock = [host.hostname for host in unlocked_hosts]

    # TODO(beeps): Power off shard
    # For ChromeOS hosts, a reboot test with the highest priority is added to
    # the DUT. After a reboot it should be guaranteed that no processes from
    # prior tests that were run by a shard are still running on.

    # Lock all unlocked hosts.
    lock_fields = {'locked': True, 'lock_time': datetime.datetime.now()}
    models.Host.objects.filter(
            hostname__in=hostnames_to_lock).update(**lock_fields)

    # Remove shard information.
    models.Host.objects.filter(shard=shard).update(shard=None)
    models.Job.objects.filter(shard=shard).update(shard=None)
    shard.labels.clear()
    shard.delete()

    # Assign a reboot task with highest priority: Super.
    reboot_test = models.Test.objects.get(name='platform_BootPerfServer:shard')
    control_path = os.path.join(common.autotest_dir, reboot_test.path)
    control_file = utils.read_file(control_path)
    if hostnames_to_lock:
        rpc_utils.create_job_common(
                'reboot_dut_for_shard_deletion',
                priority=priorities.Priority.SUPER,
                control_type='Server',
                control_file=control_file, hosts=hostnames_to_lock)

    # Unlock these shard-related hosts.
    unlock_fields = {'locked': False, 'lock_time': None}
    models.Host.objects.filter(
            hostname__in=hostnames_to_lock).update(**unlock_fields)
926
Dan Shi6964fa52014-12-18 11:04:27 -0800927
def get_servers(hostname=None, role=None, status=None):
    """Get a list of servers with matching hostname, role and status.

    @param hostname: FQDN of the server.
    @param role: Name of the server role, e.g., drone, scheduler. Default to
                 None to match any role.
    @param status: Status of the server, e.g., primary, backup, repair_required.
                   Default to None to match any server status.

    @raises error.RPCException: If server database is not used.
    @return: A list of the details of each server with matching role and
             status.
    """
    if server_manager_utils.use_server_db():
        matches = server_manager_utils.get_servers(
                hostname=hostname, role=role, status=status)
        return [server.get_details() for server in matches]
    raise error.RPCException('Server database is not enabled. Please try '
                             'retrieve servers from global config.')
946
947
@rpc_utils.route_rpc_to_master
def get_stable_version(board=stable_version_utils.DEFAULT, android=False):
    """Get stable version for the given board.

    @param board: Name of the board.
    @param android: If True, the given board is an Android-based device. If
                    False, assume it is a Chrome OS-based device.

    @return: Stable version of the given board. Return global configure value
             of CROS.stable_cros_version if stable_versions table does not have
             entry of board DEFAULT.
    """
    version = stable_version_utils.get(board=board, android=android)
    return version
Dan Shi25e1fd42014-12-19 14:36:42 -0800961
962
@rpc_utils.route_rpc_to_master
def get_all_stable_versions():
    """Get stable versions for all boards.

    @return: A dictionary of board:version.
    """
    versions = stable_version_utils.get_all()
    return versions
970
971
@rpc_utils.route_rpc_to_master
def set_stable_version(version, board=stable_version_utils.DEFAULT):
    """Set the stable version for the given board.

    @param version: The new value of stable version for given board.
    @param board: Name of the board, default to value `DEFAULT`.
    """
    stable_version_utils.set(board=board, version=version)
980
981
@rpc_utils.route_rpc_to_master
def delete_stable_version(board):
    """Delete the stable version entry for the given board.

    Delete a stable version entry in afe_stable_versions table for a given
    board, so default stable version will be used.

    @param board: Name of the board.
    """
    stable_version_utils.delete(board=board)
Matthew Sartorid96fb9b2015-05-19 18:04:58 -0700992
993
def get_tests_by_build(build, ignore_invalid_tests=False):
    """Get the tests that are available for the specified build.

    @param build: unique name by which to refer to the image.
    @param ignore_invalid_tests: If True, control files that fail to parse are
                                 logged and left out of the result; if False,
                                 the parse error is re-raised.

    @raises ValueError: If the build cannot be resolved.
    @raises error.StageControlFileFailure: If the test suites cannot be staged.

    @return: A sorted list of all tests that are in the build specified.
    """
    # Stage the test artifacts.
    try:
        ds = dev_server.ImageServer.resolve(build)
        build = ds.translate(build)
    except dev_server.DevServerException as e:
        raise ValueError('Could not resolve build %s: %s' % (build, e))

    try:
        ds.stage_artifacts(image=build, artifacts=['test_suites'])
    except dev_server.DevServerException as e:
        raise error.StageControlFileFailure(
                'Failed to stage %s: %s' % (build, e))

    # Collect the control files specified in this build
    cfile_getter = control_file_getter.DevServerGetter.create(build, ds)
    controls_in_batch = SuiteBase.ENABLE_CONTROLS_IN_BATCH
    if controls_in_batch:
        control_file_info_list = cfile_getter.get_suite_info()
        control_file_list = control_file_info_list.keys()
    else:
        control_file_list = cfile_getter.get_control_file_list()

    # Attributes of the parsed control object that are required by the AFE.
    keys = ('author', 'doc', 'name', 'time', 'test_type', 'experimental',
            'test_category', 'test_class', 'dependencies', 'run_verify',
            'sync_count', 'job_retries', 'retries', 'path')

    test_objects = []
    _id = 0
    for control_file_path in control_file_list:
        # Read and parse the control file
        if controls_in_batch:
            control_file = control_file_info_list[control_file_path]
        else:
            control_file = cfile_getter.get_control_file_contents(
                    control_file_path)
        try:
            control_obj = control_data.parse_control_string(control_file)
        except Exception:
            logging.info('Failed to parse control file: %s', control_file_path)
            if not ignore_invalid_tests:
                raise
            # Skip the unparsable file; falling through would reuse the
            # control_obj of a previous iteration (or hit an unbound name).
            continue

        # Extract the values needed for the AFE from the control_obj,
        # defaulting to an empty string for attributes it does not have.
        test_object = dict((key, getattr(control_obj, key, ''))
                           for key in keys)

        # Unfortunately, the AFE expects different key-names for certain
        # values, these must be corrected to avoid the risk of tests
        # being omitted by the AFE.
        # The 'id' is an additional value used in the AFE.
        # The control_data parsing does not reference 'run_reset', but it
        # is also used in the AFE and defaults to True.
        test_object['id'] = _id
        test_object['run_reset'] = True
        test_object['description'] = test_object.get('doc', '')
        test_object['test_time'] = test_object.get('time', 0)
        test_object['test_retry'] = test_object.get('retries', 0)

        # Fix the test name to be consistent with the current presentation
        # of test names in the AFE.
        testpath, subname = os.path.split(control_file_path)
        testname = os.path.basename(testpath)
        subname = subname.split('.')[1:]
        if subname:
            testname = '%s:%s' % (testname, ':'.join(subname))

        test_object['name'] = testname

        # Correct the test path as parse_control_string sets an empty string.
        test_object['path'] = control_file_path

        _id += 1
        test_objects.append(test_object)

    test_objects = sorted(test_objects, key=lambda x: x.get('name'))
    return rpc_utils.prepare_for_serialization(test_objects)
Matthew Sartorid96fb9b2015-05-19 18:04:58 -07001080 return rpc_utils.prepare_for_serialization(test_objects)