blob: 5bc716ef8f2ff452f5f1ee0f1574a5d72aac43c0 [file] [log] [blame]
Dan Shia1ecd5c2013-06-06 11:21:31 -07001# Copyright (c) 2013 The Chromium Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
Dan Shia1ecd5c2013-06-06 11:21:31 -07005
Paul Hobbs20cc72a2016-08-30 16:57:05 -07006import contextlib
Fang Deng18699fe2015-12-04 16:40:27 -08007import grp
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -08008import httplib
9import json
Alex Millerdadc2c22013-07-08 15:21:21 -070010import logging
MK Ryu35d661e2014-09-25 17:44:10 -070011import os
beeps023afc62014-02-04 16:59:22 -080012import random
Alex Millerdadc2c22013-07-08 15:21:21 -070013import re
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -080014import time
Paul Drewsbef578d2013-09-24 15:10:36 -070015import urllib2
Alex Millerdadc2c22013-07-08 15:21:21 -070016
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -080017import common
Dan Shief31f032016-05-13 15:51:39 -070018from autotest_lib.client.common_lib import utils
beeps023afc62014-02-04 16:59:22 -080019from autotest_lib.client.common_lib import error
20from autotest_lib.client.common_lib import global_config
MK Ryu0c1a37d2015-04-30 12:00:55 -070021from autotest_lib.client.common_lib import host_queue_entry_states
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -070022from autotest_lib.client.common_lib import host_states
Simran Basi7756a0b2016-03-16 13:10:07 -070023from autotest_lib.server.cros import provision
Dan Shia1ecd5c2013-06-06 11:21:31 -070024from autotest_lib.server.cros.dynamic_suite import constants
Dan Shi7e04fa82013-07-25 15:08:48 -070025from autotest_lib.server.cros.dynamic_suite import job_status
Dan Shia1ecd5c2013-06-06 11:21:31 -070026
Dan Shi82997b92015-05-06 12:08:02 -070027try:
28 from chromite.lib import cros_build_lib
Paul Hobbs20cc72a2016-08-30 16:57:05 -070029 from chromite.lib import ts_mon_config
Dan Shi82997b92015-05-06 12:08:02 -070030except ImportError:
Paul Hobbs20cc72a2016-08-30 16:57:05 -070031 logging.warn('Unable to import chromite. Monarch is disabled.')
Dan Shi82997b92015-05-06 12:08:02 -070032 # Init the module variable to None. Access to this module can check if it
33 # is not None before making calls.
34 cros_build_lib = None
Paul Hobbs20cc72a2016-08-30 16:57:05 -070035 ts_mon_config = None
Dan Shi82997b92015-05-06 12:08:02 -070036
Dan Shia1ecd5c2013-06-06 11:21:31 -070037
Dan Shid37736b2016-07-06 15:10:29 -070038CONFIG = global_config.global_config
39
40_SHERIFF_JS = CONFIG.get_config_value('NOTIFICATIONS', 'sheriffs', default='')
41_LAB_SHERIFF_JS = CONFIG.get_config_value(
42 'NOTIFICATIONS', 'lab_sheriffs', default='')
43_CHROMIUM_BUILD_URL = CONFIG.get_config_value(
44 'NOTIFICATIONS', 'chromium_build_url', default='')
Alex Millerdadc2c22013-07-08 15:21:21 -070045
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -080046LAB_GOOD_STATES = ('open', 'throttled')
47
Dan Shid37736b2016-07-06 15:10:29 -070048ENABLE_DRONE_IN_RESTRICTED_SUBNET = CONFIG.get_config_value(
49 'CROS', 'enable_drone_in_restricted_subnet', type=bool,
50 default=False)
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -080051
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -070052# Wait at most 10 mins for duts to go idle.
53IDLE_DUT_WAIT_TIMEOUT = 600
54
Dan Shi43274402016-11-04 15:13:43 -070055# Mapping between board name and build target. This is for special case handling
56# for certain Android board that the board name and build target name does not
57# match.
tturney08fc62e2016-11-17 15:44:30 -080058ANDROID_TARGET_TO_BOARD_MAP = {
59 'seed_l8150': 'gm4g_sprout',
60 'bat_land': 'bat'
61 }
62ANDROID_BOARD_TO_TARGET_MAP = {
63 'gm4g_sprout': 'seed_l8150',
64 'bat': 'bat_land'
65 }
Dan Shi43274402016-11-04 15:13:43 -070066
J. Richard Barnetteabbe0962013-12-10 18:15:44 -080067class TestLabException(Exception):
68 """Exception raised when the Test Lab blocks a test or suite."""
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -080069 pass
70
71
72class ParseBuildNameException(Exception):
73 """Raised when ParseBuildName() cannot parse a build name."""
74 pass
75
76
Fang Dengf08814a2015-08-03 18:12:18 +000077class Singleton(type):
78 """Enforce that only one client class is instantiated per process."""
79 _instances = {}
80
81 def __call__(cls, *args, **kwargs):
82 """Fetch the instance of a class to use for subsequent calls."""
83 if cls not in cls._instances:
84 cls._instances[cls] = super(Singleton, cls).__call__(
85 *args, **kwargs)
86 return cls._instances[cls]
87
Kevin Cheng05ae2a42016-06-06 10:12:48 -070088class EmptyAFEHost(object):
89 """Object to represent an AFE host object when there is no AFE."""
90
91 def __init__(self):
92 """
93 We'll be setting the instance attributes as we use them. Right now
94 we only use attributes and labels but as time goes by and other
95 attributes are used from an actual AFE Host object (check
96 rpc_interfaces.get_hosts()), we'll add them in here so users won't be
97 perplexed why their host's afe_host object complains that attribute
98 doesn't exist.
99 """
100 self.attributes = {}
101 self.labels = []
102
Fang Dengf08814a2015-08-03 18:12:18 +0000103
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800104def ParseBuildName(name):
105 """Format a build name, given board, type, milestone, and manifest num.
106
Simran Basib7d21162014-05-21 15:26:16 -0700107 @param name: a build name, e.g. 'x86-alex-release/R20-2015.0.0' or a
108 relative build name, e.g. 'x86-alex-release/LATEST'
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800109
110 @return board: board the manifest is for, e.g. x86-alex.
111 @return type: one of 'release', 'factory', or 'firmware'
112 @return milestone: (numeric) milestone the manifest was associated with.
Simran Basib7d21162014-05-21 15:26:16 -0700113 Will be None for relative build names.
114 @return manifest: manifest number, e.g. '2015.0.0'.
115 Will be None for relative build names.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800116
117 """
Dan Shie02810d2016-08-25 09:44:57 -0700118 match = re.match(r'(trybot-)?(?P<board>[\w-]+?)(?:-chrome)?(?:-chromium)?'
119 r'-(?P<type>\w+)/(R(?P<milestone>\d+)-'
120 r'(?P<manifest>[\d.ab-]+)|LATEST)',
Simran Basif8f648e2014-09-09 11:40:03 -0700121 name)
122 if match and len(match.groups()) >= 5:
Simran Basib7d21162014-05-21 15:26:16 -0700123 return (match.group('board'), match.group('type'),
124 match.group('milestone'), match.group('manifest'))
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800125 raise ParseBuildNameException('%s is a malformed build name.' % name)
126
Alex Millerdadc2c22013-07-08 15:21:21 -0700127
Dan Shi3d7a0e12015-10-12 11:55:45 -0700128def get_labels_from_afe(hostname, label_prefix, afe):
129 """Retrieve a host's specific labels from the AFE.
130
131 Looks for the host labels that have the form <label_prefix>:<value>
132 and returns the "<value>" part of the label. None is returned
133 if there is not a label matching the pattern
134
135 @param hostname: hostname of given DUT.
136 @param label_prefix: prefix of label to be matched, e.g., |board:|
137 @param afe: afe instance.
138
139 @returns A list of labels that match the prefix or 'None'
140
141 """
142 labels = afe.get_labels(name__startswith=label_prefix,
143 host__hostname__in=[hostname])
144 if labels:
145 return [l.name.split(label_prefix, 1)[1] for l in labels]
146
147
Dan Shia1ecd5c2013-06-06 11:21:31 -0700148def get_label_from_afe(hostname, label_prefix, afe):
149 """Retrieve a host's specific label from the AFE.
150
151 Looks for a host label that has the form <label_prefix>:<value>
152 and returns the "<value>" part of the label. None is returned
153 if there is not a label matching the pattern
154
155 @param hostname: hostname of given DUT.
156 @param label_prefix: prefix of label to be matched, e.g., |board:|
157 @param afe: afe instance.
158 @returns the label that matches the prefix or 'None'
159
160 """
Dan Shi3d7a0e12015-10-12 11:55:45 -0700161 labels = get_labels_from_afe(hostname, label_prefix, afe)
Dan Shia1ecd5c2013-06-06 11:21:31 -0700162 if labels and len(labels) == 1:
Dan Shi3d7a0e12015-10-12 11:55:45 -0700163 return labels[0]
Dan Shia1ecd5c2013-06-06 11:21:31 -0700164
165
166def get_board_from_afe(hostname, afe):
167 """Retrieve given host's board from its labels in the AFE.
168
169 Looks for a host label of the form "board:<board>", and
170 returns the "<board>" part of the label. `None` is returned
171 if there is not a single, unique label matching the pattern.
172
173 @param hostname: hostname of given DUT.
174 @param afe: afe instance.
175 @returns board from label, or `None`.
176
177 """
178 return get_label_from_afe(hostname, constants.BOARD_PREFIX, afe)
179
180
181def get_build_from_afe(hostname, afe):
182 """Retrieve the current build for given host from the AFE.
183
184 Looks through the host's labels in the AFE to determine its build.
185
186 @param hostname: hostname of given DUT.
187 @param afe: afe instance.
188 @returns The current build or None if it could not find it or if there
189 were multiple build labels assigned to this host.
190
191 """
Simran Basi7756a0b2016-03-16 13:10:07 -0700192 for prefix in [provision.CROS_VERSION_PREFIX,
193 provision.ANDROID_BUILD_VERSION_PREFIX]:
194 build = get_label_from_afe(hostname, prefix + ':', afe)
195 if build:
196 return build
197 return None
Dan Shia1ecd5c2013-06-06 11:21:31 -0700198
199
Allen Li6a612392016-08-18 12:09:32 -0700200# TODO(fdeng): fix get_sheriffs crbug.com/483254
Fang Deng3197b392013-06-26 11:42:02 -0700201def get_sheriffs(lab_only=False):
Alex Millerdadc2c22013-07-08 15:21:21 -0700202 """
203 Polls the javascript file that holds the identity of the sheriff and
204 parses it's output to return a list of chromium sheriff email addresses.
205 The javascript file can contain the ldap of more than one sheriff, eg:
206 document.write('sheriff_one, sheriff_two').
207
Fang Deng3197b392013-06-26 11:42:02 -0700208 @param lab_only: if True, only pulls lab sheriff.
209 @return: A list of chroium.org sheriff email addresses to cc on the bug.
210 An empty list if failed to parse the javascript.
Alex Millerdadc2c22013-07-08 15:21:21 -0700211 """
212 sheriff_ids = []
Fang Deng3197b392013-06-26 11:42:02 -0700213 sheriff_js_list = _LAB_SHERIFF_JS.split(',')
214 if not lab_only:
215 sheriff_js_list.extend(_SHERIFF_JS.split(','))
216
217 for sheriff_js in sheriff_js_list:
Alex Millerdadc2c22013-07-08 15:21:21 -0700218 try:
Dan Shief31f032016-05-13 15:51:39 -0700219 url_content = utils.urlopen('%s%s'% (
Alex Millerdadc2c22013-07-08 15:21:21 -0700220 _CHROMIUM_BUILD_URL, sheriff_js)).read()
221 except (ValueError, IOError) as e:
beeps4efdf032013-09-17 11:27:14 -0700222 logging.warning('could not parse sheriff from url %s%s: %s',
223 _CHROMIUM_BUILD_URL, sheriff_js, str(e))
Paul Drewsbef578d2013-09-24 15:10:36 -0700224 except (urllib2.URLError, httplib.HTTPException) as e:
225 logging.warning('unexpected error reading from url "%s%s": %s',
226 _CHROMIUM_BUILD_URL, sheriff_js, str(e))
Alex Millerdadc2c22013-07-08 15:21:21 -0700227 else:
228 ldaps = re.search(r"document.write\('(.*)'\)", url_content)
229 if not ldaps:
beeps4efdf032013-09-17 11:27:14 -0700230 logging.warning('Could not retrieve sheriff ldaps for: %s',
231 url_content)
Alex Millerdadc2c22013-07-08 15:21:21 -0700232 continue
233 sheriff_ids += ['%s@chromium.org' % alias.replace(' ', '')
234 for alias in ldaps.group(1).split(',')]
235 return sheriff_ids
beeps46dadc92013-11-07 14:07:10 -0800236
237
238def remote_wget(source_url, dest_path, ssh_cmd):
239 """wget source_url from localhost to dest_path on remote host using ssh.
240
241 @param source_url: The complete url of the source of the package to send.
242 @param dest_path: The path on the remote host's file system where we would
243 like to store the package.
244 @param ssh_cmd: The ssh command to use in performing the remote wget.
245 """
246 wget_cmd = ("wget -O - %s | %s 'cat >%s'" %
247 (source_url, ssh_cmd, dest_path))
Dan Shief31f032016-05-13 15:51:39 -0700248 utils.run(wget_cmd)
beeps46dadc92013-11-07 14:07:10 -0800249
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800250
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800251_MAX_LAB_STATUS_ATTEMPTS = 5
252def _get_lab_status(status_url):
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800253 """Grabs the current lab status and message.
254
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800255 @returns The JSON object obtained from the given URL.
256
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800257 """
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800258 retry_waittime = 1
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800259 for _ in range(_MAX_LAB_STATUS_ATTEMPTS):
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800260 try:
261 response = urllib2.urlopen(status_url)
262 except IOError as e:
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800263 logging.debug('Error occurred when grabbing the lab status: %s.',
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800264 e)
265 time.sleep(retry_waittime)
266 continue
267 # Check for successful response code.
268 if response.getcode() == 200:
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800269 return json.load(response)
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800270 time.sleep(retry_waittime)
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800271 return None
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800272
273
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800274def _decode_lab_status(lab_status, build):
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800275 """Decode lab status, and report exceptions as needed.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800276
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800277 Take a deserialized JSON object from the lab status page, and
278 interpret it to determine the actual lab status. Raise
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800279 exceptions as required to report when the lab is down.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800280
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800281 @param build: build name that we want to check the status of.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800282
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800283 @raises TestLabException Raised if a request to test for the given
284 status and build should be blocked.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800285 """
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800286 # First check if the lab is up.
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800287 if not lab_status['general_state'] in LAB_GOOD_STATES:
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800288 raise TestLabException('Chromium OS Test Lab is closed: '
289 '%s.' % lab_status['message'])
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800290
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800291 # Check if the build we wish to use is disabled.
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800292 # Lab messages should be in the format of:
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800293 # Lab is 'status' [regex ...] (comment)
294 # If the build name matches any regex, it will be blocked.
295 build_exceptions = re.search('\[(.*)\]', lab_status['message'])
Prashanth Balasubramanianae437212014-10-27 11:17:26 -0700296 if not build_exceptions or not build:
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800297 return
298 for build_pattern in build_exceptions.group(1).split():
J. Richard Barnette7f215d32015-06-19 12:44:38 -0700299 if re.match(build_pattern, build):
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800300 raise TestLabException('Chromium OS Test Lab is closed: '
301 '%s matches %s.' % (
302 build, build_pattern))
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800303 return
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800304
305
Dan Shi94234cb2014-05-23 20:04:31 -0700306def is_in_lab():
307 """Check if current Autotest instance is in lab
308
309 @return: True if the Autotest instance is in lab.
310 """
Dan Shid37736b2016-07-06 15:10:29 -0700311 test_server_name = CONFIG.get_config_value('SERVER', 'hostname')
Dan Shi94234cb2014-05-23 20:04:31 -0700312 return test_server_name.startswith('cautotest')
313
314
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800315def check_lab_status(build):
316 """Check if the lab status allows us to schedule for a build.
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800317
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800318 Checks if the lab is down, or if testing for the requested build
319 should be blocked.
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800320
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800321 @param build: Name of the build to be scheduled for testing.
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800322
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800323 @raises TestLabException Raised if a request to test for the given
324 status and build should be blocked.
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800325
326 """
327 # Ensure we are trying to schedule on the actual lab.
Dan Shi94234cb2014-05-23 20:04:31 -0700328 if not is_in_lab():
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800329 return
330
331 # Download the lab status from its home on the web.
Dan Shid37736b2016-07-06 15:10:29 -0700332 status_url = CONFIG.get_config_value('CROS', 'lab_status_url')
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800333 json_status = _get_lab_status(status_url)
334 if json_status is None:
335 # We go ahead and say the lab is open if we can't get the status.
Ilja H. Friedel04be2bd2014-05-07 21:29:59 -0700336 logging.warning('Could not get a status from %s', status_url)
J. Richard Barnette266da2a2013-11-27 15:09:55 -0800337 return
J. Richard Barnetteabbe0962013-12-10 18:15:44 -0800338 _decode_lab_status(json_status, build)
beeps023afc62014-02-04 16:59:22 -0800339
340
341def lock_host_with_labels(afe, lock_manager, labels):
342 """Lookup and lock one host that matches the list of input labels.
343
344 @param afe: An instance of the afe class, as defined in server.frontend.
345 @param lock_manager: A lock manager capable of locking hosts, eg the
346 one defined in server.cros.host_lock_manager.
347 @param labels: A list of labels to look for on hosts.
348
349 @return: The hostname of a host matching all labels, and locked through the
350 lock_manager. The hostname will be as specified in the database the afe
351 object is associated with, i.e if it exists in afe_hosts with a .cros
352 suffix, the hostname returned will contain a .cros suffix.
353
354 @raises: error.NoEligibleHostException: If no hosts matching the list of
355 input labels are available.
356 @raises: error.TestError: If unable to lock a host matching the labels.
357 """
358 potential_hosts = afe.get_hosts(multiple_labels=labels)
359 if not potential_hosts:
360 raise error.NoEligibleHostException(
361 'No devices found with labels %s.' % labels)
362
363 # This prevents errors where a fault might seem repeatable
364 # because we lock, say, the same packet capturer for each test run.
365 random.shuffle(potential_hosts)
366 for host in potential_hosts:
367 if lock_manager.lock([host.hostname]):
368 logging.info('Locked device %s with labels %s.',
369 host.hostname, labels)
370 return host.hostname
371 else:
372 logging.info('Unable to lock device %s with labels %s.',
373 host.hostname, labels)
374
375 raise error.TestError('Could not lock a device with labels %s' % labels)
Dan Shi7e04fa82013-07-25 15:08:48 -0700376
377
378def get_test_views_from_tko(suite_job_id, tko):
379 """Get test name and result for given suite job ID.
380
381 @param suite_job_id: ID of suite job.
382 @param tko: an instance of TKO as defined in server/frontend.py.
383 @return: A dictionary of test status keyed by test name, e.g.,
384 {'dummy_Fail.Error': 'ERROR', 'dummy_Fail.NAError': 'TEST_NA'}
385 @raise: Exception when there is no test view found.
386
387 """
388 views = tko.run('get_detailed_test_views', afe_job_id=suite_job_id)
389 relevant_views = filter(job_status.view_is_relevant, views)
390 if not relevant_views:
391 raise Exception('Failed to retrieve job results.')
392
393 test_views = {}
394 for view in relevant_views:
395 test_views[view['test_name']] = view['status']
396
397 return test_views
MK Ryu35d661e2014-09-25 17:44:10 -0700398
399
MK Ryuc9c0c3f2014-10-27 14:36:01 -0700400def get_data_key(prefix, suite, build, board):
401 """
402 Constructs a key string from parameters.
403
404 @param prefix: Prefix for the generating key.
405 @param suite: a suite name. e.g., bvt-cq, bvt-inline, dummy
406 @param build: The build string. This string should have a consistent
407 format eg: x86-mario-release/R26-3570.0.0. If the format of this
408 string changes such that we can't determine build_type or branch
409 we give up and use the parametes we're sure of instead (suite,
410 board). eg:
411 1. build = x86-alex-pgo-release/R26-3570.0.0
412 branch = 26
413 build_type = pgo-release
414 2. build = lumpy-paladin/R28-3993.0.0-rc5
415 branch = 28
416 build_type = paladin
417 @param board: The board that this suite ran on.
418 @return: The key string used for a dictionary.
419 """
420 try:
421 _board, build_type, branch = ParseBuildName(build)[:3]
422 except ParseBuildNameException as e:
423 logging.error(str(e))
424 branch = 'Unknown'
425 build_type = 'Unknown'
426 else:
427 embedded_str = re.search(r'x86-\w+-(.*)', _board)
428 if embedded_str:
429 build_type = embedded_str.group(1) + '-' + build_type
430
431 data_key_dict = {
432 'prefix': prefix,
433 'board': board,
434 'branch': branch,
435 'build_type': build_type,
436 'suite': suite,
437 }
438 return ('%(prefix)s.%(board)s.%(build_type)s.%(branch)s.%(suite)s'
439 % data_key_dict)
MK Ryu83184352014-12-10 14:59:40 -0800440
441
MK Ryu2d0a3642015-01-07 15:11:19 -0800442def setup_logging(logfile=None, prefix=False):
MK Ryu83184352014-12-10 14:59:40 -0800443 """Setup basic logging with all logging info stripped.
444
445 Calls to logging will only show the message. No severity is logged.
446
447 @param logfile: If specified dump output to a file as well.
MK Ryu2d0a3642015-01-07 15:11:19 -0800448 @param prefix: Flag for log prefix. Set to True to add prefix to log
449 entries to include timestamp and log level. Default is False.
MK Ryu83184352014-12-10 14:59:40 -0800450 """
451 # Remove all existing handlers. client/common_lib/logging_config adds
452 # a StreamHandler to logger when modules are imported, e.g.,
453 # autotest_lib.client.bin.utils. A new StreamHandler will be added here to
454 # log only messages, not severity.
455 logging.getLogger().handlers = []
456
MK Ryu2d0a3642015-01-07 15:11:19 -0800457 if prefix:
458 log_format = '%(asctime)s %(levelname)-5s| %(message)s'
459 else:
460 log_format = '%(message)s'
461
MK Ryu83184352014-12-10 14:59:40 -0800462 screen_handler = logging.StreamHandler()
MK Ryu2d0a3642015-01-07 15:11:19 -0800463 screen_handler.setFormatter(logging.Formatter(log_format))
MK Ryu83184352014-12-10 14:59:40 -0800464 logging.getLogger().addHandler(screen_handler)
465 logging.getLogger().setLevel(logging.INFO)
466 if logfile:
467 file_handler = logging.FileHandler(logfile)
MK Ryu2d0a3642015-01-07 15:11:19 -0800468 file_handler.setFormatter(logging.Formatter(log_format))
MK Ryu83184352014-12-10 14:59:40 -0800469 file_handler.setLevel(logging.DEBUG)
470 logging.getLogger().addHandler(file_handler)
Prashanth Balasubramanian8c98ac12014-12-23 11:26:44 -0800471
472
473def is_shard():
474 """Determines if this instance is running as a shard.
475
476 Reads the global_config value shard_hostname in the section SHARD.
477
478 @return True, if shard_hostname is set, False otherwise.
479 """
Dan Shid37736b2016-07-06 15:10:29 -0700480 hostname = CONFIG.get_config_value('SHARD', 'shard_hostname', default=None)
MK Ryu0c1a37d2015-04-30 12:00:55 -0700481 return bool(hostname)
482
483
Fang Deng0cb2a3b2015-12-10 17:59:00 -0800484def get_global_afe_hostname():
485 """Read the hostname of the global AFE from the global configuration."""
Dan Shid37736b2016-07-06 15:10:29 -0700486 return CONFIG.get_config_value('SERVER', 'global_afe_hostname')
Fang Deng0cb2a3b2015-12-10 17:59:00 -0800487
488
Fang Deng18699fe2015-12-04 16:40:27 -0800489def is_restricted_user(username):
490 """Determines if a user is in a restricted group.
491
492 User in restricted group only have access to master.
493
494 @param username: A string, representing a username.
495
496 @returns: True if the user is in a restricted group.
497 """
498 if not username:
499 return False
500
Dan Shid37736b2016-07-06 15:10:29 -0700501 restricted_groups = CONFIG.get_config_value(
Fang Deng18699fe2015-12-04 16:40:27 -0800502 'AUTOTEST_WEB', 'restricted_groups', default='').split(',')
503 for group in restricted_groups:
Fang Deng5229c852016-02-09 13:30:31 -0800504 try:
505 if group and username in grp.getgrnam(group).gr_mem:
506 return True
507 except KeyError as e:
508 logging.debug("%s is not a valid group.", group)
Fang Deng18699fe2015-12-04 16:40:27 -0800509 return False
510
511
MK Ryu0c1a37d2015-04-30 12:00:55 -0700512def get_special_task_status(is_complete, success, is_active):
513 """Get the status of a special task.
514
515 Emulate a host queue entry status for a special task
516 Although SpecialTasks are not HostQueueEntries, it is helpful to
517 the user to present similar statuses.
518
519 @param is_complete Boolean if the task is completed.
520 @param success Boolean if the task succeeded.
521 @param is_active Boolean if the task is active.
522
523 @return The status of a special task.
524 """
525 if is_complete:
526 if success:
527 return host_queue_entry_states.Status.COMPLETED
528 return host_queue_entry_states.Status.FAILED
529 if is_active:
530 return host_queue_entry_states.Status.RUNNING
531 return host_queue_entry_states.Status.QUEUED
532
533
534def get_special_task_exec_path(hostname, task_id, task_name, time_requested):
535 """Get the execution path of the SpecialTask.
536
537 This method returns different paths depending on where a
538 the task ran:
539 * Master: hosts/hostname/task_id-task_type
540 * Shard: Master_path/time_created
541 This is to work around the fact that a shard can fail independent
542 of the master, and be replaced by another shard that has the same
543 hosts. Without the time_created stamp the logs of the tasks running
544 on the second shard will clobber the logs from the first in google
545 storage, because task ids are not globally unique.
546
547 @param hostname Hostname
548 @param task_id Special task id
549 @param task_name Special task name (e.g., Verify, Repair, etc)
550 @param time_requested Special task requested time.
551
552 @return An execution path for the task.
553 """
554 results_path = 'hosts/%s/%s-%s' % (hostname, task_id, task_name.lower())
555
556 # If we do this on the master it will break backward compatibility,
557 # as there are tasks that currently don't have timestamps. If a host
558 # or job has been sent to a shard, the rpc for that host/job will
559 # be redirected to the shard, so this global_config check will happen
560 # on the shard the logs are on.
561 if not is_shard():
562 return results_path
563
564 # Generate a uid to disambiguate special task result directories
565 # in case this shard fails. The simplest uid is the job_id, however
566 # in rare cases tasks do not have jobs associated with them (eg:
567 # frontend verify), so just use the creation timestamp. The clocks
568 # between a shard and master should always be in sync. Any discrepancies
569 # will be brought to our attention in the form of job timeouts.
570 uid = time_requested.strftime('%Y%d%m%H%M%S')
571
572 # TODO: This is a hack, however it is the easiest way to achieve
573 # correctness. There is currently some debate over the future of
574 # tasks in our infrastructure and refactoring everything right
575 # now isn't worth the time.
576 return '%s/%s' % (results_path, uid)
577
578
579def get_job_tag(id, owner):
580 """Returns a string tag for a job.
581
582 @param id Job id
583 @param owner Job owner
584
585 """
586 return '%s-%s' % (id, owner)
587
588
589def get_hqe_exec_path(tag, execution_subdir):
590 """Returns a execution path to a HQE's results.
591
592 @param tag Tag string for a job associated with a HQE.
593 @param execution_subdir Execution sub-directory string of a HQE.
594
595 """
596 return os.path.join(tag, execution_subdir)
Dan Shi82997b92015-05-06 12:08:02 -0700597
598
599def is_inside_chroot():
600 """Check if the process is running inside chroot.
601
602 This is a wrapper around chromite.lib.cros_build_lib.IsInsideChroot(). The
603 method checks if cros_build_lib can be imported first.
604
605 @return: True if the process is running inside chroot or cros_build_lib
606 cannot be imported.
607
608 """
J. Richard Barnette7f215d32015-06-19 12:44:38 -0700609 return not cros_build_lib or cros_build_lib.IsInsideChroot()
Dan Shi70647ca2015-07-16 22:52:35 -0700610
611
612def parse_job_name(name):
613 """Parse job name to get information including build, board and suite etc.
614
615 Suite job created by run_suite follows the naming convention of:
616 [build]-test_suites/control.[suite]
617 For example: lumpy-release/R46-7272.0.0-test_suites/control.bvt
Allen Licdd00f22017-02-01 18:01:52 -0800618 The naming convention is defined in rpc_interface.create_suite_job.
Dan Shi70647ca2015-07-16 22:52:35 -0700619
620 Test job created by suite job follows the naming convention of:
621 [build]/[suite]/[test name]
622 For example: lumpy-release/R46-7272.0.0/bvt/login_LoginSuccess
623 The naming convention is defined in
624 server/cros/dynamic_suite/tools.create_job_name
625
626 Note that pgo and chrome-perf builds will fail the method. Since lab does
627 not run test for these builds, they can be ignored.
Dan Shief31f032016-05-13 15:51:39 -0700628 Also, tests for Launch Control builds have different naming convention.
629 The build ID will be used as build_version.
Dan Shi70647ca2015-07-16 22:52:35 -0700630
631 @param name: Name of the job.
632
633 @return: A dictionary containing the test information. The keyvals include:
634 build: Name of the build, e.g., lumpy-release/R46-7272.0.0
635 build_version: The version of the build, e.g., R46-7272.0.0
636 board: Name of the board, e.g., lumpy
637 suite: Name of the test suite, e.g., bvt
638
639 """
640 info = {}
Dan Shief31f032016-05-13 15:51:39 -0700641 suite_job_regex = '([^/]*/[^/]*(?:/\d+)?)-test_suites/control\.(.*)'
642 test_job_regex = '([^/]*/[^/]*(?:/\d+)?)/([^/]+)/.*'
Dan Shi70647ca2015-07-16 22:52:35 -0700643 match = re.match(suite_job_regex, name)
644 if not match:
645 match = re.match(test_job_regex, name)
646 if match:
647 info['build'] = match.groups()[0]
648 info['suite'] = match.groups()[1]
649 info['build_version'] = info['build'].split('/')[1]
650 try:
651 info['board'], _, _, _ = ParseBuildName(info['build'])
652 except ParseBuildNameException:
Dan Shief31f032016-05-13 15:51:39 -0700653 # Try to parse it as Launch Control build
654 # Launch Control builds have name format:
655 # branch/build_target-build_type/build_id.
656 try:
657 _, target, build_id = utils.parse_launch_control_build(
658 info['build'])
659 build_target, _ = utils.parse_launch_control_target(target)
660 if build_target:
661 info['board'] = build_target
662 info['build_version'] = build_id
663 except ValueError:
664 pass
Dan Shi70647ca2015-07-16 22:52:35 -0700665 return info
Kevin Cheng3a4a57a2015-09-30 12:09:50 -0700666
667
668def add_label_detector(label_function_list, label_list=None, label=None):
669 """Decorator used to group functions together into the provided list.
670
671 This is a helper function to automatically add label functions that have
672 the label decorator. This is to help populate the class list of label
673 functions to be retrieved by the get_labels class method.
674
675 @param label_function_list: List of label detecting functions to add
676 decorated function to.
677 @param label_list: List of detectable labels to add detectable labels to.
678 (Default: None)
679 @param label: Label string that is detectable by this detection function
680 (Default: None)
681 """
682 def add_func(func):
683 """
684 @param func: The function to be added as a detector.
685 """
686 label_function_list.append(func)
687 if label and label_list is not None:
688 label_list.append(label)
689 return func
690 return add_func
Simran Basi9f364a62015-12-07 14:15:19 -0800691
692
693def verify_not_root_user():
694 """Simple function to error out if running with uid == 0"""
695 if os.getuid() == 0:
Simran Basi1bf60eb2015-12-01 16:39:29 -0800696 raise error.IllegalUser('This script can not be ran as root.')
697
698
699def get_hostname_from_machine(machine):
700 """Lookup hostname from a machine string or dict.
701
702 @returns: Machine hostname in string format.
703 """
704 hostname, _ = get_host_info_from_machine(machine)
705 return hostname
706
707
708def get_host_info_from_machine(machine):
709 """Lookup host information from a machine string or dict.
710
Kevin Cheng05ae2a42016-06-06 10:12:48 -0700711 @returns: Tuple of (hostname, afe_host)
Simran Basi1bf60eb2015-12-01 16:39:29 -0800712 """
713 if isinstance(machine, dict):
Kevin Cheng05ae2a42016-06-06 10:12:48 -0700714 return (machine['hostname'], machine['afe_host'])
Simran Basi1bf60eb2015-12-01 16:39:29 -0800715 else:
Kevin Cheng05ae2a42016-06-06 10:12:48 -0700716 return (machine, EmptyAFEHost())
717
718
719def get_afe_host_from_machine(machine):
720 """Return the afe_host from the machine dict if possible.
721
722 @returns: AFE host object.
723 """
724 _, afe_host = get_host_info_from_machine(machine)
725 return afe_host
Fang Dengf8a94e22015-12-07 13:39:13 -0800726
727
728def get_creds_abspath(creds_file):
729 """Returns the abspath of the credentials file.
730
731 If creds_file is already an absolute path, just return it.
732 Otherwise, assume it is located in the creds directory
733 specified in global_config and return the absolute path.
734
735 @param: creds_path, a path to the credentials.
736 @return: An absolute path to the credentials file.
737 """
738 if not creds_file:
739 return None
740 if os.path.isabs(creds_file):
741 return creds_file
Dan Shid37736b2016-07-06 15:10:29 -0700742 creds_dir = CONFIG.get_config_value('SERVER', 'creds_dir', default='')
Fang Dengf8a94e22015-12-07 13:39:13 -0800743 if not creds_dir or not os.path.exists(creds_dir):
744 creds_dir = common.autotest_dir
745 return os.path.join(creds_dir, creds_file)
Kevin Cheng3b111812015-12-15 11:52:08 -0800746
747
748def machine_is_testbed(machine):
749 """Checks if the machine is a testbed.
750
751 The signal we use to determine if the machine is a testbed
752 is if the host attributes contain more than 1 serial.
753
754 @param machine: is a list of dicts
755
756 @return: True if the machine is a testbed, False otherwise.
757 """
Kevin Cheng05ae2a42016-06-06 10:12:48 -0700758 _, afe_host = get_host_info_from_machine(machine)
759 return len(afe_host.attributes.get('serials', '').split(',')) > 1
Paul Hobbs20cc72a2016-08-30 16:57:05 -0700760
761
762def SetupTsMonGlobalState(*args, **kwargs):
763 """Import-safe wrap around chromite.lib.ts_mon_config's setup function.
764
765 @param *args: Args to pass through.
766 @param **kwargs: Kwargs to pass through.
767 """
768 if ts_mon_config:
Paul Hobbs604fc872016-09-29 16:41:55 -0700769 try:
770 context = ts_mon_config.SetupTsMonGlobalState(*args, **kwargs)
771 if hasattr(context, '__exit__'):
772 return context
773 except Exception as e:
774 logging.warning('Caught an exception trying to setup ts_mon, '
775 'monitoring is disabled: %s', e, exc_info=True)
776 return TrivialContextManager()
Paul Hobbs20cc72a2016-08-30 16:57:05 -0700777 else:
Paul Hobbs930ed9d2016-09-28 15:59:08 -0700778 return TrivialContextManager()
Paul Hobbs20cc72a2016-08-30 16:57:05 -0700779
780
781@contextlib.contextmanager
Paul Hobbs604fc872016-09-29 16:41:55 -0700782def TrivialContextManager(*args, **kwargs):
783 """Context manager that does nothing.
784
785 @param *args: Ignored args
786 @param **kwargs: Ignored kwargs.
787 """
Paul Hobbs20cc72a2016-08-30 16:57:05 -0700788 yield
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700789
790
791def wait_for_idle_duts(duts, afe, max_wait=IDLE_DUT_WAIT_TIMEOUT):
792 """Wait for the hosts to all go idle.
793
794 @param duts: List of duts to check for idle state.
795 @param afe: afe instance.
796 @param max_wait: Max wait time in seconds.
797
798 @returns Boolean True if all hosts are idle or False if any hosts did not
799 go idle within max_wait.
800 """
801 start_time = time.time()
802 # We make a shallow copy since we're going to be modifying active_dut_list.
803 active_dut_list = duts[:]
804 while active_dut_list:
805 # Let's rate-limit how often we hit the AFE.
806 time.sleep(1)
807
808 # Check if we've waited too long.
809 if (time.time() - start_time) > max_wait:
810 return False
811
812 idle_duts = []
813 # Get the status for the duts and see if they're in the idle state.
814 afe_hosts = afe.get_hosts(active_dut_list)
815 idle_duts = [afe_host.hostname for afe_host in afe_hosts
816 if afe_host.status in host_states.IDLE_STATES]
817
818 # Take out idle duts so we don't needlessly check them
819 # next time around.
820 for idle_dut in idle_duts:
821 active_dut_list.remove(idle_dut)
822
823 logging.info('still waiting for following duts to go idle: %s',
824 active_dut_list)
825 return True
826
827
828@contextlib.contextmanager
829def lock_duts_and_wait(duts, afe, lock_msg='default lock message',
830 max_wait=IDLE_DUT_WAIT_TIMEOUT):
831 """Context manager to lock the duts and wait for them to go idle.
832
833 @param duts: List of duts to lock.
834 @param afe: afe instance.
835
836 @returns Boolean lock_success where True if all duts locked successfully or
837 False if we timed out waiting too long for hosts to go idle.
838 """
839 try:
840 locked_duts = []
841 duts.sort()
842 for dut in duts:
843 if afe.lock_host(dut, lock_msg, fail_if_locked=True):
844 locked_duts.append(dut)
845 else:
846 logging.info('%s already locked', dut)
847 yield wait_for_idle_duts(locked_duts, afe, max_wait)
848 finally:
849 afe.unlock_hosts(locked_duts)
Dan Shib5b8b4f2016-11-02 14:04:02 -0700850
851
852def board_labels_allowed(boards):
853 """Check if the list of board labels can be set to a single host.
854
855 The only case multiple board labels can be set to a single host is for
856 testbed, which may have a list of board labels like
857 board:angler-1, board:angler-2, board:angler-3, board:marlin-1'
858
859 @param boards: A list of board labels (may include platform label).
860
861 @returns True if the the list of boards can be set to a single host.
862 """
863 # Filter out any non-board labels
864 boards = [b for b in boards if re.match('board:.*', b)]
865 if len(boards) <= 1:
866 return True
867 for board in boards:
868 if not re.match('board:[^-]+-\d+', board):
869 return False
870 return True