blob: 1489799cf07834aa29dc8ca32362f41aa3e777a3 [file] [log] [blame]
mbligh6203ace2007-10-04 21:54:24 +00001#!/usr/bin/python -u
mbligh1ffd5dc2008-11-25 13:24:05 +00002# Copyright 2007-2008 Martin J. Bligh <mbligh@google.com>, Google Inc.
mbligh82648e52008-11-20 16:54:25 +00003# Released under the GPL v2
mblighdcd57a82007-07-11 23:06:47 +00004
mblighc8949b82007-07-23 16:33:58 +00005"""
Aviv Keshetde6bb192013-01-30 16:17:22 -08006Run a control file through the server side engine
mblighdcd57a82007-07-11 23:06:47 +00007"""
mbligh1ffd5dc2008-11-25 13:24:05 +00008
Fang Deng042c1472014-10-23 13:56:41 -07009import ast
10import datetime
11import getpass
12import logging
13import os
14import re
15import signal
Dan Shicf4d2032015-03-12 15:04:21 -070016import socket
Fang Deng042c1472014-10-23 13:56:41 -070017import sys
18import traceback
19import time
20import urllib2
mbligh1ffd5dc2008-11-25 13:24:05 +000021
mblighf5427bb2008-04-09 15:55:57 +000022import common
mbligh9ff89cd2009-09-03 20:28:17 +000023
Dan Shia1ecd5c2013-06-06 11:21:31 -070024from autotest_lib.client.common_lib import control_data
25from autotest_lib.client.common_lib import global_config
Dan Shi37bee222015-04-13 15:46:47 -070026from autotest_lib.client.common_lib.cros.graphite import autotest_es
27from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Prashanth Balasubramanianf8b83712014-11-06 15:58:21 -080028try:
29 from autotest_lib.puppylab import results_mocker
30except ImportError:
31 results_mocker = None
32
# Value of AUTOSERV/require_atfork_module from the global config; True when
# the setting is absent.
# NOTE(review): nothing in the visible source reads this name, and the
# ImportError handler for atfork below re-reads the same setting with
# default=False -- confirm which default is intended.
require_atfork = global_config.global_config.get_config_value(
        'AUTOSERV', 'require_atfork_module', type=bool, default=True)
35
Dan Shia1ecd5c2013-06-06 11:21:31 -070036
# Number of seconds to wait before returning if testing mode is enabled.
# NOTE(review): not referenced anywhere in the visible source -- confirm it is
# still consumed somewhere before relying on it.
TESTING_MODE_SLEEP_SECS = 1
Jakob Jueliche497b552014-09-23 19:11:59 -070039
# Install the atfork hooks at import time. When the module is missing, abort
# only if AUTOSERV/require_atfork_module is enabled in the global config;
# otherwise carry on without the fork-safety fixes.
try:
    import atfork
    atfork.monkeypatch_os_fork_functions()
    import atfork.stdlib_fixer
    # Fix the Python standard library for threading+fork safety with its
    # internal locks.  http://code.google.com/p/python-atfork/
    import warnings
    warnings.filterwarnings('ignore', 'logging module already imported')
    atfork.stdlib_fixer.fix_logging_module()
except ImportError as e:
    from autotest_lib.client.common_lib import global_config
    if global_config.global_config.get_config_value(
            'AUTOSERV', 'require_atfork_module', type=bool, default=False):
        # Hint goes to stderr, the import error itself to stdout.
        sys.stderr.write('Please run utils/build_externals.py\n')
        print(e)
        sys.exit(1)
mbligh9ff89cd2009-09-03 20:28:17 +000056
Dan Shia1ecd5c2013-06-06 11:21:31 -070057from autotest_lib.server import frontend
showard75cdfee2009-06-10 17:40:41 +000058from autotest_lib.server import server_logging_config
showard043c62a2009-06-10 19:48:57 +000059from autotest_lib.server import server_job, utils, autoserv_parser, autotest
Dan Shia1ecd5c2013-06-06 11:21:31 -070060from autotest_lib.server import utils as server_utils
Dan Shicf4d2032015-03-12 15:04:21 -070061from autotest_lib.site_utils import job_directories
Fang Deng042c1472014-10-23 13:56:41 -070062from autotest_lib.site_utils import job_overhead
Dan Shicf4d2032015-03-12 15:04:21 -070063from autotest_lib.site_utils import lxc
showard75cdfee2009-06-10 17:40:41 +000064from autotest_lib.client.common_lib import pidfile, logging_manager
Gabe Black1e1c41b2015-02-04 23:55:15 -080065from autotest_lib.client.common_lib.cros.graphite import autotest_stats
mbligh92c0fc22008-11-20 16:52:23 +000066
# Control segment to stage server-side package. The path is resolved once at
# import time and executed by _stage_ssp().
STAGE_SERVER_SIDE_PACKAGE_CONTROL_FILE = server_job._control_segment_path(
        'stage_server_side_package')
70
def log_alarm(signum, frame):
    """Signal handler for SIGALRM: log the event and terminate the process.

    @param signum: Number of the delivered signal (unused).
    @param frame: Stack frame that was interrupted (unused).

    @raises SystemExit: Always, with exit code 1.
    """
    # The handler exits, so the message must not claim the signal is ignored.
    logging.error("Received SIGALRM. Exiting with status 1.")
    sys.exit(1)
Alex Millerf1af17e2013-01-09 22:50:32 -080074
Dan Shicf4d2032015-03-12 15:04:21 -070075
76def _get_machines(parser):
77 """Get a list of machine names from command line arg -m or a file.
78
79 @param parser: Parser for the command line arguments.
80
81 @return: A list of machine names from command line arg -m or the
82 machines file specified in the command line arg -M.
83 """
84 if parser.options.machines:
85 machines = parser.options.machines.replace(',', ' ').strip().split()
86 else:
87 machines = []
88 machines_file = parser.options.machines_file
89 if machines_file:
90 machines = []
91 for m in open(machines_file, 'r').readlines():
92 # remove comments, spaces
93 m = re.sub('#.*', '', m).strip()
94 if m:
95 machines.append(m)
96 logging.debug('Read list of machines from file: %s', machines_file)
97 logging.debug('Machines: %s', ','.join(machines))
98
99 if machines:
100 for machine in machines:
101 if not machine or re.search('\s', machine):
102 parser.parser.error("Invalid machine: %s" % str(machine))
103 machines = list(set(machines))
104 machines.sort()
105 return machines
106
107
def _stage_ssp(parser):
    """Stage server-side package.

    Executes the stage_server_side_package control segment with the job's
    machines and the --image option in its namespace, then reads back the
    `ssp_url` variable the segment sets. The detail implementation could be
    different for each host type. Currently, only CrosHost has
    stage_server_side_package function defined.
    The segment yields None if no server-side package is available. However,
    it may raise exception if it failed for reasons other than artifact (the
    server-side package) not found.

    @param parser: Command line arguments parser passed in the autoserv process.

    @return: url of the staged server-side package. Return None if server-
             side package is not found for the build.
    """
    segment_globals = {'machines': _get_machines(parser),
                       'image': parser.options.image}
    segment_locals = {}
    execfile(STAGE_SERVER_SIDE_PACKAGE_CONTROL_FILE, segment_globals,
             segment_locals)
    return segment_locals['ssp_url']
129
130
def _run_with_ssp(container_name, job_id, results, parser, ssp_url):
    """Run the server job with server-side packaging.

    Sets up a test container, rewrites the current autoserv command line so
    its paths point inside the container, runs that command in the container
    and finally reports the outcome and destroys the container.

    @param container_name: Name of the container to run the test.
    @param job_id: ID of the test job.
    @param results: Folder to store results. This could be different from
                    parser.options.results:
                    parser.options.results  can be set to None for results to be
                                            stored in a temp folder.
                    results                 can be None for autoserv run requires no logging.
    @param parser: Command line parser that contains the options.
    @param ssp_url: url of the staged server-side package.
    """
    bucket = lxc.ContainerBucket()
    control = (parser.args[0] if len(parser.args) > 0 and parser.args[0] != ''
               else None)
    test_container = bucket.setup_test(container_name, job_id, ssp_url, results,
                                       control=control)
    args = sys.argv[:]
    args.remove('--require-ssp')

    # Result directory as seen from inside the container. Computed up front
    # because both the results and the parse_job paths map to it.
    container_result_dir = lxc.RESULT_DIR_FMT % job_id

    # A dictionary of paths to replace in the command line. Key is the path to
    # be replaced with the one in value.
    paths_to_replace = {}
    # Replace the control file path with the one in container.
    if control:
        container_control_filename = os.path.join(
                lxc.CONTROL_TEMP_PATH, os.path.basename(control))
        paths_to_replace[control] = container_control_filename
    # Update result directory with the one in container.
    if parser.options.results:
        paths_to_replace[parser.options.results] = container_result_dir
    # Update parse_job directory with the one in container. The assumption is
    # that the result folder to be parsed is always the same as the results_dir.
    if parser.options.parse_job:
        paths_to_replace[parser.options.parse_job] = container_result_dir

    args = [paths_to_replace.get(arg, arg) for arg in args]

    # Apply --use-existing-results, results directory is already created and
    # mounted in container. Apply this arg to avoid exception being raised.
    if '--use-existing-results' not in args:
        args.append('--use-existing-results')

    # Make sure autoserv running in container using a different pid file.
    if '--pidfile-label' not in args:
        args.extend(['--pidfile-label', 'container_autoserv'])

    cmd_line = ' '.join(["'%s'" % arg if ' ' in arg else arg for arg in args])
    logging.info('Run command in container: %s', cmd_line)
    success = False
    try:
        test_container.attach_run(cmd_line)
        success = True
    finally:
        try:
            counter_key = '%s.%s' % (lxc.STATS_KEY,
                                     'success' if success else 'fail')
            autotest_stats.Counter(counter_key).increment()
            # metadata is uploaded separately so it can use http to upload.
            metadata = {'drone': socket.gethostname(),
                        'job_id': job_id,
                        'success': success}
            autotest_es.post(use_http=True,
                             type_str=lxc.CONTAINER_RUN_TEST_METADB_TYPE,
                             metadata=metadata)
        finally:
            # Destroy the container even when reporting the outcome fails,
            # otherwise it would be leaked.
            test_container.destroy()
199
200
def run_autoserv(pid_file_manager, results, parser, ssp_url, use_ssp):
    """Run server job with given options.

    Detaches stdin, moves the process into its own process group, installs
    the signal handlers, builds the server job from the parsed options and
    then runs either one special task (repair, verify, provision, reset,
    cleanup) or the regular job. This function does not return: it always
    ends by calling sys.exit() with 0 on success or 1 when anything raised.

    @param pid_file_manager: PidFileManager used to monitor the autoserv process
    @param results: Folder to store results.
    @param parser: Parser for the command line arguments.
    @param ssp_url: Url to server-side package.
    @param use_ssp: Set to True to run with server-side packaging.
    """
    if parser.options.warn_no_ssp:
        # Post a warning in the log.
        logging.warn('Autoserv is required to run with server-side packaging. '
                     'However, no drone is found to support server-side '
                     'packaging. The test will be executed in a drone without '
                     'server-side packaging supported.')

    # send stdin to /dev/null
    dev_null = os.open(os.devnull, os.O_RDONLY)
    os.dup2(dev_null, sys.stdin.fileno())
    os.close(dev_null)

    # Create separate process group
    os.setpgrp()

    # Container name is predefined so the container can be destroyed in
    # handle_sigterm.
    job_or_task_id = job_directories.get_job_id_or_task_id(
            parser.options.results)
    container_name = (lxc.TEST_CONTAINER_NAME_FMT %
                      (job_or_task_id, time.time(), os.getpid()))

    # Implement SIGTERM handler
    def handle_sigterm(signum, frame):
        # Record the abort in the pid file, tear down the test container if
        # one is in use, then SIGKILL the whole process group (this process
        # included).
        logging.debug('Received SIGTERM')
        if pid_file_manager:
            pid_file_manager.close_file(1, signal.SIGTERM)
        logging.debug('Finished writing to pid_file. Killing process.')
        # TODO (sbasi) - remove the time.sleep when crbug.com/302815 is solved.
        # This sleep allows the pending output to be logged before the kill
        # signal is sent.
        time.sleep(.1)
        if use_ssp:
            logging.debug('Destroy container %s before aborting the autoserv '
                          'process.', container_name)
            try:
                bucket = lxc.ContainerBucket()
                container = bucket.get(container_name)
                if container:
                    container.destroy()
                else:
                    logging.debug('Container %s is not found.', container_name)
            except:
                # Handle any exception so the autoserv process can be aborted.
                logging.error('Failed to destroy container %s. Error: %s',
                              container_name, sys.exc_info())

        os.killpg(os.getpgrp(), signal.SIGKILL)

    # Set signal handler
    signal.signal(signal.SIGTERM, handle_sigterm)

    # faulthandler is only needed to debug in the Lab and is not available to
    # be imported in the chroot as part of VMTest, so Try-Except it.
    try:
        import faulthandler
        faulthandler.register(signal.SIGTERM, all_threads=True, chain=True)
        logging.debug('faulthandler registered on SIGTERM.')
    except ImportError:
        pass

    # Ignore SIGTTOU's generated by output from forked children.
    signal.signal(signal.SIGTTOU, signal.SIG_IGN)

    # If we received a SIGALARM, let's be loud about it.
    signal.signal(signal.SIGALRM, log_alarm)

    # Server side tests that call shell scripts often depend on $USER being set
    # but depending on how you launch your autotest scheduler it may not be set.
    os.environ['USER'] = getpass.getuser()

    # Pull every option used below into a local name.
    label = parser.options.label
    group_name = parser.options.group_name
    user = parser.options.user
    client = parser.options.client
    server = parser.options.server
    install_before = parser.options.install_before
    install_after = parser.options.install_after
    verify = parser.options.verify
    repair = parser.options.repair
    cleanup = parser.options.cleanup
    provision = parser.options.provision
    reset = parser.options.reset
    job_labels = parser.options.job_labels
    no_tee = parser.options.no_tee
    parse_job = parser.options.parse_job
    execution_tag = parser.options.execution_tag
    # Fall back to the parse_job value when no execution tag was given.
    if not execution_tag:
        execution_tag = parse_job
    host_protection = parser.options.host_protection
    ssh_user = parser.options.ssh_user
    ssh_port = parser.options.ssh_port
    ssh_pass = parser.options.ssh_pass
    collect_crashinfo = parser.options.collect_crashinfo
    control_filename = parser.options.control_filename
    test_retry = parser.options.test_retry
    verify_job_repo_url = parser.options.verify_job_repo_url
    skip_crash_collection = parser.options.skip_crash_collection
    ssh_verbosity = int(parser.options.ssh_verbosity)
    ssh_options = parser.options.ssh_options
    no_use_packaging = parser.options.no_use_packaging

    # can't be both a client and a server side test
    if client and server:
        parser.parser.error("Can not specify a test as both server and client!")

    if provision and client:
        parser.parser.error("Cannot specify provisioning and client!")

    # Special tasks do not need a control file argument.
    is_special_task = (verify or repair or cleanup or collect_crashinfo or
                       provision or reset)
    if len(parser.args) < 1 and not is_special_task:
        parser.parser.error("Missing argument: control file")

    if ssh_verbosity > 0:
        # ssh_verbosity is an integer between 0 and 3, inclusive
        ssh_verbosity_flag = '-' + 'v' * ssh_verbosity
    else:
        ssh_verbosity_flag = ''

    # We have a control file unless it's just a verify/repair/cleanup job
    if len(parser.args) > 0:
        control = parser.args[0]
    else:
        control = None

    machines = _get_machines(parser)
    if group_name and len(machines) < 2:
        parser.parser.error('-G %r may only be supplied with more than one '
                            'machine.' % group_name)

    kwargs = {'group_name': group_name, 'tag': execution_tag,
              'disable_sysinfo': parser.options.disable_sysinfo}
    if control_filename:
        kwargs['control_filename'] = control_filename
    job = server_job.server_job(control, parser.args[1:], results, label,
                                user, machines, client, parse_job,
                                ssh_user, ssh_port, ssh_pass,
                                ssh_verbosity_flag, ssh_options,
                                test_retry, **kwargs)

    job.logging.start_logging()
    job.init_parser()

    # perform checks
    job.precheck()

    # run the job
    exit_code = 0
    try:
        try:
            # At most one special task runs, picked in this fixed order;
            # otherwise the regular job runs.
            if repair:
                job.repair(host_protection, job_labels)
            elif verify:
                job.verify(job_labels)
            elif provision:
                job.provision(job_labels)
            elif reset:
                job.reset(job_labels)
            elif cleanup:
                job.cleanup(job_labels)
            else:
                if use_ssp:
                    try:
                        _run_with_ssp(container_name, job_or_task_id, results,
                                      parser, ssp_url)
                    finally:
                        # Update the ownership of files in result folder.
                        # TODO(dshi): crbug.com/459344 Skip following action
                        # when test container can be unprivileged container.
                        if results:
                            lxc.run('chown -R %s %s' % (os.getuid(), results))
                            lxc.run('chgrp -R %s %s' % (os.getgid(), results))
                else:
                    job.run(install_before, install_after,
                            verify_job_repo_url=verify_job_repo_url,
                            only_collect_crashinfo=collect_crashinfo,
                            skip_crash_collection=skip_crash_collection,
                            job_labels=job_labels,
                            use_packaging=(not no_use_packaging))
        finally:
            # Close every host the job still holds, whether or not it failed.
            while job.hosts:
                host = job.hosts.pop()
                host.close()
    except:
        # Bare except: any failure, including SystemExit raised by the job,
        # becomes exit code 1 with the traceback printed.
        exit_code = 1
        traceback.print_exc()

    if pid_file_manager:
        pid_file_manager.num_tests_failed = job.num_tests_failed
        pid_file_manager.close_file(exit_code)
    job.cleanup_parser()

    sys.exit(exit_code)
mbligha46678d2008-05-01 20:00:01 +0000404
405
def record_autoserv(options, duration_secs):
    """Record autoserv end-to-end time in metadata db.

    Nothing is recorded when more than one machine was given. A run without
    any machine is recorded under the host name 'hostless'.

    @param options: parser options.
    @param duration_secs: How long autoserv has taken, in secs.
    """
    # Get machine hostname
    machines = options.machines.replace(
            ',', ' ').strip().split() if options.machines else []
    num_machines = len(machines)
    if num_machines > 1:
        # Skip the case where atomic group is used.
        return
    elif num_machines == 0:
        machines.append('hostless')

    # Determine the status that will be reported.
    s = job_overhead.STATUS
    task_mapping = {
            'reset': s.RESETTING, 'verify': s.VERIFYING,
            'provision': s.PROVISIONING, 'repair': s.REPAIRING,
            'cleanup': s.CLEANING, 'collect_crashinfo': s.GATHERING}
    # Read the task flags straight off the options object instead of parsing
    # its string form, and build a real list so it can be indexed.
    match = [task for task in task_mapping
             if getattr(options, task, None) == True]
    status = task_mapping[match[0]] if match else s.RUNNING
    is_special_task = status not in [s.RUNNING, s.GATHERING]
    job_or_task_id = job_directories.get_job_id_or_task_id(options.results)
    job_overhead.record_state_duration(
            job_or_task_id, machines[0], status, duration_secs,
            is_special_task=is_special_task)
437
438
def main():
    """Entry point of autoserv.

    Parses the command line, optionally stages the server-side package,
    prepares the results directory and logging, opens the pid file, and then
    either mocks results (testing mode) or hands over to run_autoserv().
    The autoserv duration is recorded before the process exits.
    """
    start_time = datetime.datetime.now()
    # White list of tests with run time measurement enabled.
    measure_run_time_tests_names = global_config.global_config.get_config_value(
            'AUTOSERV', 'measure_run_time_tests', type=str)
    if measure_run_time_tests_names:
        measure_run_time_tests = [t.strip() for t in
                                  measure_run_time_tests_names.split(',')]
    else:
        measure_run_time_tests = []
    # grab the parser
    parser = autoserv_parser.autoserv_parser
    parser.parse_args()

    if len(sys.argv) == 1:
        parser.parser.print_help()
        sys.exit(1)

    # If the job requires to run with server-side package, try to stage server-
    # side package first. If that fails with error that autotest server package
    # does not exist, fall back to run the job without using server-side
    # packaging. If option warn_no_ssp is specified, that means autoserv is
    # running in a drone does not support SSP, thus no need to stage server-side
    # package.
    ssp_url = None
    ssp_url_warning = False
    if (not parser.options.warn_no_ssp and parser.options.require_ssp):
        ssp_url = _stage_ssp(parser)
        # The build does not have autotest server package. Fall back to not
        # to use server-side package. Logging is postponed until logging being
        # set up.
        ssp_url_warning = not ssp_url

    if parser.options.no_logging:
        results = None
    else:
        results = parser.options.results
        if not results:
            results = 'results.' + time.strftime('%Y-%m-%d-%H.%M.%S')
        results = os.path.abspath(results)
        resultdir_exists = False
        for filename in ('control.srv', 'status.log', '.autoserv_execute'):
            if os.path.exists(os.path.join(results, filename)):
                resultdir_exists = True
        if not parser.options.use_existing_results and resultdir_exists:
            error = "Error: results directory already exists: %s\n" % results
            sys.stderr.write(error)
            sys.exit(1)

        # Now that we certified that there's no leftover results dir from
        # previous jobs, lets create the result dir since the logging system
        # needs to create the log file in there.
        if not os.path.isdir(results):
            os.makedirs(results)

    # Server-side packaging will only be used if it's required and the package
    # is available. If warn_no_ssp is specified, it means that autoserv is
    # running in a drone does not have SSP supported and a warning will be logs.
    # Therefore, it should not run with SSP.
    use_ssp = (not parser.options.warn_no_ssp and parser.options.require_ssp
               and ssp_url)
    if use_ssp:
        log_dir = os.path.join(results, 'wrapper') if results else None
        if log_dir and not os.path.exists(log_dir):
            os.makedirs(log_dir)
    else:
        log_dir = results
    logging_manager.configure_logging(
            server_logging_config.ServerLoggingConfig(),
            results_dir=log_dir,
            use_console=not parser.options.no_tee,
            verbose=parser.options.verbose,
            no_console_prefix=parser.options.no_console_prefix)

    if ssp_url_warning:
        logging.warn(
                'Autoserv is required to run with server-side packaging. '
                'However, no server-side package can be found based on '
                '`--image`, host attribute job_repo_url or host label of '
                'cros-version. The test will be executed without '
                'server-side packaging supported.')

    if results:
        logging.info("Results placed in %s" % results)

        # wait until now to perform this check, so it get properly logged
        if (parser.options.use_existing_results and not resultdir_exists and
            not lxc.is_in_container()):
            logging.error("No existing results directory found: %s", results)
            sys.exit(1)

    logging.debug('autoserv is running in drone %s.', socket.gethostname())
    logging.debug('autoserv command was: %s', ' '.join(sys.argv))

    if parser.options.write_pidfile and results:
        pid_file_manager = pidfile.PidFileManager(parser.options.pidfile_label,
                                                  results)
        pid_file_manager.open_file()
    else:
        pid_file_manager = None

    autotest.BaseAutotest.set_install_in_tmpdir(
            parser.options.install_in_tmpdir)

    timer = None
    # Bind test_name up front: testing mode reads it below even when no
    # control file or machines were given (e.g. hostless jobs).
    test_name = None
    try:
        # Take the first argument as control file name, get the test name from
        # the control file. If the test name exists in the list of tests with
        # run time measurement enabled, start a timer to begin measurement.
        if (len(parser.args) > 0 and parser.args[0] != '' and
            parser.options.machines):
            try:
                test_name = control_data.parse_control(parser.args[0],
                                                       raise_warnings=True).name
            except control_data.ControlVariableException:
                logging.debug('Failed to retrieve test name from control file.')
                test_name = None
            if test_name in measure_run_time_tests:
                machines = parser.options.machines.replace(',', ' '
                                                           ).strip().split()
                try:
                    afe = frontend.AFE()
                    board = server_utils.get_board_from_afe(machines[0], afe)
                    timer = autotest_stats.Timer('autoserv_run_time.%s.%s' %
                                                 (board, test_name))
                    timer.start()
                except (urllib2.HTTPError, urllib2.URLError):
                    # Ignore error if RPC failed to get board
                    pass
    except control_data.ControlVariableException as e:
        logging.error(str(e))
    exit_code = 0
    # TODO(beeps): Extend this to cover different failure modes.
    # Testing exceptions are matched against labels sent to autoserv. Eg,
    # to allow only the hostless job to run, specify
    # testing_exceptions: test_suite in the shadow_config. To allow both
    # the hostless job and dummy_Pass to run, specify
    # testing_exceptions: test_suite,dummy_Pass. You can figure out
    # what label autoserv is invoked with by looking through the logs of a test
    # for the autoserv command's -l option.
    testing_exceptions = global_config.global_config.get_config_value(
            'AUTOSERV', 'testing_exceptions', type=list, default=[])
    test_mode = global_config.global_config.get_config_value(
            'AUTOSERV', 'testing_mode', type=bool, default=False)
    # Testing mode needs results_mocker to be importable and is switched off
    # for any label that matches a testing exception.
    test_mode = (results_mocker and test_mode and not
                 any([ex in parser.options.label
                      for ex in testing_exceptions]))
    is_task = (parser.options.verify or parser.options.repair or
               parser.options.provision or parser.options.reset or
               parser.options.cleanup or parser.options.collect_crashinfo)
    try:
        try:
            if test_mode:
                # The parser doesn't run on tasks anyway, so we can just return
                # happy signals without faking results.
                if not is_task:
                    machine = parser.options.results.split('/')[-1]

                    # TODO(beeps): The proper way to do this would be to
                    # refactor job creation so we can invoke job.record
                    # directly. To do that one needs to pipe the test_name
                    # through run_autoserv and bail just before invoking
                    # the server job. See the comment in
                    # puppylab/results_mocker for more context.
                    results_mocker.ResultsMocker(
                            test_name if test_name else 'unknown-test',
                            parser.options.results, machine
                            ).mock_results()
                return
            else:
                run_autoserv(pid_file_manager, results, parser, ssp_url,
                             use_ssp)
        except SystemExit as e:
            # run_autoserv() always finishes through sys.exit(); keep its code.
            exit_code = e.code
            if exit_code:
                logging.exception(e)
        except Exception as e:
            # If we don't know what happened, we'll classify it as
            # an 'abort' and return 1.
            logging.exception(e)
            exit_code = 1
    finally:
        if pid_file_manager:
            pid_file_manager.close_file(exit_code)
        if timer:
            timer.stop()
        # Record the autoserv duration time. Must be called
        # just before the system exits to ensure accuracy.
        duration_secs = (datetime.datetime.now() - start_time).total_seconds()
        record_autoserv(parser.options, duration_secs)
    sys.exit(exit_code)
mblighfaf0cd42007-11-19 16:00:24 +0000630
mblighbb421852008-03-11 22:36:16 +0000631
# Run autoserv only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()