Blame - site_utils/test_push.py - platform/external/autotest

2013-07-25 15:08:48 -0700

[diff] [blame]

#!/usr/bin/python

#

# Use of this source code is governed by a BSD-style license that can be

5

# found in the LICENSE file.

6

7

"""Tool to validate code in prod branch before pushing to lab.

8

9

The script runs push_to_prod suite to verify code in prod branch is ready to be

10

pushed. Link to design document:

11

https://docs.google.com/a/google.com/document/d/1JMz0xS3fZRSHMpFkkKAL_rxsdbNZomhHbC3B8L71uuI/edit

12

13

To verify if prod branch can be pushed to lab, run following command in

14

chromeos-autotest.cbf server:

Michael Liang

52d9f1f

2014-06-17 15:01:24 -0700

[diff] [blame]

15

/usr/local/autotest/site_utils/test_push.py -e someone@company.com

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

16

Shuqian Zhao

2016-09-21 11:02:15 -0700

[diff] [blame]

17

The script uses latest gandof stable build as test build by default.

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

"""

import argparse

Shuqian Zhao

2016-09-01 19:30:54 -0700

[diff] [blame]

22

import ast

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

23

import getpass

Dan Shi

2015-04-07 17:37:09 -0700

[diff] [blame]

24

import multiprocessing

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

import os

import re

import subprocess

import sys

Dan Shi

2015-04-07 17:37:09 -0700

[diff] [blame]

29

import time

30

import traceback

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

31

import urllib2

32

33

import common

Dan Shi

2014-05-09 15:18:15 -0700

[diff] [blame]

34

try:

35

from autotest_lib.frontend import setup_django_environment

36

from autotest_lib.frontend.afe import models

Shuqian Zhao

2016-09-12 10:42:03 -0700

[diff] [blame]

37

from autotest_lib.frontend.afe import rpc_utils

Dan Shi

2014-05-09 15:18:15 -0700

[diff] [blame]

38

except ImportError:

39

# Unittest may not have Django database configured and will fail to import.

40

pass

Dan Shi

2015-03-26 17:54:13 -0700

[diff] [blame]

41

from autotest_lib.client.common_lib import global_config

Shuqian Zhao

2016-09-12 10:42:03 -0700

[diff] [blame]

42

from autotest_lib.client.common_lib import priorities

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

43

from autotest_lib.server import site_utils

Shuqian Zhao

2016-09-12 10:42:03 -0700

[diff] [blame]

44

from autotest_lib.server import utils

Dan Shi

2014-12-22 16:25:05 -0800

[diff] [blame]

45

from autotest_lib.server.cros import provision

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

46

from autotest_lib.server.cros.dynamic_suite import frontend_wrappers

Dan Shi

2015-03-26 17:54:13 -0700

[diff] [blame]

47

from autotest_lib.site_utils import gmail_lib

Dan Shi

2014-12-22 16:25:05 -0800

[diff] [blame]

48

from autotest_lib.site_utils.suite_scheduler import constants

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

49

Shuqian Zhao

2016-08-31 19:23:17 -0700

[diff] [blame]

50

# Root of the autotest installation; used to locate the atest CLI.
AUTOTEST_DIR = '/usr/local/autotest'
CONFIG = global_config.global_config

# RPC clients used by every helper in this module.
AFE = frontend_wrappers.RetryingAFE(timeout_min=0.5, delay_sec=2)
TKO = frontend_wrappers.RetryingTKO(timeout_min=0.1, delay_sec=10)

MAIL_FROM = 'chromeos-test@google.com'
# Matches a build version such as R36-5881.0.0. Raw string so the regex
# escapes are not interpreted as (invalid) string escapes.
BUILD_REGEX = r'R[\d]+-[\d]+\.[\d]+\.[\d]+'
RUN_SUITE_COMMAND = 'run_suite.py'
PUSH_TO_PROD_SUITE = 'push_to_prod'
DUMMY_SUITE = 'dummy'
AU_SUITE = 'paygen_au_beta'
TESTBED_SUITE = 'testbed_push'
DEFAULT_TIMEOUT_MIN_FOR_SUITE_JOB = 30
IMAGE_BUCKET = CONFIG.get_config_value('CROS', 'image_storage_server')
# String form of a dict; parse_arguments() evaluates it with
# ast.literal_eval. Keys are board labels, values are required DUT counts.
DEFAULT_NUM_DUTS = "{'board:gandof': 4, 'board:quawks': 2}"

# Matched against each line of run_suite output; group 1 is the suite job id.
SUITE_JOB_START_INFO_REGEX = (r'^.*Created suite job:.*'
                              r'tab_id=view_job&object_id=(\d+)$')

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

69

70

# Expected outcome of every test in a suite. Each key is a regular expression
# that is searched for in the test name; each value is the status the matching
# test must report.
EXPECTED_TEST_RESULTS = {
    '^SERVER_JOB$': 'GOOD',
    # This is related to dummy_Fail/control.dependency.
    'dummy_Fail.dependency$': 'TEST_NA',
    'login_LoginSuccess.*': 'GOOD',
    'provision_AutoUpdate.double': 'GOOD',
    'dummy_Pass.*': 'GOOD',
    'dummy_Fail.Fail$': 'FAIL',
    'dummy_Fail.RetryFail$': 'FAIL',
    'dummy_Fail.RetrySuccess': 'GOOD',
    'dummy_Fail.Error$': 'ERROR',
    'dummy_Fail.Warn$': 'WARN',
    'dummy_Fail.NAError$': 'TEST_NA',
    'dummy_Fail.Crash$': 'GOOD',
}

# Expectations for the dummy suite.
EXPECTED_TEST_RESULTS_DUMMY = {
    '^SERVER_JOB$': 'GOOD',
    'dummy_Pass.*': 'GOOD',
    'dummy_Fail.Fail': 'FAIL',
    'dummy_Fail.Warn': 'WARN',
    'dummy_Fail.Crash': 'GOOD',
    'dummy_Fail.Error': 'ERROR',
    'dummy_Fail.NAError': 'TEST_NA',
}

# Expectations for the auto-update suite.
EXPECTED_TEST_RESULTS_AU = {
    'SERVER_JOB$': 'GOOD',
    'autoupdate_EndToEndTest.paygen_au_beta_delta.*': 'GOOD',
    'autoupdate_EndToEndTest.paygen_au_beta_full.*': 'GOOD',
}

# Expectations for the testbed suite.
EXPECTED_TEST_RESULTS_TESTBED = {
    '^SERVER_JOB$': 'GOOD',
    'testbed_DummyTest': 'GOOD',
}

# Expectations for the stand-alone powerwash job.
EXPECTED_TEST_RESULTS_POWERWASH = {
    'platform_Powerwash': 'GOOD',
    'SERVER_JOB': 'GOOD',
}

104

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

105

URL_HOST = CONFIG.get_config_value('SERVER', 'hostname', type=str)
URL_PATTERN = CONFIG.get_config_value('CROS', 'log_url_pattern', type=str)

# Some test could be missing from the test results for various reasons. Add
# such test in this list and explain the reason.
# Each entry must be spelled exactly like the key used in the expected-results
# dictionary, because verify_test_results() drops ignored entries from the set
# of missing keys by exact string match.
IGNORE_MISSING_TESTS = [
    # For latest build, npo_test_delta does not exist.
    'autoupdate_EndToEndTest.npo_test_delta.*',
    # For trybot build, nmo_test_delta does not exist.
    'autoupdate_EndToEndTest.nmo_test_delta.*',
    # Older build does not have login_LoginSuccess test in push_to_prod suite.
    # TODO(dshi): Remove following lines after R41 is stable.
    'login_LoginSuccess.*',
]

# Save all run_suite command output.
# Manager-backed lists: the suites run in child processes (see main()) and
# append to these, while the parent process reads them when reporting.
manager = multiprocessing.Manager()
run_suite_output = manager.list()
all_suite_ids = manager.list()

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

123

124

class TestPushException(Exception):
    """Error raised when the test for pushing to prod has failed."""

127

Dan Shi

2014-05-09 13:47:00 -0700

[diff] [blame]

128

Shuqian Zhao

2016-09-01 19:30:54 -0700

[diff] [blame]

129

def check_dut_inventory(required_num_duts):
    """Check DUT inventory for each board.

    Counts the hosts that are Ready and not locked, grouped by their board
    label, and compares the counts with the requirement.

    @param required_num_duts: a dict mapping a board label (e.g.
                              'board:gandof') to the number of DUTs that board
                              requires in order to finish push tests.
    @raise TestPushException: if number of DUTs are less than the requirement.
    """
    hosts = AFE.run('get_hosts', status='Ready', locked=False)

    current_inventory = {}
    for host in hosts:
        # A host is counted once, under its first board label. A host with no
        # board label cannot satisfy any requirement, so it is skipped instead
        # of aborting the whole check with an IndexError.
        board = next(
                (l for l in host['labels'] if l.startswith('board:')), None)
        if board is not None:
            current_inventory[board] = current_inventory.get(board, 0) + 1

    shortages = []
    for board, req_num in required_num_duts.items():
        curr_num = current_inventory.get(board, 0)
        if curr_num < req_num:
            shortages.append('\nRequire %d %s DUTs, only %d are Ready now' %
                             (req_num, board, curr_num))

    if shortages:
        raise TestPushException('Not enough DUTs to run push tests. %s' %
                                ''.join(shortages))

Shuqian Zhao

2016-09-12 10:42:03 -0700

[diff] [blame]

151

def powerwash_dut_to_test_repair(hostname, timeout):
    """Run the powerwash test on a DUT, then reverify it to exercise repair.

    A 'powerwash' server job is created from the platform_Powerwash control
    file and polled every 10 seconds until TKO reports test statuses for it.

    @param hostname: hostname of the dut.
    @param timeout: seconds of the powerwash test to hit timeout.
    @raise TestPushException: if DUT fail to run the test.
    """
    powerwash_test = models.Test.objects.get(name='platform_Powerwash')
    control_path = os.path.join(common.autotest_dir, powerwash_test.path)
    control_file = utils.read_file(control_path)
    job_id = rpc_utils.create_job_common(
            'powerwash', priority=priorities.Priority.SUPER,
            control_type='Server', control_file=control_file,
            hosts=[hostname])

    deadline = time.time() + timeout
    while True:
        if TKO.get_job_test_statuses_from_db(job_id):
            break
        if time.time() >= deadline:
            # Give up: abort the job before reporting the timeout.
            AFE.run('abort_host_queue_entries', job=job_id)
            raise TestPushException(
                    'Powerwash test on %s timeout after %ds, abort it.' %
                    (hostname, timeout))
        time.sleep(10)

    verify_test_results(job_id, EXPECTED_TEST_RESULTS_POWERWASH)
    # Kick off verify, verify will fail and a repair should be triggered.
    AFE.reverify_hosts(hostnames=[hostname])

Kevin Cheng

2015-12-11 09:45:57 -0800

[diff] [blame]

175

176

Shuqian Zhao

d2a99f0

2016-09-22 13:31:30 -0700

[diff] [blame]

177

def reverify_all_push_duts(pool):
    """Schedule a reverify for every host carrying the pool's label.

    @param pool: Name of the pool used by test_push.
    """
    hostnames = []
    for host in AFE.get_hosts(label=constants.Labels.POOL_PREFIX + pool):
        hostnames.append(host.hostname)
    AFE.reverify_hosts(hostnames=hostnames)

185

186

Shuqian Zhao

2016-08-31 19:23:17 -0700

[diff] [blame]

187

def get_default_build(board='gandof'):
    """Get the default build to be used for test.

    The stable version is queried from cautotest through the atest CLI. If
    the command cannot be run, exits with an error, or prints nothing that
    looks like a build version, the version from the global config is used.

    @param board: Name of board to be tested, default is gandof.
    @return: Build to be tested, e.g., gandof-release/R36-5881.0.0
    """
    # Argument list without a shell: the board name comes from the command
    # line and must not be interpreted by a shell.
    cmd = [os.path.join(AUTOTEST_DIR, 'cli', 'atest'),
           'stable_version', 'list',
           '--board=%s' % board,
           '-w', 'cautotest']
    try:
        result = subprocess.check_output(cmd).strip()
    except (subprocess.CalledProcessError, OSError) as e:
        # Without this the fallback below would never be reached when atest
        # itself fails.
        print('Failed to get stable version from cautotest: %s' % e)
        result = ''

    build = re.search(BUILD_REGEX, result)
    if build:
        return '%s-release/%s' % (board, build.group(0))

    # If fail to get stable version from cautotest, use that defined in config
    build = CONFIG.get_config_value('CROS', 'stable_cros_version')
    return '%s-release/%s' % (board, build)

204

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

205

def parse_arguments(argv=None):
    """Parse arguments for test_push tool.

    Builds left unspecified are filled in with get_default_build() for the
    corresponding board, and --num_duts is converted from its string form to
    a dict.

    @param argv: List of command line arguments to parse. Default is None,
                 in which case argparse reads sys.argv[1:].
    @return: Parsed arguments.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('-b', '--board', dest='board', default='gandof',
                        help='Default is gandof.')
    parser.add_argument('-sb', '--shard_board', dest='shard_board',
                        default='quawks',
                        help='Default is quawks.')
    parser.add_argument('-i', '--build', dest='build', default=None,
                        help='Default is the latest stable build of given '
                             'board. Must be a stable build, otherwise AU test '
                             'will fail. (ex: gandof-release/R54-8743.25.0)')
    parser.add_argument('-si', '--shard_build', dest='shard_build', default=None,
                        help='Default is the latest stable build of given '
                             'board. Must be a stable build, otherwise AU test '
                             'will fail.')
    parser.add_argument('-ab', '--android_board', dest='android_board',
                        help='Android board to test.')
    parser.add_argument('-ai', '--android_build', dest='android_build',
                        help='Android build to test.')
    parser.add_argument('-p', '--pool', dest='pool', default='bvt')
    parser.add_argument('-u', '--num', dest='num', type=int, default=3,
                        help='Run on at most NUM machines.')
    parser.add_argument('-e', '--email', dest='email', default=None,
                        help='Email address for the notification to be sent to '
                             'after the script finished running.')
    parser.add_argument('-t', '--timeout_min', dest='timeout_min', type=int,
                        default=DEFAULT_TIMEOUT_MIN_FOR_SUITE_JOB,
                        help='Time in mins to wait before abort the jobs we '
                             'are waiting on. Only for the asynchronous suites '
                             'triggered by create_and_return flag.')
    parser.add_argument('-ud', '--num_duts', dest='num_duts',
                        default=DEFAULT_NUM_DUTS,
                        help="String of dict that indicates the required number"
                             " of DUTs for each board. E.g {'board:gandof':4}")
    parser.add_argument('-c', '--continue_on_failure', action='store_true',
                        dest='continue_on_failure',
                        help='All tests continue to run when there is failure')

    arguments = parser.parse_args(argv)

    # Validate --num_duts before the (slower) default build lookup so that a
    # malformed value is reported as a usage error right away.
    try:
        num_duts = ast.literal_eval(arguments.num_duts)
    except (ValueError, SyntaxError) as e:
        parser.error('Invalid --num_duts value %r: %s' %
                     (arguments.num_duts, e))
    if not isinstance(num_duts, dict):
        parser.error('--num_duts must be the string form of a dict, got %r' %
                     arguments.num_duts)
    arguments.num_duts = num_duts

    # Get latest stable build as default build.
    if not arguments.build:
        arguments.build = get_default_build(arguments.board)
    if not arguments.shard_build:
        arguments.shard_build = get_default_build(arguments.shard_board)

    return arguments

Shuqian Zhao

2015-08-06 09:46:22 -0700

[diff] [blame]

261

def do_run_suite(suite_name, arguments, use_shard=False,
                 create_and_return=False, testbed_test=False):
    """Call run_suite to run a suite job, and return the suite job id.

    The script waits the suite job to finish before returning the suite job id.
    Also it will echo the run_suite output to stdout.

    @param suite_name: Name of a suite, e.g., dummy.
    @param arguments: Arguments for run_suite command.
    @param use_shard: If true, suite is scheduled for shard board.
    @param create_and_return: If True, run_suite just creates the suite, print
                              the job id, then finish immediately.
    @param testbed_test: True to run testbed test. Default is False.

    @return: Suite job ID.
    @raise TestPushException: If the suite job id cannot be found in the
                              run_suite output, or an asynchronous suite does
                              not finish within arguments.timeout_min minutes.
    """
    if use_shard and not testbed_test:
        board = arguments.shard_board
        build = arguments.shard_build
    elif testbed_test:
        board = arguments.android_board
        build = arguments.android_build
    else:
        board = arguments.board
        build = arguments.build

    # Remove cros-version label to force provision.
    hosts = AFE.get_hosts(label=constants.Labels.BOARD_PREFIX+board)
    for host in hosts:
        labels_to_remove = [
                label for label in host.labels
                if (label.startswith(provision.CROS_VERSION_PREFIX) or
                    label.startswith(provision.TESTBED_BUILD_VERSION_PREFIX))]
        if labels_to_remove:
            AFE.run('host_remove_labels', id=host.id, labels=labels_to_remove)

        # Test repair work flow on shards
        # NOTE(review): kept inside the per-host loop so that `host` is always
        # bound and each DUT of the board is powerwashed -- confirm this
        # matches the intended nesting.
        if use_shard and not create_and_return:
            powerwash_dut_to_test_repair(host.hostname, timeout=300)

    current_dir = os.path.dirname(os.path.realpath(__file__))
    cmd = [os.path.join(current_dir, RUN_SUITE_COMMAND),
           '-s', suite_name,
           '-b', board,
           '-i', build,
           '-p', arguments.pool,
           '-u', str(arguments.num)]
    if create_and_return:
        cmd += ['-c']
    if testbed_test:
        cmd += ['--run_prod_code']

    suite_job_id = None

    proc = subprocess.Popen(cmd, stdout=subprocess.PIPE,
                            stderr=subprocess.STDOUT)
    try:
        while True:
            line = proc.stdout.readline()
            # An empty read means end of output; no further line can arrive,
            # so stop reading rather than polling and echoing blank lines.
            if not line:
                break
            print(line.rstrip())
            run_suite_output.append(line.rstrip())

            if not suite_job_id:
                m = re.match(SUITE_JOB_START_INFO_REGEX, line)
                if m and m.group(1):
                    suite_job_id = int(m.group(1))
                    all_suite_ids.append(suite_job_id)
    finally:
        proc.stdout.close()
    # Make sure the run_suite process has completed before going on.
    proc.wait()

    if not suite_job_id:
        raise TestPushException('Failed to retrieve suite job ID.')

    # If create_and_return specified, wait for the suite to finish.
    if create_and_return:
        end = time.time() + arguments.timeout_min * 60
        while not AFE.get_jobs(id=suite_job_id, finished=True):
            if time.time() < end:
                time.sleep(10)
            else:
                AFE.run('abort_host_queue_entries', job=suite_job_id)
                raise TestPushException(
                        'Asynchronous suite triggered by create_and_return '
                        'flag has timed out after %d mins. Aborting it.' %
                        arguments.timeout_min)

    print('Suite job %s is completed.' % suite_job_id)
    return suite_job_id

Dan Shi

2014-05-09 15:18:15 -0700

[diff] [blame]

354

def check_dut_image(build, suite_job_id):
    """Verify that every DUT used by the suite carries the expected build.

    The hosts are found through the first host queue entry of each child job
    of the suite job.

    @param build: Expected build to be imaged.
    @param suite_job_id: job ID of the suite job.
    @raise TestPushException: If a DUT does not have expected build imaged.
    """
    print('Checking image installed in DUTs...')

    child_job_ids = []
    for job in models.Job.objects.filter(parent_job_id=suite_job_id):
        child_job_ids.append(job.id)

    first_entries = []
    for child_id in child_job_ids:
        entries = models.HostQueueEntry.objects.filter(job_id=child_id)
        first_entries.append(entries[0])

    # A set, so that a host used by several jobs is checked only once.
    hostnames = set()
    for entry in first_entries:
        hostnames.add(entry.host.hostname)

    for hostname in hostnames:
        found_build = site_utils.get_build_from_afe(hostname, AFE)
        if found_build == build:
            continue
        raise TestPushException('DUT is not imaged properly. Host %s has '
                                'build %s, while build %s is expected.' %
                                (hostname, found_build, build))

373

374

Shuqian Zhao

2015-08-06 09:46:22 -0700

[diff] [blame]

375

def test_suite(suite_name, expected_results, arguments, use_shard=False,
               create_and_return=False, testbed_test=False):
    """Run a suite through run_suite, then check DUT images and test results.

    @param suite_name: Name of a suite, e.g., dummy
    @param expected_results: A dictionary of test name to test result.
    @param arguments: Arguments for run_suite command.
    @param use_shard: If true, suite is scheduled for shard board.
    @param create_and_return: If True, run_suite just creates the suite, print
                              the job id, then finish immediately.
    @param testbed_test: True to run testbed test. Default is False.
    """
    suite_job_id = do_run_suite(suite_name, arguments, use_shard,
                                create_and_return, testbed_test)

    if testbed_test:
        build_expected = arguments.android_build
    else:
        build_expected = arguments.build

    # Confirm all DUTs used for the suite are imaged to expected build.
    # hqe.host_id for jobs running in shard is not synced back to master db,
    # therefore, skip verifying dut build for jobs running in shard.
    skip_image_check = suite_name == AU_SUITE or use_shard or testbed_test
    if not skip_image_check:
        check_dut_image(build_expected, suite_job_id)

    # Verify test results are the expected results.
    verify_test_results(suite_job_id, expected_results)

400

401

402

def verify_test_results(job_id, expected_results):
    """Verify the test results with the expected results.

    Three kinds of problems are collected: tests whose status differs from
    the expectation, tests that ran but match no expected key, and expected
    keys that matched no test (unless listed in IGNORE_MISSING_TESTS). The
    link to the job's log page is also checked to be loadable.

    @param job_id: id of the running jobs. For suite job, it is suite_job_id.
    @param expected_results: A dictionary of test name to test result. Keys
                             are regular expressions searched for in the test
                             name.
    @raise TestPushException: If verify fails.
    """
    print('Comparing test results...')
    test_views = site_utils.get_test_views_from_tko(job_id, TKO)

    mismatch_errors = []
    extra_test_errors = []

    found_keys = set()
    for test_name, test_status in test_views.items():
        print("%s%s" % (test_name.ljust(30), test_status))
        # platform_InstallTestImage test may exist in old builds.
        if re.search('platform_InstallTestImage_SERVER_JOB$', test_name):
            continue
        test_found = False
        for key, val in expected_results.items():
            if re.search(key, test_name):
                test_found = True
                found_keys.add(key)
                if val != test_status:
                    error = ('%s Expected: [%s], Actual: [%s]' %
                             (test_name, val, test_status))
                    mismatch_errors.append(error)
        if not test_found:
            extra_test_errors.append(test_name)

    # Expected keys that matched nothing, minus the ones allowed to be
    # missing. Sorted so that the report is the same from run to run.
    missing_test_errors = sorted(
            set(expected_results) - found_keys - set(IGNORE_MISSING_TESTS))

    summary = []
    if mismatch_errors:
        summary.append(('Results of %d test(s) do not match expected '
                        'values:') % len(mismatch_errors))
        summary.extend(mismatch_errors)
        summary.append('\n')

    if extra_test_errors:
        summary.append('%d test(s) are not expected to be run:' %
                       len(extra_test_errors))
        summary.extend(extra_test_errors)
        summary.append('\n')

    if missing_test_errors:
        summary.append('%d test(s) are missing from the results:' %
                       len(missing_test_errors))
        summary.extend(missing_test_errors)
        summary.append('\n')

    # Test link to log can be loaded.
    job_name = '%s-%s' % (job_id, getpass.getuser())
    log_link = URL_PATTERN % (URL_HOST, job_name)
    try:
        response = urllib2.urlopen(log_link)
        try:
            response.read()
        finally:
            # Do not leave the connection open once the page has been read.
            response.close()
    except urllib2.URLError:
        summary.append('Failed to load page for link to log: %s.' % log_link)

    if summary:
        raise TestPushException('\n'.join(summary))

469

470

Dan Shi

2015-04-07 17:37:09 -0700

[diff] [blame]

471

def test_suite_wrapper(queue, suite_name, expected_results, arguments,
                       use_shard=False, create_and_return=False,
                       testbed_test=False):
    """Run test_suite and hand anything it raises over to the parent process.

    @param queue: Queue to save exception to be accessed by parent process.
    @param suite_name: Name of a suite, e.g., dummy
    @param expected_results: A dictionary of test name to test result.
    @param arguments: Arguments for run_suite command.
    @param use_shard: If true, suite is scheduled for shard board.
    @param create_and_return: If True, run_suite just creates the suite, print
                              the job id, then finish immediately.
    @param testbed_test: True to run testbed test. Default is False.
    """
    try:
        test_suite(suite_name, expected_results, arguments, use_shard,
                   create_and_return, testbed_test)
    except:
        # Catch-all on purpose: whatever went wrong is reported through the
        # queue instead of propagating out of this function.
        error_type, error_value, error_tb = sys.exc_info()
        # Store the whole exc_info leads to a PicklingError, so only the
        # extracted form of the traceback is sent.
        frames = traceback.extract_tb(error_tb)
        queue.put((error_type, error_value, frames))

493

494

Dan Shi

2015-04-07 17:37:09 -0700

[diff] [blame]

495

def check_queue(queue):
    """Check the queue for any exception being raised.

    Returns without doing anything when the queue is empty. Otherwise one
    item is taken from the queue, its stack trace is printed and the
    exception is raised again in the calling process.

    @param queue: Queue used to store exception for parent process to access.
                  Each item is a tuple of (exception type, exception value,
                  traceback entries as returned by traceback.extract_tb).
    @raise: Any exception found in the queue.
    """
    if queue.empty():
        return
    except_type, except_value, extracted_tb = queue.get()
    # Raise the exception with original backtrace.
    # The backtrace arrives as a list of extracted entries; format it so the
    # output reads like a regular stack trace instead of the repr of a list.
    print('Original stack trace of the exception:\n%s' %
          ''.join(traceback.format_list(extracted_tb)))
    raise except_type(except_value)

507

508

Dan Shi

2013-07-25 15:08:48 -0700

[diff] [blame]

509

def main():
    """Run all push-test suites in parallel and report the outcome.

    Each suite runs in its own process through test_suite_wrapper; the first
    exception reported by any of them fails the whole run.
    """
    arguments = parse_arguments()

    try:
        # Use daemon flag will kill child processes when parent process fails.
        use_daemon = not arguments.continue_on_failure
        check_dut_inventory(arguments.num_duts)
        queue = multiprocessing.Queue()

        # One entry per suite process, in start order: the daemon flag and
        # the arguments passed to test_suite_wrapper after the queue.
        suite_specs = [
            (use_daemon,
             (PUSH_TO_PROD_SUITE, EXPECTED_TEST_RESULTS, arguments)),
            # TODO(dshi): Remove following line after crbug.com/267644 is
            # fixed.
            # Also, merge EXPECTED_TEST_RESULTS_AU to EXPECTED_TEST_RESULTS
            (use_daemon,
             (AU_SUITE, EXPECTED_TEST_RESULTS_AU, arguments)),
            # Suite scheduled for the shard board.
            (use_daemon,
             (DUMMY_SUITE, EXPECTED_TEST_RESULTS_DUMMY, arguments, True)),
            # suite test with --create_and_return flag; always a daemon.
            (True,
             (DUMMY_SUITE, EXPECTED_TEST_RESULTS_DUMMY, arguments, True,
              True)),
            # Test suite for testbed
            (use_daemon,
             (TESTBED_SUITE, EXPECTED_TEST_RESULTS_TESTBED, arguments, False,
              False, True)),
        ]

        suite_processes = []
        for daemon_flag, suite_args in suite_specs:
            process = multiprocessing.Process(
                    target=test_suite_wrapper,
                    args=(queue,) + suite_args)
            process.daemon = daemon_flag
            process.start()
            suite_processes.append(process)

        # Poll for a reported failure for as long as any suite still runs.
        while any(process.is_alive() for process in suite_processes):
            check_queue(queue)
            time.sleep(5)

        # One more check for a failure reported after the last poll.
        check_queue(queue)

        for process in suite_processes:
            process.join()
    except Exception as e:
        print('Test for pushing to prod failed:\n')
        print(str(e))
        # Abort running jobs when choose not to continue when there is failure.
        if not arguments.continue_on_failure:
            for suite_id in all_suite_ids:
                if AFE.get_jobs(id=suite_id, finished=False):
                    AFE.run('abort_host_queue_entries', job=suite_id)
        # Send out email about the test failure.
        if arguments.email:
            failure_body = ('Errors occurred during the test:\n\n%s\n\n' %
                            str(e) + '\n'.join(run_suite_output))
            gmail_lib.send_email(
                    arguments.email,
                    'Test for pushing to prod failed. Do NOT push!',
                    failure_body)
        raise
    finally:
        # Reverify all the hosts
        reverify_all_push_duts(arguments.pool)

    message = ('\nAll tests are completed successfully, prod branch is ready to'
               ' be pushed.')
    print(message)
    # Send out email about test completed successfully.
    if arguments.email:
        gmail_lib.send_email(
                arguments.email,
                'Test for pushing to prod completed successfully',
                message)

Dan Shi