Blame - server/cros/dynamic_suite/suite.py - platform/external/autotest

2012-08-15 14:25:53 -0700

[diff] [blame]

1

2

# Use of this source code is governed by a BSD-style license that can be

3

# found in the LICENSE file.

4

Fang Deng

2015-01-02 14:51:49 -0800

[diff] [blame]

5

import datetime

6

import difflib

Allen Li

98a26a4

2017-02-28 18:43:24 -0800

[diff] [blame]

7

import functools

Fang Deng

2015-01-02 14:51:49 -0800

[diff] [blame]

import hashlib

import logging

import operator

import os

import re

Fang Deng

2015-01-02 14:51:49 -0800

[diff] [blame]

13

import sys

Allen Li

98a26a4

2017-02-28 18:43:24 -0800

[diff] [blame]

14

import warnings

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

import common

J. Richard Barnette

2014-04-02 10:27:33 -0700

[diff] [blame]

18

from autotest_lib.frontend.afe.json_rpc import proxy

Alex Miller

2012-12-19 13:38:31 -0800

[diff] [blame]

19

from autotest_lib.client.common_lib import control_data

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

20

from autotest_lib.client.common_lib import enum

Dan Shi

dfea368

2014-08-10 23:38:40 -0700

[diff] [blame]

21

from autotest_lib.client.common_lib import error

Simran Basi

5ace6f2

2016-01-06 17:30:44 -0800

[diff] [blame]

22

from autotest_lib.client.common_lib import global_config

Alex Miller

7d658cf

2013-09-04 16:00:35 -0700

[diff] [blame]

23

from autotest_lib.client.common_lib import priorities

Dan Shi

dfea368

2014-08-10 23:38:40 -0700

[diff] [blame]

24

from autotest_lib.client.common_lib import time_utils

25

from autotest_lib.client.common_lib import utils

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

26

from autotest_lib.frontend.afe.json_rpc import proxy

Dan Shi

2014-10-10 13:38:51 -0700

[diff] [blame]

27

from autotest_lib.server.cros import provision

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

28

from autotest_lib.server.cros.dynamic_suite import constants

29

from autotest_lib.server.cros.dynamic_suite import control_file_getter

30

from autotest_lib.server.cros.dynamic_suite import frontend_wrappers

Alex Miller

2012-12-19 13:38:31 -0800

[diff] [blame]

31

from autotest_lib.server.cros.dynamic_suite import job_status

J. Richard Barnette

e7b98bb

2013-08-21 16:34:16 -0700

[diff] [blame]

32

from autotest_lib.server.cros.dynamic_suite import tools

33

from autotest_lib.server.cros.dynamic_suite.job_status import Status

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

34

Shuqian Zhao

ab46881

2015-04-08 14:40:38 -0700

[diff] [blame]

35

try:

36

from chromite.lib import boolparse_lib

37

from chromite.lib import cros_logging as logging

38

except ImportError:

39

print 'Unable to import chromite.'

40

print 'This script must be either:'

41

print ' - Be run in the chroot.'

42

print ' - (not yet supported) be run after running '

43

print ' ../utils/build_externals.py'

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

44

Shuqian Zhao

490f78f

2016-01-20 13:18:40 -0800

[diff] [blame]

45

# Suite names on the file-bug list. NOTE(review): the consumers of this list
# are outside this part of the file -- confirm usage before editing.
_FILE_BUG_SUITES = [
    'au',
    'bvt',
    'bvt-cq',
    'bvt-inline',
    'paygen_au_beta',
    'paygen_au_canary',
    'paygen_au_dev',
    'paygen_au_stable',
    'sanity',
    'push_to_prod',
]

# Value of the [SCHEDULER] drone_installation_directory global config option.
_AUTOTEST_DIR = global_config.global_config.get_config_value(
        'SCHEDULER', 'drone_installation_directory')

# Value of the [CROS] enable_getting_controls_in_batch global config option,
# read as a bool with a default of False.
ENABLE_CONTROLS_IN_BATCH = global_config.global_config.get_config_value(
        'CROS', 'enable_getting_controls_in_batch', type=bool, default=False)

Shuqian Zhao

e33ba4a

2015-09-11 18:51:43 -0700

[diff] [blame]

52

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

53

class RetryHandler(object):
    """Maintain retry information.

    @var _retry_map: A dictionary that stores retry history.
            The key is afe job id. The value is a dictionary.
            {job_id: {'state':RetryHandler.States, 'retry_max':int}}
            - state:
                The retry state of a job.
                NOT_ATTEMPTED:
                    We haven't done anything about the job.
                ATTEMPTED:
                    We've made an attempt to schedule a retry job. The
                    scheduling may or may not be successful, e.g.
                    it might encounter an rpc error. Note failure
                    in scheduling a retry is different from a retry job
                    failure. For each job, we only attempt to schedule a
                    retry once. For example, assume we have a test with
                    JOB_RETRIES=5 and its second retry job failed. When we
                    attempt to create a third retry job to retry the second,
                    we hit an rpc error. In such case, we will give up on
                    all following retries.
                RETRIED:
                    A retry job has already been successfully
                    scheduled.
            - retry_max:
                The maximum of times the job can still
                be retried, taking into account retries
                that have occurred.
    @var _retry_level: A retry might be triggered only if the result
            is worse than the level.
    @var _max_retries: Maximum retry limit at suite level.
            Regardless how many times each individual test
            has been retried, the total number of retries happening in
            the suite can't exceed _max_retries.
    """

    States = enum.Enum('NOT_ATTEMPTED', 'ATTEMPTED', 'RETRIED',
                       start_value=1, step=1)


    def __init__(self, initial_jobs_to_tests, retry_level='WARN',
                 max_retries=None):
        """Initialize RetryHandler.

        @param initial_jobs_to_tests: A dictionary that maps a job id to
                a ControlData object. This dictionary should contain
                jobs that are originally scheduled by the suite.
        @param retry_level: A retry might be triggered only if the result is
                worse than the level.
        @param max_retries: Integer, maximum total retries allowed
                for the suite. Default to None, no max.
        """
        self._retry_map = {}
        self._retry_level = retry_level
        # "No max" is modelled as a very large budget. sys.maxsize is
        # available on both Python 2.6+ and Python 3 (sys.maxint is not).
        if max_retries is None:
            max_retries = sys.maxsize
        self._max_retries = max_retries
        # Only tests that ask for at least one retry get a map entry.
        for job_id, test in initial_jobs_to_tests.items():
            if test.job_retries > 0:
                self._add_job(new_job_id=job_id,
                              retry_max=test.job_retries)


    def _add_job(self, new_job_id, retry_max):
        """Add a newly-created job to the retry map.

        @param new_job_id: The afe_job_id of a newly created job.
        @param retry_max: The maximum of times that we could retry
                the test if the job fails.

        @raises ValueError if new_job_id is already in retry map.

        """
        if new_job_id in self._retry_map:
            raise ValueError('add_job called when job is already in retry map.')

        self._retry_map[new_job_id] = {
                'state': self.States.NOT_ATTEMPTED,
                'retry_max': retry_max}


    def _suite_max_reached(self):
        """Return whether maximum retry limit for a suite has been reached."""
        return self._max_retries <= 0


    def add_retry(self, old_job_id, new_job_id):
        """Record a retry.

        Update retry map with the retry information. The old job is only
        marked as RETRIED, and the suite-level budget only decremented,
        once the new job has been added to the map, so a failure leaves the
        handler unchanged.

        @param old_job_id: The afe_job_id of the job that is retried.
        @param new_job_id: The afe_job_id of the retry job.

        @raises KeyError if old_job_id isn't in the retry map.
        @raises ValueError if we have already retried or made an attempt
                to retry the old job, or if new_job_id is already in the
                retry map.

        """
        old_record = self._retry_map[old_job_id]
        if old_record['state'] != self.States.NOT_ATTEMPTED:
            raise ValueError(
                    'We have already retried or attempted to retry job %d' %
                    old_job_id)
        # Register the new job first: _add_job may raise, and the old
        # record must not be flipped to RETRIED in that case.
        self._add_job(new_job_id=new_job_id,
                      retry_max=old_record['retry_max'] - 1)
        old_record['state'] = self.States.RETRIED
        self._max_retries -= 1


    def set_attempted(self, job_id):
        """Set the state of the job to ATTEMPTED.

        @param job_id: afe_job_id of a job.

        @raises KeyError if job_id isn't in the retry map.
        @raises ValueError if the current state is not NOT_ATTEMPTED.

        """
        record = self._retry_map[job_id]
        current_state = record['state']
        if current_state != self.States.NOT_ATTEMPTED:
            # We are supposed to retry or attempt to retry each job
            # only once. Raise an error if this is not the case.
            raise ValueError('Unexpected state transition: %s -> %s' %
                             (self.States.get_string(current_state),
                              self.States.get_string(self.States.ATTEMPTED)))
        record['state'] = self.States.ATTEMPTED


    def has_following_retry(self, result):
        """Check whether there will be a following retry.

        We have the following cases for a given job id (result.id),
            - no retry map entry -> retry not required, no following retry
            - has retry map entry:
                - already retried -> has following retry
                - has not retried
                    (this branch can be handled by checking
                     _should_retry(result))
                    - retry_max == 0 --> the last retry job, no more retry
                    - retry_max > 0
                       - attempted, but has failed in scheduling a
                         following retry due to rpc error --> no more retry
                       - has not attempted --> has following retry if test
                         failed.

        @param result: A result, encapsulating the status of the job.

        @returns: True, if there will be a following retry.
                  False otherwise.

        """
        return (result.test_executed
                and result.id in self._retry_map
                and (self._retry_map[result.id]['state'] == self.States.RETRIED
                     or self._should_retry(result)))


    def _should_retry(self, result):
        """Check whether we should retry a job based on its result.

        We will retry the job that corresponds to the result
        when all of the following are true.
        a) The test was actually executed, meaning that if
           a job was aborted before it could ever reach the state
           of 'Running', the job will not be retried.
        b) The result is worse than |self._retry_level| which
           defaults to 'WARN'.
        c) The test requires retry, i.e. the job has an entry in the retry map.
        d) We haven't made any retry attempt yet, i.e. state == NOT_ATTEMPTED
           Note that if a test has JOB_RETRIES=5, and the second time
           it was retried it hit an rpc error, we will give up on
           all following retries.
        e) The job has not reached its retry max, i.e. retry_max > 0
        f) The suite-level retry budget has not been used up.

        @param result: A result, encapsulating the status of the job.

        @returns: True if we should retry the job.

        """
        return (
            result.test_executed
            and result.id in self._retry_map
            and not self._suite_max_reached()
            and result.is_worse_than(
                job_status.Status(self._retry_level, '', 'reason'))
            and self._retry_map[result.id]['state'] == self.States.NOT_ATTEMPTED
            and self._retry_map[result.id]['retry_max'] > 0
        )


    def get_retry_max(self, job_id):
        """Get the maximum times the job can still be retried.

        @param job_id: afe_job_id of a job.

        @returns: An int, representing the maximum times the job can still be
                  retried.
        @raises KeyError if job_id isn't in the retry map.

        """
        return self._retry_map[job_id]['retry_max']

252

253

Allen Li

2017-02-28 13:09:40 -0800

[diff] [blame]

254

class _ExperimentalTestFilter(object):

255

"""Filter experimental tests."""

Allen Li

6b161c6

2017-02-28 13:08:54 -0800

[diff] [blame]

256

257

258

def __init__(self, tests, add_experimental=True):

259

"""Initialize instance.

260

261

@param tests: iterable of tests (ControlData objects)

262

@param add_experimental: schedule experimental tests as well, or not.

263

"""

264

self._tests = list(tests)

265

self._add_experimental = add_experimental

266

267

Allen Li

2017-02-28 13:09:40 -0800

[diff] [blame]

268

def get_tests_to_schedule(self):

Allen Li

6b161c6

2017-02-28 13:08:54 -0800

[diff] [blame]

269

"""Return a list of tests to be scheduled for this suite.

270

271

@returns: list of tests (ControlData objects)

272

"""

273

tests = self.stable_tests

274

if self._add_experimental:

275

for test in self.unstable_tests:

276

if not test.name.startswith(constants.EXPERIMENTAL_PREFIX):

277

test.name = constants.EXPERIMENTAL_PREFIX + test.name

tests.append(test)

return tests

@property

def stable_tests(self):

284

"""Non-experimental tests.

@returns: list

"""

return filter(lambda t: not t.experimental, self._tests)

@property

def unstable_tests(self):

293

"""Experimental tests.

@returns: list

"""

return filter(lambda t: t.experimental, self._tests)

298

299

Allen Li

da198fd

2017-03-29 17:22:13 -0700

[diff] [blame]

300

class _SuiteChildJobCreator(object):
    """Create test jobs for a suite."""


    def __init__(
            self,
            tag,
            builds,
            board,
            afe=None,
            max_runtime_mins=24*60,
            timeout_mins=24*60,
            suite_job_id=None,
            ignore_deps=False,
            extra_deps=(),
            priority=priorities.Priority.DEFAULT,
            offload_failures_only=False,
            test_source_build=None):
        """
        Constructor

        @param tag: a string with which to tag jobs run in this suite.
        @param builds: the builds on which we're running this suite.
        @param board: the board on which we're running this suite.
        @param afe: an instance of AFE as defined in server/frontend.py.
                A frontend_wrappers.RetryingAFE is created when omitted.
        @param max_runtime_mins: Maximum suite runtime, in minutes.
        @param timeout_mins: Maximum job lifetime, in minutes.
        @param suite_job_id: Job id that will act as parent id to all sub jobs.
                             Default: None
        @param ignore_deps: True if jobs should ignore the DEPENDENCIES
                            attribute and skip applying of dependency labels.
                            (Default:False)
        @param extra_deps: A list of strings which are the extra DEPENDENCIES
                           to add to each test being scheduled.
        @param priority: Integer priority level.  Higher is more important.
        @param offload_failures_only: Only enable gs_offloading for failed
                                      jobs.
        @param test_source_build: Build that contains the server-side test code.
        """
        self._tag = tag
        self._builds = builds
        self._board = board
        self._afe = afe or frontend_wrappers.RetryingAFE(timeout_min=30,
                                                         delay_sec=10,
                                                         debug=False)
        self._max_runtime_mins = max_runtime_mins
        self._timeout_mins = timeout_mins
        self._suite_job_id = suite_job_id
        self._ignore_deps = ignore_deps
        # Stored as a tuple so the caller's sequence is never aliased.
        self._extra_deps = tuple(extra_deps)
        self._priority = priority
        self._offload_failures_only = offload_failures_only
        self._test_source_build = test_source_build


    @property
    def cros_build(self):
        """Return the CrOS build or the first build in the builds dict.

        @raises IndexError if there is no CrOS build and the builds dict
                is empty.
        """
        if provision.CROS_VERSION_PREFIX in self._builds:
            return self._builds[provision.CROS_VERSION_PREFIX]
        # TODO(ayatane): Note that the builds dict isn't ordered.  I'm not
        # sure what the implications of this are, but it's probably not a
        # good thing.
        # The fallback is computed only when needed, and list() keeps the
        # indexing valid where dict.values() returns a view (Python 3).
        return list(self._builds.values())[0]


    def create_job(self, test, retry_for=None):
        """
        Thin wrapper around frontend.AFE.create_job().

        @param test: ControlData object for a test to run.
        @param retry_for: If the to-be-created job is a retry for an
                          old job, the afe_job_id of the old job will
                          be passed in as |retry_for|, which will be
                          recorded in the new job's keyvals.
        @returns: A frontend.Job object with an added test_name member.
                  test_name is used to preserve the higher level TEST_NAME
                  name of the job.
        """
        job_name = tools.create_job_name(
                self._test_source_build or self.cros_build,
                self._tag,
                test.name)
        test_obj = self._afe.create_job(
            control_file=test.text,
            name=job_name,
            control_type=test.test_type.capitalize(),
            # One meta host entry per machine the test synchronizes on.
            meta_hosts=[self._board]*test.sync_count,
            dependencies=self._create_job_deps(test),
            keyvals=self._create_keyvals_for_test_job(test, retry_for),
            max_runtime_mins=self._max_runtime_mins,
            timeout_mins=self._timeout_mins,
            parent_job_id=self._suite_job_id,
            test_retry=test.retries,
            priority=self._priority,
            synch_count=test.sync_count,
            require_ssp=test.require_ssp)

        test_obj.test_name = test.name
        return test_obj


    def _create_job_deps(self, test):
        """Create job deps list for a test job.

        The test's own dependencies are dropped when ignore_deps was set;
        the extra deps are appended either way.

        @param test: ControlData object for a test to run.
        @returns: A list of dependency strings.
        """
        if self._ignore_deps:
            job_deps = []
        else:
            job_deps = list(test.dependencies)
        job_deps.extend(self._extra_deps)
        return job_deps


    def _create_keyvals_for_test_job(self, test, retry_for=None):
        """Create keyvals dict for creating a test job.

        @param test: ControlData object for a test to run.
        @param retry_for: If the to-be-created job is a retry for an
                          old job, the afe_job_id of the old job will
                          be passed in as |retry_for|, which will be
                          recorded in the new job's keyvals.
        @returns: A keyvals dict for creating the test job.
        """
        cros_build = self.cros_build
        keyvals = {
            constants.JOB_BUILD_KEY: cros_build,
            constants.JOB_SUITE_KEY: self._tag,
            constants.JOB_EXPERIMENTAL_KEY: test.experimental,
            constants.JOB_BUILDS_KEY: self._builds
        }
        # test_source_build is saved to job_keyvals so scheduler can retrieve
        # the build name from database when compiling autoserv commandline.
        # This avoid a database change to add a new field in afe_jobs.
        #
        # Only add `test_source_build` to job keyvals if the build is different
        # from the CrOS build or the job uses more than one build, e.g., both
        # firmware and CrOS will be updated in the dut.
        # This is for backwards compatibility, so the update Autotest code can
        # compile an autoserv command line to run in a SSP container using
        # previous builds.
        if (self._test_source_build and
                (cros_build != self._test_source_build or
                 len(self._builds) > 1)):
            keyvals[constants.JOB_TEST_SOURCE_BUILD_KEY] = \
                    self._test_source_build
            # Firmware builds are only recorded together with
            # test_source_build. items() works on Python 2 and 3.
            for prefix, build in self._builds.items():
                if prefix == provision.FW_RW_VERSION_PREFIX:
                    keyvals[constants.FWRW_BUILD] = build
                elif prefix == provision.FW_RO_VERSION_PREFIX:
                    keyvals[constants.FWRO_BUILD] = build
        # Add suite job id to keyvals so tko parser can read it from keyval
        # file.
        if self._suite_job_id:
            keyvals[constants.PARENT_JOB_ID] = self._suite_job_id
        # We drop the old job's id in the new job's keyval file so that
        # later our tko parser can figure out the retry relationship and
        # invalidate the results of the old job in tko database.
        if retry_for:
            keyvals[constants.RETRY_ORIGINAL_JOB_ID] = retry_for
        if self._offload_failures_only:
            keyvals[constants.JOB_OFFLOAD_FAILURES_KEY] = True
        return keyvals

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

462

def _get_cf_retriever(cf_getter, forgiving_parser=True, run_prod_code=False,
                      test_args=None):
    """Return the correct _ControlFileRetriever instance.

    A _BatchControlFileRetriever is built when _should_batch_with(cf_getter)
    is true; it obtains control files and their contents in batch through
    cf_getter.get_suite_info(). Otherwise a plain _ControlFileRetriever is
    built, which lists the control files and fetches each one through the
    getter.

    @param cf_getter: a control_file_getter.ControlFileGetter used to list
                      and fetch the content of control files
    @param forgiving_parser: passed through to the retriever.
    @param run_prod_code: passed through to the retriever.
    @param test_args: passed through to the retriever.

    @returns: a _ControlFileRetriever (or subclass) instance.
    """
    retriever_cls = (_BatchControlFileRetriever
                     if _should_batch_with(cf_getter)
                     else _ControlFileRetriever)
    return retriever_cls(cf_getter, forgiving_parser, run_prod_code, test_args)

Allen Li

65258bf

2017-03-10 16:20:11 -0800

[diff] [blame]

485

486

Allen Li

ce93df7

2017-03-10 16:38:30 -0800

[diff] [blame]

487

def _should_batch_with(cf_getter):
    """Return whether control files should be fetched in batch.

    Batching requires both the ENABLE_CONTROLS_IN_BATCH configuration
    option and a getter that is a control_file_getter.DevServerGetter.

    @param cf_getter: a control_file_getter.ControlFileGetter used to list
                      and fetch the content of control files
    """
    if not ENABLE_CONTROLS_IN_BATCH:
        # Batching is switched off in the config; the getter is irrelevant.
        return ENABLE_CONTROLS_IN_BATCH
    return isinstance(cf_getter, control_file_getter.DevServerGetter)

497

498

Allen Li

2017-03-10 16:11:53 -0800

[diff] [blame]

499

class _ControlFileRetriever(object):

500

"""Retrieves control files.

501

502

This returns control data instances, unlike control file getters

503

which simply return the control file text contents.

Allen Li

066f587

2017-02-28 13:30:44 -0800

[diff] [blame]

504

"""

Allen Li

066f587

2017-02-28 13:30:44 -0800

[diff] [blame]

505

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

506

def __init__(self, cf_getter, forgiving_parser=True, run_prod_code=False,

507

test_args=None):

Allen Li

3674697

2017-03-10 16:17:46 -0800

[diff] [blame]

508

"""Initialize instance.

509

510

@param cf_getter: a control_file_getter.ControlFileGetter used to list

511

and fetch the content of control files

Allen Li

2017-03-10 16:11:53 -0800

[diff] [blame]

512

@param forgiving_parser: If False, will raise ControlVariableExceptions

513

if any are encountered when parsing control

514

files. Note that this can raise an exception

515

for syntax errors in unrelated files, because

516

we parse them before applying the predicate.

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

517

@param run_prod_code: If true, the retrieved tests will run the test

518

code that lives in prod aka the test code

519

currently on the lab servers by disabling

520

SSP for the discovered tests.

Allen Li

2017-03-10 16:11:53 -0800

[diff] [blame]

521

@param test_args: A dict of args to be seeded in test control file under

522

the name |args_dict|.

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

523

"""

524

self._cf_getter = cf_getter

525

self._forgiving_parser = forgiving_parser

526

self._run_prod_code = run_prod_code

527

self._test_args = test_args

528

529

530

def retrieve_for_suite(self, suite_name=''):

531

"""Scan through all tests and find all tests.

532

533

@param suite_name: If specified, this method will attempt to restrain

534

the search space to just this suite's control files.

Allen Li

066f587

2017-02-28 13:30:44 -0800

[diff] [blame]

535

Allen Li

2017-03-10 16:11:53 -0800

[diff] [blame]

536

@raises ControlVariableException: If forgiving_parser is False and there

537

is a syntax error in a control file.

538

539

@returns a dictionary of ControlData objects that based on given

540

parameters.

541

"""

Allen Li

2017-03-10 16:36:38 -0800

[diff] [blame]

542

control_file_texts = self._get_control_file_texts_for_suite(suite_name)

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

543

return self._parse_control_file_texts(control_file_texts)

Allen Li

9d0be12

2017-02-28 14:13:04 -0800

[diff] [blame]

544

545

Allen Li

374c1b6

2017-03-10 16:29:02 -0800

[diff] [blame]

546

def _filter_cf_paths(self, paths):

547

"""Remove certain control file paths

548

549

@param paths: Iterable of paths

550

@returns: generator yielding paths

551

"""

552

matcher = re.compile(r'[^/]+/(deps|profilers)/.+')

553

return (path for path in paths if not matcher.match(path))

554

555

Allen Li

2017-03-10 16:36:38 -0800

[diff] [blame]

556

def _get_control_file_texts_for_suite(self, suite_name):

557

"""Get control file content for given suite.

558

559

@param suite_name: If specified, this method will attempt to restrain

560

the search space to just this suite's control files.

Allen Li

2017-03-10 16:40:52 -0800

[diff] [blame]

561

@returns: generator yielding (path, text) tuples

Allen Li

2017-03-10 16:36:38 -0800

[diff] [blame]

562

"""

Allen Li

2017-03-10 16:37:57 -0800

[diff] [blame]

563

files = self._cf_getter.get_control_file_list(suite_name=suite_name)

564

filtered_files = self._filter_cf_paths(files)

Allen Li

2017-03-10 16:40:52 -0800

[diff] [blame]

565

for path in filtered_files:

566

yield path, self._cf_getter.get_control_file_contents(path)

Allen Li

2017-03-10 16:36:38 -0800

[diff] [blame]

567

568

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

569

def _parse_control_file_texts(self, control_file_texts):

Allen Li

2017-03-10 16:58:49 -0800

[diff] [blame]

570

"""Parse control file texts.

571

572

@param control_file_texts: iterable of (path, text) pairs

Allen Li

2017-03-10 16:58:49 -0800

[diff] [blame]

573

@returns: a dictionary of ControlData objects

574

"""

575

tests = {}

576

for path, text in control_file_texts:

577

# Seed test_args into the control file.

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

578

if self._test_args:

579

text = tools.inject_vars(self._test_args, text)

Allen Li

2017-03-10 16:58:49 -0800

[diff] [blame]

580

try:

581

found_test = control_data.parse_control_string(

582

text, raise_warnings=True, path=path)

583

except control_data.ControlVariableException, e:

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

584

if not self._forgiving_parser:

Allen Li

2017-03-10 16:58:49 -0800

[diff] [blame]

585

msg = "Failed parsing %s\n%s" % (path, e)

586

raise control_data.ControlVariableException(msg)

587

logging.warning("Skipping %s\n%s", path, e)

588

except Exception, e:

589

logging.error("Bad %s\n%s", path, e)

590

else:

591

found_test.text = text

Allen Li

2017-03-14 13:36:26 -0700

[diff] [blame]

592

if self._run_prod_code:

Allen Li

2017-03-10 16:58:49 -0800

[diff] [blame]

593

found_test.require_ssp = False

594

tests[path] = found_test

return tests

Allen Li

2017-03-10 16:32:38 -0800

[diff] [blame]

598

class _BatchControlFileRetriever(_ControlFileRetriever):
    """Subclass that can retrieve suite control files in batch."""


    def _get_control_file_texts_for_suite(self, suite_name):
        """Get control file content for given suite.

        All paths and contents come from a single
        cf_getter.get_suite_info() call; the paths are then filtered with
        _filter_cf_paths().

        @param suite_name: If specified, this method will attempt to restrain
                           the search space to just this suite's control files.
        @returns: generator yielding (path, text) tuples
        """
        text_by_path = self._cf_getter.get_suite_info(suite_name=suite_name)
        for cf_path in self._filter_cf_paths(text_by_path.keys()):
            yield cf_path, text_by_path[cf_path]

614

615

Allen Li

1865f63

2017-03-09 15:58:52 -0800

[diff] [blame]

616

def get_test_source_build(builds, **dargs):
    """Get the build of test code.

    The keyword argument `test_source_build` wins when it is present and
    truthy. Otherwise the ChromeOS build from |builds| is used. If that is
    missing or empty too, SuiteArgumentException is raised.

    @param builds: the builds on which we're running this suite. It's a
                   dictionary of version_prefix:build.
    @param **dargs: Any other Suite constructor parameters, as described
                    in Suite.__init__ docstring.

    @return: The build contains the test code.
    @raise: SuiteArgumentException if both test_source_build and ChromeOS
            build are not specified.

    """
    explicit_build = dargs.get('test_source_build')
    if explicit_build:
        return explicit_build

    cros_build = builds.get(provision.CROS_VERSION_PREFIX)
    if cros_build:
        return cros_build

    raise error.SuiteArgumentException(
            'test_source_build must be specified if CrOS build is not '
            'specified.')

642

643

Allen Li

122cd09

2017-03-09 15:56:46 -0800

[diff] [blame]

644

def list_all_suites(build, devserver, cf_getter=None):
    """
    Collect every suite name referenced by the discoverable control files.

    All control files (experimental ones included) are parsed and the
    entries of each test's suite_tag_parts are merged into one set.

    @param build: the build on which we're running this suite.
    @param devserver: the devserver which contains the build.
    @param cf_getter: control_file_getter.ControlFileGetter. Defaults to
                      using DevServerGetter.

    @return list of suites (duplicates removed, order unspecified)
    """
    if cf_getter is None:
        cf_getter = _create_ds_getter(build, devserver)

    def _accept_all(_test):
        """Predicate that keeps every parsed control file."""
        return True

    suite_names = set()
    parsed_tests = find_and_parse_tests(cf_getter, _accept_all,
                                        add_experimental=True)
    for parsed in parsed_tests:
        suite_names.update(parsed.suite_tag_parts)
    return list(suite_names)

Allen Li

2017-03-09 15:52:33 -0800

[diff] [blame]

667

def test_file_similarity_predicate(test_file_pattern):

668

"""Returns predicate that gets the similarity based on a test's file

669

name pattern.

670

671

Builds a predicate that takes in a parsed control file (a ControlData)

672

and returns a tuple of (file path, ratio), where ratio is the

673

similarity between the test file name and the given test_file_pattern.

674

675

@param test_file_pattern: regular expression (string) to match against

676

control file names.

677

@return a callable that takes a ControlData and and returns a tuple of

678

(file path, ratio), where ratio is the similarity between the

679

test file name and the given test_file_pattern.

680

"""

681

return lambda t: ((None, 0) if not hasattr(t, 'path') else

682

(t.path, difflib.SequenceMatcher(a=t.path,

683

b=test_file_pattern).ratio()))

684

685

Allen Li

b5b4a7a

2017-03-09 15:50:09 -0800

[diff] [blame]

686

def test_name_similarity_predicate(test_name):

687

"""Returns predicate that matched based on a test's name.

688

689

Builds a predicate that takes in a parsed control file (a ControlData)

690

and returns a tuple of (test name, ratio), where ratio is the similarity

691

between the test name and the given test_name.

692

693

@param test_name: the test name to base the predicate on.

694

@return a callable that takes a ControlData and returns a tuple of

695

(test name, ratio), where ratio is the similarity between the

696

test name and the given test_name.

697

"""

698

return lambda t: ((None, 0) if not hasattr(t, 'name') else

699

(t.name,

700

difflib.SequenceMatcher(a=t.name, b=test_name).ratio()))

701

702

Allen Li

e37d6ba

2017-03-09 15:49:25 -0800

[diff] [blame]

703

def matches_attribute_expression_predicate(test_attr_boolstr):
    """Build a predicate evaluating a boolean expression over attributes.

    The returned callable takes a parsed control file (a ControlData) and
    returns whatever boolparse_lib.BoolstrResult yields for the expression
    and the test's `attributes`.

    @param test_attr_boolstr: boolean expression of the attributes to be
                              tested, like 'system:all and interval:daily'.

    @return a callable that takes a ControlData and returns True if the test
            attributes satisfy the given boolean expression.
    """
    def _attributes_match(test):
        return boolparse_lib.BoolstrResult(test_attr_boolstr,
                                           test.attributes)

    return _attributes_match

719

720

Allen Li

f29b48a

2017-03-09 15:48:41 -0800

[diff] [blame]

721

def test_file_matches_pattern_predicate(test_file_pattern):

722

"""Returns predicate that matches based on a test's file name pattern.

723

724

Builds a predicate that takes in a parsed control file (a ControlData)

725

and returns True if the test's control file name matches the given

726

regular expression.

727

728

@param test_file_pattern: regular expression (string) to match against

729

control file names.

730

@return a callable that takes a ControlData and and returns

731

True if control file name matches the pattern.

732

"""

733

return lambda t: hasattr(t, 'path') and re.match(test_file_pattern,

t.path)

Allen Li

2017-03-09 15:47:25 -0800

[diff] [blame]

737

def test_name_matches_pattern_predicate(test_name_pattern):

738

"""Returns predicate that matches based on a test's name pattern.

739

740

Builds a predicate that takes in a parsed control file (a ControlData)

741

and returns True if the test name matches the given regular expression.

742

743

@param test_name_pattern: regular expression (string) to match against

744

test names.

745

@return a callable that takes a ControlData and returns

746

True if the name fields matches the pattern.

747

"""

748

return lambda t: hasattr(t, 'name') and re.match(test_name_pattern,

t.name)

Allen Li

2017-03-09 15:46:32 -0800

[diff] [blame]

752

def test_name_equals_predicate(test_name):

753

"""Returns predicate that matched based on a test's name.

754

755

Builds a predicate that takes in a parsed control file (a ControlData)

756

and returns True if the test name is equal to |test_name|.

757

758

@param test_name: the test name to base the predicate on.

759

@return a callable that takes a ControlData and looks for |test_name|

760

in that ControlData's name.

761

"""

762

return lambda t: hasattr(t, 'name') and test_name == t.name

763

764

Allen Li

6e2fa4f

2017-03-09 15:45:43 -0800

[diff] [blame]

765

def name_in_tag_similarity_predicate(name):
    """Build a predicate scoring each of a test's suites against |name|.

    The returned callable takes a parsed control file (a ControlData) and
    returns a list of (suite name, ratio) tuples, one per entry of the
    test's suite_tag_parts. Each ratio is the difflib.SequenceMatcher
    similarity between that suite and the given name.

    @param name: the suite name to base the predicate on.
    @return a callable that takes a ControlData and returns a list of tuples
            of (suite name, ratio); a test that lists no suites yields
            [(None, 0)].
    """
    def _suite_similarities(test):
        scored = []
        for suite in test.suite_tag_parts:
            matcher = difflib.SequenceMatcher(a=suite, b=name)
            scored.append((suite, matcher.ratio()))
        # Fall back to a single placeholder entry when nothing was scored.
        return scored or [(None, 0)]

    return _suite_similarities

783

784

Allen Li

398ddbd

2017-03-09 15:44:25 -0800

[diff] [blame]

785

def name_in_tag_predicate(name):
    """Build a predicate that looks for |name| among a test's suites.

    The returned callable takes a parsed control file (a ControlData) and
    returns True if |name| is contained in its suite_tag_parts.

    @param name: the suite name to base the predicate on.
    @return a callable that takes a ControlData and looks for |name| in that
            ControlData object's suite_tag_parts.
    """
    def _lists_suite(test):
        return name in test.suite_tag_parts

    return _lists_suite

796

797

Allen Li

a640d6d

2017-03-09 15:41:35 -0800

[diff] [blame]

798

def create_fs_getter(autotest_dir):
    """
    Create a getter that reads control files from the local filesystem.

    @param autotest_dir: the place to find autotests.
    @return a FileSystemGetter instance that looks under |autotest_dir|.
    """
    # currently hard-coded places to look for tests.
    search_roots = []
    for subpath in ('server/site_tests', 'client/site_tests',
                    'server/tests', 'client/tests'):
        search_roots.append(os.path.join(autotest_dir, subpath))
    return control_file_getter.FileSystemGetter(search_roots)

808

809

Allen Li

0f91587

2017-02-28 18:51:04 -0800

[diff] [blame]

810

def _create_ds_getter(build, devserver):
    """
    Create a getter that reads control files through a devserver.

    @param build: the build on which we're running this suite.
    @param devserver: the devserver which contains the build.
    @return a DevServerGetter instance constructed from |build| and
            |devserver|.
    """
    ds_getter = control_file_getter.DevServerGetter(build, devserver)
    return ds_getter

817

818

Allen Li

0b1fa38

2017-02-28 18:47:16 -0800

[diff] [blame]

819

def find_and_parse_tests(cf_getter, predicate, suite_name='',
                         add_experimental=False, forgiving_parser=True,
                         run_prod_code=False, test_args=None):
    """
    Function to scan through all tests and find eligible tests.

    Control files are retrieved and parsed for |suite_name| via a retriever
    built from |cf_getter|. Experimental tests are dropped unless
    |add_experimental| is set, and the remaining tests are kept only if
    |predicate| accepts them.

    @param cf_getter: a control_file_getter.ControlFileGetter used to list
                      and fetch the content of control files
    @param predicate: a function that should return True when run over a
                      ControlData representation of a control file that
                      should be in this Suite.
    @param suite_name: If specified, this method will attempt to restrain
                       the search space to just this suite's control files.
    @param add_experimental: add tests with experimental attribute set.
    @param forgiving_parser: If False, will raise ControlVariableExceptions
                             if any are encountered when parsing control
                             files. Note that this can raise an exception
                             for syntax errors in unrelated files, because
                             we parse them before applying the predicate.
    @param run_prod_code: If true, the suite will run the test code that
                          lives in prod aka the test code currently on the
                          lab servers by disabling SSP for the discovered
                          tests.
    @param test_args: A dict of args to be seeded in test control file.

    @raises ControlVariableException: If forgiving_parser is False and there
                                      is a syntax error in a control file.

    @return list of ControlData objects that should be run, with control
            file text added in |text| attribute. Results are sorted based
            on the TIME setting in control file, slowest test comes first.
    """
    logging.debug('Getting control file list for suite: %s', suite_name)
    retriever = _get_cf_retriever(cf_getter,
                                  forgiving_parser=forgiving_parser,
                                  run_prod_code=run_prod_code,
                                  test_args=test_args)
    parsed = retriever.retrieve_for_suite(suite_name)
    if not add_experimental:
        parsed = {cf_path: cf_data
                  for cf_path, cf_data in parsed.iteritems()
                  if not cf_data.experimental}
    logging.debug('Parsed %s control files.', len(parsed))

    def _time_index(test):
        """Sort key derived from the test's TIME setting."""
        return control_data.ControlData.get_test_time_index(test.time)

    selected = [test for test in parsed.itervalues() if predicate(test)]
    # Descending time index puts the slowest tests first.
    return sorted(selected, key=_time_index, reverse=True)

Allen Li

2017-02-28 18:37:52 -0800

[diff] [blame]

872

def find_possible_tests(cf_getter, predicate, suite_name='', count=10):
    """
    Function to scan through all tests and find possible tests.

    Control files are retrieved for |suite_name| with a forgiving parser,
    each is scored with |predicate|, and the |count| best-scoring names are
    returned. When one name is scored more than once, the last score seen
    is the one that counts.

    @param cf_getter: a control_file_getter.ControlFileGetter used to list
                      and fetch the content of control files
    @param predicate: a function that should return a tuple of (name, ratio)
                      (or a list of such tuples) when run over a ControlData
                      representation of a control file. `name` is the key to
                      be compared, e.g., a suite name or test name. `ratio`
                      is a value between [0,1] indicating the similarity of
                      `name` and the value to be compared.
    @param suite_name: If specified, this method will attempt to restrain
                       the search space to just this suite's control files.
    @param count: Number of suggestions to return, default to 10.

    @return list of top names that are similar to the given test, sorted by
            match ratio, best first.
    """
    logging.debug('Getting control file list for suite: %s', suite_name)
    retriever = _get_cf_retriever(cf_getter,
                                  forgiving_parser=True)
    parsed_tests = retriever.retrieve_for_suite(suite_name)
    logging.debug('Parsed %s control files.', len(parsed_tests))

    ratio_by_name = {}
    for parsed in parsed_tests.itervalues():
        scored = predicate(parsed)
        # Some predicates may return a list of tuples, e.g.,
        # name_in_tag_similarity_predicate. Normalize everything to a list.
        scored_pairs = scored if isinstance(scored, list) else [scored]
        for candidate, ratio in scored_pairs:
            ratio_by_name[candidate] = ratio

    ranked = sorted(ratio_by_name.items(), key=operator.itemgetter(1),
                    reverse=True)
    return [entry[0] for entry in ranked[:count]]

911

912

Allen Li

98a26a4

2017-02-28 18:43:24 -0800

[diff] [blame]

913

def _deprecated_suite_method(func):

914

"""Decorator for deprecated Suite static methods.

915

916

TODO(ayatane): This is used to decorate functions that are called as

917

static methods on Suite.

918

"""

919

@functools.wraps(func)

920

def wrapper(*args, **kwargs):

921

warnings.warn('Calling this method from Suite is deprecated')

922

return func(*args, **kwargs)

923

return staticmethod(wrapper)

924

925

Allen Li

4b5a24f

2017-03-09 16:01:35 -0800

[diff] [blame]

926

class _BaseSuite(object):

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

927

"""

928

A suite of tests, defined by some predicate over control file variables.

929

930

Given a place to search for control files a predicate to match the desired

931

tests, can gather tests and fire off jobs to run them, and then wait for

932

results.

933

934

@var _predicate: a function that should return True when run over a

935

ControlData representation of a control file that should be in

936

this Suite.

937

@var _tag: a string with which to tag jobs run in this suite.

Dan Shi

2014-10-10 13:38:51 -0700

[diff] [blame]

938

@var _builds: the builds on which we're running this suite.

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

939

@var _afe: an instance of AFE as defined in server/frontend.py.

940

@var _tko: an instance of TKO as defined in server/frontend.py.

941

@var _jobs: currently scheduled jobs, if any.

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

942

@var _jobs_to_tests: a dictionary that maps job ids to tests represented

943

ControlData objects.

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

944

@var _retry: a bool value indicating whether jobs should be retried on

945

failure.

946

@var _retry_handler: a RetryHandler object.

947

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

948

"""

949

Dan Shi

2014-10-10 13:38:51 -0700

[diff] [blame]

950

Allen Li

2016-12-09 18:04:26 -0800

[diff] [blame]

951

def __init__(
        self,
        tests,
        tag,
        builds,
        board,
        afe=None,
        tko=None,
        pool=None,
        results_dir=None,
        max_runtime_mins=24*60,
        timeout_mins=24*60,
        file_bugs=False,
        file_experimental_bugs=False,
        suite_job_id=None,
        ignore_deps=False,
        extra_deps=None,
        priority=priorities.Priority.DEFAULT,
        wait_for_results=True,
        job_retry=False,
        max_retries=sys.maxint,
        offload_failures_only=False,
        test_source_build=None,
        job_keyvals=None
):
    """Initialize instance.

    @param tests: Iterable of tests to run.
    @param tag: a string with which to tag jobs run in this suite.
    @param builds: the builds on which we're running this suite.
    @param board: the board on which we're running this suite.
    @param afe: an instance of AFE as defined in server/frontend.py.
    @param tko: an instance of TKO as defined in server/frontend.py.
    @param pool: Specify the pool of machines to use for scheduling
            purposes.
    @param results_dir: The directory where the job can write results to.
                        This must be set if you want job_id of sub-jobs
                        list in the job keyvals.
    @param max_runtime_mins: Maximum suite runtime, in minutes.
    @param timeout_mins: Maximum job lifetime; presumably in minutes, going
                         by the parameter name and the 24*60 default.
    @param file_bugs: Stored on the instance; _should_report() only reports
                      a failure when this is truthy.
    @param file_experimental_bugs: Stored on the instance; _should_report()
                                   uses it to allow reporting of
                                   experimental test failures.
    @param suite_job_id: Job id that will act as parent id to all sub jobs.
                         Default: None
    @param ignore_deps: True if jobs should ignore the DEPENDENCIES
                        attribute and skip applying of dependency labels.
                        (Default:False)
    @param extra_deps: A list of strings which are the extra DEPENDENCIES
                       to add to each test being scheduled. The list is
                       copied; the caller's object is not modified.
    @param priority: Integer priority level.  Higher is more important.
    @param wait_for_results: Set to False to run the suite job without
                             waiting for test jobs to finish. Default is
                             True.
    @param job_retry: A bool value indicating whether jobs should be retried
                      on failure. If True, the field 'JOB_RETRIES' in
                      control files will be respected. If False, do not
                      retry.
    @param max_retries: Maximum retry limit at suite level.
                        Regardless how many times each individual test
                        has been retried, the total number of retries
                        happening in the suite can't exceed _max_retries.
                        Default to sys.maxint.
    @param offload_failures_only: Only enable gs_offloading for failed
                                  jobs.
    @param test_source_build: Build that contains the server-side test code.
    @param job_keyvals: General job keyvals to be inserted into keyval file,
                        which will be used by tko/parse later.
    """

    self.tests = list(tests)
    self._tag = tag
    self._builds = builds
    self._results_dir = results_dir
    self._afe = afe or frontend_wrappers.RetryingAFE(timeout_min=30,
                                                     delay_sec=10,
                                                     debug=False)
    self._tko = tko or frontend_wrappers.RetryingTKO(timeout_min=30,
                                                     delay_sec=10,
                                                     debug=False)
    self._jobs = []
    self._jobs_to_tests = {}

    self._file_bugs = file_bugs
    self._file_experimental_bugs = file_experimental_bugs
    self._suite_job_id = suite_job_id
    self._job_retry=job_retry
    self._max_retries = max_retries
    # RetryHandler to be initialized in schedule()
    self._retry_handler = None
    self.wait_for_results = wait_for_results
    self._job_keyvals = job_keyvals

    # Work on a private copy: appending board/pool to the caller's own list
    # would leak these labels into any later reuse of that list.
    child_deps = [] if extra_deps is None else list(extra_deps)
    child_deps.append(board)
    if pool:
        child_deps.append(pool)
    # NOTE(review): the raw |afe| argument (possibly None) is forwarded here
    # rather than self._afe; presumably the job creator supplies its own
    # default - confirm against _SuiteChildJobCreator.
    self._job_creator = _SuiteChildJobCreator(
        tag=tag,
        builds=builds,
        board=board,
        afe=afe,
        max_runtime_mins=max_runtime_mins,
        timeout_mins=timeout_mins,
        suite_job_id=suite_job_id,
        ignore_deps=ignore_deps,
        extra_deps=child_deps,
        priority=priority,
        offload_failures_only=offload_failures_only,
        test_source_build=test_source_build,
    )

Allen Li

da198fd

2017-03-29 17:22:13 -0700

[diff] [blame]

1060

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

1061

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

1062

def _schedule_test(self, record, test, retry_for=None, ignore_errors=False):
    """Schedule a single test and return the job.

    Schedule a single test by creating a job, and then update relevant
    data structures that are used to keep track of all running jobs.

    Emits a TEST_NA status log entry if it failed to schedule the test due
    to NoEligibleHostException or a non-existent board label.

    Returns a frontend.Job object if the test is successfully scheduled.
    If scheduling failed due to NoEligibleHostException or a non-existent
    board label, returns None.  If ignore_errors is True, rpc errors
    handled by the RPCException/JSONRPCException clause return None,
    otherwise the errors are raised as-is.

    NOTE(review): a proxy.ValidationError that is not a non-existent board
    error is re-raised from the first handler regardless of ignore_errors;
    confirm that is intended.

    @param record: A callable to use for logging.
                   prototype: record(base_job.status_log_entry)
    @param test: ControlData for a test to run.
    @param retry_for: If we are scheduling a test to retry an
                      old job, the afe_job_id of the old job
                      will be passed in as |retry_for|.
    @param ignore_errors: If True, when an rpc error occur, ignore
                         the error and will return None.
                         If False, rpc errors will be raised.

    @returns: A frontend.Job object or None
    """
    msg = 'Scheduling %s' % test.name
    if retry_for:
        msg = msg + ', to retry afe job %d' % retry_for
    logging.debug(msg)
    begin_time_str = datetime.datetime.now().strftime(time_utils.TIME_FMT)
    try:
        job = self._job_creator.create_job(test, retry_for=retry_for)
    except (error.NoEligibleHostException, proxy.ValidationError) as e:
        if (isinstance(e, error.NoEligibleHostException)
            or (isinstance(e, proxy.ValidationError)
                and _is_nonexistent_board_error(e))):
            # Treat a dependency on a non-existent board label the same as
            # a dependency on a board that exists, but for which there's no
            # hardware.
            logging.debug('%s not applicable for this board/pool. '
                          'Emitting TEST_NA.', test.name)
            Status('TEST_NA', test.name,
                   'Skipping: test not supported on this board/pool.',
                   begin_time_str=begin_time_str).record_all(record)
            return None
        else:
            # Bare raise keeps the original traceback; `raise e` would
            # restart it at this line under Python 2.
            raise
    except (error.RPCException, proxy.JSONRPCException) as e:
        if retry_for:
            # Mark that we've attempted to retry the old job.
            self._retry_handler.set_attempted(job_id=retry_for)

        if ignore_errors:
            logging.error('Failed to schedule test: %s, Reason: %s',
                          test.name, e)
            return None
        else:
            # Bare raise keeps the original traceback.
            raise
    else:
        self._jobs.append(job)
        self._jobs_to_tests[job.id] = test
        if retry_for:
            # A retry job was just created, record it.
            self._retry_handler.add_retry(
                    old_job_id=retry_for, new_job_id=job.id)
            retry_count = (test.job_retries -
                           self._retry_handler.get_retry_max(job.id))
            logging.debug('Job %d created to retry job %d. '
                          'Have retried for %d time(s)',
                          job.id, retry_for, retry_count)
        self._remember_job_keyval(job)
        return job

Fang Deng

2014-03-17 15:19:46 -0700

[diff] [blame]

1135

1136

Alex Miller

2012-12-19 13:38:31 -0800

[diff] [blame]

1137

def schedule(self, record, add_experimental=True):
    #pylint: disable-msg=C0111
    """
    Schedule jobs using |self._afe|.

    frontend.Job objects representing each scheduled job will be put in
    |self._jobs|. Any exception raised while scheduling is logged and
    recorded as a FAIL status for the suite instead of propagating; tests
    scheduled before the failure still count towards the return value.

    @param record: A callable to use for logging.
                   prototype: record(base_job.status_log_entry)
    @param add_experimental: schedule experimental tests as well, or not.
    @returns: The number of tests that were scheduled.
    """
    names_scheduled = []
    experimental_filter = _ExperimentalTestFilter(
            tests=self.tests,
            add_experimental=add_experimental)
    logging.debug('Discovered %d stable tests.',
                  len(experimental_filter.stable_tests))
    logging.debug('Discovered %d unstable tests.',
                  len(experimental_filter.unstable_tests))

    Status('INFO', 'Start %s' % self._tag).record_result(record)
    try:
        # Write job_keyvals into keyval file.
        if self._job_keyvals:
            utils.write_keyval(self._results_dir, self._job_keyvals)

        for candidate in experimental_filter.get_tests_to_schedule():
            if self._schedule_test(record, candidate) is None:
                # Nothing was scheduled for this test.
                continue
            names_scheduled.append(candidate.name)

        # Write the num of scheduled tests and name of them to keyval file.
        logging.debug('Scheduled %d tests, writing the total to keyval.',
                      len(names_scheduled))
        summary_keyvals = self._make_scheduled_tests_keyvals(names_scheduled)
        utils.write_keyval(self._results_dir, summary_keyvals)
    except Exception:  # pylint: disable=W0703
        logging.exception('Exception while scheduling suite')
        Status('FAIL', self._tag,
               'Exception while scheduling suite').record_result(record)

    if self._job_retry:
        self._retry_handler = RetryHandler(
                initial_jobs_to_tests=self._jobs_to_tests,
                max_retries=self._max_retries)
    return len(names_scheduled)

Aviv Keshet

e9170d9

2013-07-19 11:20:45 -0700

[diff] [blame]

1186

Alex Miller

2012-12-19 13:38:31 -0800

[diff] [blame]

1187

Allen Li

dda59b8

2016-12-12 18:20:04 -0800

[diff] [blame]

1188

def _make_scheduled_tests_keyvals(self, scheduled_test_names):
    """Build the keyvals that summarize which tests were scheduled.

    @param scheduled_test_names: A list of scheduled test name strings.

    @returns: A keyvals dict holding the number of names and the repr()
              of the list of names.
    """
    keyvals = {}
    keyvals[constants.SCHEDULED_TEST_COUNT_KEY] = len(scheduled_test_names)
    keyvals[constants.SCHEDULED_TEST_NAMES_KEY] = repr(scheduled_test_names)
    return keyvals

Allen Li

2016-12-29 15:12:39 -0800

[diff] [blame]

1201

def _should_report(self, result):
    """
    Decide whether a job result needs to be reported.

    A result for which a retry is still coming is never reported.
    Otherwise all of the following must hold: bug filing is enabled, the
    test was executed, the test is not experimental (unless experimental
    bugs are filed as well), result.is_testna() is false, and the result
    is worse than a GOOD status.

    @param result: A result, encapsulating the status of the failed job.
    @return: A true value if we should report this failure.
    """
    if self._has_retry(result):
        return False

    prefix = constants.EXPERIMENTAL_PREFIX
    # A test is experimental if the prefix shows up in either its test
    # name or its job name.
    is_experimental = (prefix in result._test_name or
                       prefix in result._job_name)

    return (self._file_bugs and
            result.test_executed and
            (not is_experimental or self._file_experimental_bugs) and
            not result.is_testna() and
            result.is_worse_than(job_status.Status('GOOD', '', 'reason')))

beeps

2013-05-30 11:34:14 -0700

[diff] [blame]

1219

1220

Allen Li

cc75229

2017-01-03 12:44:39 -0800

[diff] [blame]

1221

def _has_retry(self, result):

1222

"""

1223

Return True if this result gets to retry.

1224

1225

@param result: A result, encapsulating the status of the failed job.

1226

@return: bool

1227

"""

1228

return (self._job_retry

1229

and self._retry_handler.has_following_retry(result))

1230

1231

Allen Li

1850345

2016-12-29 14:56:48 -0800

[diff] [blame]

1232

def wait(self, record, bug_template=None):
    """
    Poll for job results and record each one as it arrives.

    Every result yielded by the results generator is passed on to
    _record_result().  An exception raised while waiting is logged and
    recorded as a FAIL status for this suite instead of being propagated.

    @param record: callable that records job status.
             prototype:
               record(base_job.status_log_entry)
    @param bug_template: A template dictionary specifying the default bug
                         filing options for failures in this suite.
    """
    # The reporting modules depend on external packages (e.g. httplib2).
    # Importing them at module level would force every importer of
    # suite.py to build site-packages first, so import them lazily here.
    from autotest_lib.server.cros.dynamic_suite import reporting

    if bug_template is None:
        bug_template = {}

    bug_reporter = (reporting.Reporter() if self._file_bugs
                    else reporting.NullReporter())

    try:
        if not self._suite_job_id:
            logging.warning('Unknown suite_job_id, falling back to less '
                            'efficient results_generator.')
            results_generator = job_status.wait_for_results(
                    self._afe, self._tko, self._jobs)
        else:
            results_generator = job_status.wait_for_child_results(
                    self._afe, self._tko, self._suite_job_id)

        for result in results_generator:
            # The generator itself is passed along so that retry jobs can
            # be sent back into it.
            self._record_result(
                    result=result,
                    record=record,
                    results_generator=results_generator,
                    bug_reporter=bug_reporter,
                    bug_template=bug_template)
    except Exception:  # pylint: disable=W0703
        logging.exception('Exception waiting for results')
        failure = Status('FAIL', self._tag, 'Exception waiting for results')
        failure.record_result(record)

1280

1281

Allen Li

2016-12-29 15:23:01 -0800

[diff] [blame]

1282

def _record_result(self, result, record, results_generator, bug_reporter,
                   bug_template):
    """
    Record one test job result, then retry and/or report it as needed.

    The result is recorded and remembered as a job keyval.  If retries are
    enabled and the retry handler asks for one, a retry job is scheduled
    and sent to the results generator.  Finally, a result that should be
    reported is either filed as a bug or sent out by email.

    @param result: Status instance for job.
    @param record: callable that records job status.
             prototype:
               record(base_job.status_log_entry)
    @param results_generator: Results generator for sending job retries.
    @param bug_reporter: Reporter instance for reporting bugs.
    @param bug_template: A template dictionary specifying the default bug
                         filing options for failures in this suite.
    """
    result.record_all(record)
    self._remember_job_keyval(result)

    wants_retry = (self._job_retry and
                   self._retry_handler._should_retry(result))
    if wants_retry:
        retry_job = self._schedule_test(
                record=record, test=self._jobs_to_tests[result.id],
                retry_for=result.id, ignore_errors=True)
        if retry_job:
            # Tell the results generator about the newly scheduled retry.
            results_generator.send([retry_job])

    # TODO (fdeng): If the suite times out before a retry could
    # finish, we would lose the chance to file a bug for the
    # original job.
    if not self._should_report(result):
        return

    if self._should_file_bugs:
        self._file_bug(result, bug_reporter, bug_template)
        return

    # The reporting modules depend on external packages (e.g. httplib2).
    # Import lazily so that importing suite.py does not require
    # site-packages to have been built.
    from autotest_lib.server.cros.dynamic_suite import reporting

    reporting.send_email(
            self._get_test_bug(result),
            self._get_bug_template(result, bug_template))

Allen Li

2016-12-29 15:23:01 -0800

[diff] [blame]

1325

1326

Allen Li

d5df44b

2016-12-29 15:59:06 -0800

[diff] [blame]

1327

def _get_bug_template(self, result, bug_template):
    """Build the bug template to use for a test job.

    The suite-level template is merged with the bug template of the test
    that the job ran, when that test defines one.

    @param result: Status instance for job.
    @param bug_template: A template dictionary specifying the default bug
                         filing options for failures in this suite.
    @returns: The merged bug template; the suite-level template on its own
              if an AttributeError is raised (the test control file has no
              bug template); or an empty dict if the merge is rejected as
              invalid.
    """
    # The reporting modules depend on external packages (e.g. httplib2).
    # Import lazily so that importing suite.py does not require
    # site-packages to have been built.
    from autotest_lib.server.cros.dynamic_suite import reporting_utils

    suite_template = reporting_utils.BugTemplate(bug_template)
    try:
        # Try to merge with the bug template from the test control file.
        test_template = self._jobs_to_tests[result.id].bug_template
        return suite_template.finalize_bug_template(test_template)
    except AttributeError:
        # Test control file does not have bug template defined.
        return suite_template.bug_template
    except reporting_utils.InvalidBugTemplateException as e:
        logging.error('Merging bug templates failed with '
                      'error: %s An empty bug template will '
                      'be used.', e)
        return {}

Allen Li

2016-12-29 15:53:34 -0800

[diff] [blame]

1359

def _get_test_bug(self, result):
    """Create the TestBug for the given result.

    The job's detailed test views are fetched from TKO and passed to
    utils.get_chrome_version() to obtain the Chrome version for the bug.

    @param result: Status instance for a test job.
    @returns: TestBug instance.
    """
    # The reporting modules depend on external packages (e.g. httplib2).
    # Import lazily so that importing suite.py does not require
    # site-packages to have been built.
    from autotest_lib.server.cros.dynamic_suite import reporting

    detailed_views = self._tko.run('get_detailed_test_views',
                                   afe_job_id=result.id)
    return reporting.TestBug(
            self._job_creator.cros_build,
            utils.get_chrome_version(detailed_views),
            self._tag,
            result)

Allen Li

2016-12-29 16:19:55 -0800

[diff] [blame]

1381

@property
def _should_file_bugs(self):
    """Tell whether failures of this suite are filed as bugs.

    @returns: True if this suite's tag is one of _FILE_BUG_SUITES.
    """
    # Bugs are filed only for the suites listed in _FILE_BUG_SUITES;
    # for any other suite an email is sent to the owner and cc instead.
    suite_tag = self._tag
    return suite_tag in _FILE_BUG_SUITES

1390

1391

Allen Li

47c9fca

2016-12-29 16:22:53 -0800

[diff] [blame]

1392

def _file_bug(self, result, bug_reporter, bug_template):
    """Report a test job result through the bug reporter.

    If the reporter returns a bug id, the id and count are written to the
    results directory as keyvals.

    @param result: Status instance for job.
    @param bug_reporter: Reporter instance for reporting bugs.
    @param bug_template: A template dictionary specifying the default bug
                         filing options for failures in this suite.
    """
    bug_id, bug_count = bug_reporter.report(
            self._get_test_bug(result),
            self._get_bug_template(result, bug_template))
    if bug_id is None:
        return

    # We use keyvals to communicate bugs filed with run_suite.
    bug_keyvals = tools.create_bug_keyvals(
            result.id, result.test_name, (bug_id, bug_count))
    try:
        utils.write_keyval(self._results_dir, bug_keyvals)
    except ValueError:
        logging.error('Unable to log bug keyval for:%s',
                      result.test_name)

Alex Miller

2012-12-19 13:38:31 -0800

[diff] [blame]

1417

def abort(self):
    """
    Abort all scheduled test jobs.

    Nothing is sent to the AFE when there are no scheduled jobs.
    """
    if not self._jobs:
        return
    scheduled_ids = [scheduled.id for scheduled in self._jobs]
    self._afe.run('abort_host_queue_entries', job__id__in=scheduled_ids)

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

1424

1425

Allen Li

2016-12-29 16:05:41 -0800

[diff] [blame]

1426

def _remember_job_keyval(self, job):

Chris Masone

d9f13c5

2012-08-29 10:37:08 -0700

[diff] [blame]

1427

"""

1428

Record provided job as a suite job keyval, for later referencing.

1429

Allen Li

2016-12-29 16:05:41 -0800

[diff] [blame]

1430

@param job: some representation of a job that has the attributes:

1431

id, test_name, and owner

Chris Masone

d9f13c5

2012-08-29 10:37:08 -0700

[diff] [blame]

1432

"""

Allen Li

3cc73cd

2016-12-12 16:02:21 -0800

[diff] [blame]

1433

if self._results_dir and job.id and job.owner and job.test_name:

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

1434

job_id_owner = '%s-%s' % (job.id, job.owner)

Chris Masone

d9f13c5

2012-08-29 10:37:08 -0700

[diff] [blame]

1435

logging.debug('Adding job keyval for %s=%s',

Chris Sosa

accb5ce

2012-08-30 17:29:15 -0700

[diff] [blame]

1436

job.test_name, job_id_owner)

Chris Masone

2012-08-15 14:25:53 -0700

[diff] [blame]

1437

utils.write_keyval(

1438

self._results_dir,

1439

{hashlib.md5(job.test_name).hexdigest(): job_id_owner})

1440

Dan Shi

d152180

2013-05-24 13:08:37 -0700

[diff] [blame]

1441

Allen Li

4b5a24f

2017-03-09 16:01:35 -0800

[diff] [blame]

1442

class Suite(_BaseSuite):

1443

"""

1444

A suite of tests, defined by some predicate over control file variables.

1445

1446

Given a place to search for control files and a predicate to match the desired

1447

tests, can gather tests and fire off jobs to run them, and then wait for

1448

results.

1449

1450

@var _predicate: a function that should return True when run over a

1451

ControlData representation of a control file that should be in

1452

this Suite.

1453

@var _tag: a string with which to tag jobs run in this suite.

1454

@var _builds: the builds on which we're running this suite.

1455

@var _afe: an instance of AFE as defined in server/frontend.py.

1456

@var _tko: an instance of TKO as defined in server/frontend.py.

1457

@var _jobs: currently scheduled jobs, if any.

1458

@var _jobs_to_tests: a dictionary that maps job ids to tests represented

1459

as ControlData objects.

1460

@var _cf_getter: a control_file_getter.ControlFileGetter

1461

@var _job_retry: a bool value indicating whether jobs should be retried on

1462

failure.

1463

@var _retry_handler: a RetryHandler object.

"""

# TODO(ayatane): These methods are kept on the Suite class for

1468

# backward compatibility.

1469

find_and_parse_tests = _deprecated_suite_method(find_and_parse_tests)

1470

find_possible_tests = _deprecated_suite_method(find_possible_tests)

1471

create_fs_getter = _deprecated_suite_method(create_fs_getter)

1472

name_in_tag_predicate = _deprecated_suite_method(name_in_tag_predicate)

1473

name_in_tag_similarity_predicate = _deprecated_suite_method(

1474

name_in_tag_similarity_predicate)

1475

test_name_equals_predicate = _deprecated_suite_method(

1476

test_name_equals_predicate)

1477

test_name_matches_pattern_predicate = _deprecated_suite_method(

1478

test_name_matches_pattern_predicate)

1479

test_file_matches_pattern_predicate = _deprecated_suite_method(

1480

test_file_matches_pattern_predicate)

1481

matches_attribute_expression_predicate = _deprecated_suite_method(

1482

matches_attribute_expression_predicate)

1483

test_name_similarity_predicate = _deprecated_suite_method(

1484

test_name_similarity_predicate)

1485

test_file_similarity_predicate = _deprecated_suite_method(

1486

test_file_similarity_predicate)

1487

list_all_suites = _deprecated_suite_method(list_all_suites)

1488

get_test_source_build = _deprecated_suite_method(get_test_source_build)

1489

1490

Allen Li

25bb1c6

2017-03-09 16:27:00 -0800

[diff] [blame]

1491

@classmethod
def create_from_predicates(cls, predicates, builds, board, devserver,
                           cf_getter=None, name='ad_hoc_suite',
                           run_prod_code=False, **dargs):
    """
    Create a Suite from a list of predicate test filters.

    When no control file getter is supplied, one is created here: a
    file-system getter for _AUTOTEST_DIR if |run_prod_code| is set,
    otherwise a devserver getter for the test source build.

    @param predicates: A list of callables that accept ControlData
                       representations of control files. A test will be
                       included in suite if all callables in this list
                       return True on the given control file.
    @param builds: the builds on which we're running this suite. It's a
                   dictionary of version_prefix:build.
    @param board: the board on which we're running this suite.
    @param devserver: the devserver which contains the build.
    @param cf_getter: control_file_getter.ControlFileGetter. Defaults to
                      using DevServerGetter.
    @param name: name of suite. Defaults to 'ad_hoc_suite'
    @param run_prod_code: If true, the suite will run the tests that
                          lives in prod aka the test code currently on the
                          lab servers.
    @param **dargs: Any other Suite constructor parameters, as described
                    in Suite.__init__ docstring.
    @return a Suite instance.
    """
    if cf_getter is None and run_prod_code:
        cf_getter = create_fs_getter(_AUTOTEST_DIR)
    elif cf_getter is None:
        source_build = get_test_source_build(builds, **dargs)
        cf_getter = _create_ds_getter(source_build, devserver)

    return cls(predicates, name, builds, board, cf_getter, run_prod_code,
               **dargs)

@classmethod
def create_from_name(cls, name, builds, board, devserver, cf_getter=None,
                     **dargs):
    """
    Create a Suite whose tests are selected by the SUITE control file var.

    A single name_in_tag_predicate(|name|) predicate is used to select the
    tests.  When no control file getter is supplied, a devserver getter
    for the test source build is created.

    @param name: a value of the SUITE control file variable to search for.
    @param builds: the builds on which we're running this suite. It's a
                   dictionary of version_prefix:build.
    @param board: the board on which we're running this suite.
    @param devserver: the devserver which contains the build.
    @param cf_getter: control_file_getter.ControlFileGetter. Defaults to
                      using DevServerGetter.
    @param **dargs: Any other Suite constructor parameters, as described
                    in Suite.__init__ docstring.
    @return a Suite instance.
    """
    getter = cf_getter
    if getter is None:
        source_build = get_test_source_build(builds, **dargs)
        getter = _create_ds_getter(source_build, devserver)

    suite_predicates = [name_in_tag_predicate(name)]
    return cls(suite_predicates, name, builds, board, getter, **dargs)

1560

1561

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

def __init__(

self,

predicates,

tag,

builds,

board,

cf_getter,

run_prod_code=False,

afe=None,

tko=None,

pool=None,

results_dir=None,

max_runtime_mins=24*60,

1575

timeout_mins=24*60,

1576

file_bugs=False,

1577

file_experimental_bugs=False,

suite_job_id=None,

ignore_deps=False,

extra_deps=None,

priority=priorities.Priority.DEFAULT,

1582

forgiving_parser=True,

1583

wait_for_results=True,

1584

job_retry=False,

1585

max_retries=sys.maxint,

1586

offload_failures_only=False,

1587

test_source_build=None,

Allen Li

2017-03-09 16:29:48 -0800

[diff] [blame]

1588

job_keyvals=None,

1589

test_args=None

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

):

"""

Constructor

@param predicates: A list of callables that accept ControlData

1595

representations of control files. A test will be

Allen Li

2887e33

2017-03-09 16:30:36 -0800

[diff] [blame]

1596

included in suite if all callables in this list

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

1597

return True on the given control file.

1598

@param tag: a string with which to tag jobs run in this suite.

1599

@param builds: the builds on which we're running this suite.

1600

@param board: the board on which we're running this suite.

1601

@param cf_getter: a control_file_getter.ControlFileGetter

1602

@param afe: an instance of AFE as defined in server/frontend.py.

1603

@param tko: an instance of TKO as defined in server/frontend.py.

1604

@param pool: Specify the pool of machines to use for scheduling

1605

purposes.

1606

@param run_prod_code: If true, the suite will run the test code that

1607

lives in prod aka the test code currently on the

1608

lab servers.

1609

@param results_dir: The directory where the job can write results to.

1610

This must be set if you want job_id of sub-jobs

1611

list in the job keyvals.

1612

@param max_runtime_mins: Maximum suite runtime, in minutes.

1613

@param timeout_mins: Maximum job lifetime, in minutes.

1614

@param suite_job_id: Job id that will act as parent id to all sub jobs.

1615

Default: None

1616

@param ignore_deps: True if jobs should ignore the DEPENDENCIES

1617

attribute and skip applying of dependency labels.

1618

(Default:False)

1619

@param extra_deps: A list of strings which are the extra DEPENDENCIES

1620

to add to each test being scheduled.

1621

@param priority: Integer priority level. Higher is more important.

1622

@param wait_for_results: Set to False to run the suite job without

1623

waiting for test jobs to finish. Default is

1624

True.

1625

@param job_retry: A bool value indicating whether jobs should be retried

1626

on failure. If True, the field 'JOB_RETRIES' in

1627

control files will be respected. If False, do not

1628

retry.

1629

@param max_retries: Maximum retry limit at suite level.

1630

Regardless how many times each individual test

1631

has been retried, the total number of retries

1632

happening in the suite can't exceed _max_retries.

1633

Default to sys.maxint.

1634

@param offload_failures_only: Only enable gs_offloading for failed

1635

jobs.

1636

@param test_source_build: Build that contains the server-side test code.

1637

@param job_keyvals: General job keyvals to be inserted into keyval file,

1638

which will be used by tko/parse later.

Allen Li

2017-03-09 16:29:48 -0800

[diff] [blame]

1639

@param test_args: A dict of args passed all the way to each individual

1640

test that will be actually ran.

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

1641

1642

"""

Allen Li

2017-03-09 16:44:30 -0800

[diff] [blame]

1643

tests = find_and_parse_tests(

1644

cf_getter,

1645

_ComposedPredicate(predicates),

1646

tag,

1647

add_experimental=True,

1648

forgiving_parser=forgiving_parser,

1649

run_prod_code=run_prod_code,

1650

test_args=test_args,

1651

)

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

1652

super(Suite, self).__init__(

Allen Li

2017-03-09 16:44:30 -0800

[diff] [blame]

1653

tests=tests,

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

1654

tag=tag,

1655

builds=builds,

1656

board=board,

Allen Li

2017-03-09 16:23:06 -0800

[diff] [blame]

afe=afe,

tko=tko,

pool=pool,

results_dir=results_dir,

1661

max_runtime_mins=max_runtime_mins,

1662

timeout_mins=timeout_mins,

1663

file_bugs=file_bugs,

1664

file_experimental_bugs=file_experimental_bugs,

1665

suite_job_id=suite_job_id,

1666

ignore_deps=ignore_deps,

1667

extra_deps=extra_deps,

1668

priority=priority,

Allen Li