Blame - frontend/afe/rpc_utils.py - platform/external/autotest

2013-02-19 17:49:49 -0800

[diff] [blame]

1

#pylint: disable-msg=C0111

mbligh

2008-02-15 16:48:40 +0000

[diff] [blame]

2

"""\

3

Utility functions for rpc_interface.py. We keep them in a separate file so that

4

only RPC interface functions go into that file.

5

"""

6

7

__author__ = 'showard@google.com (Steve Howard)'

8

MK Ryu

84573e1

2015-02-18 15:54:09 -0800

[diff] [blame]

9

import datetime

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

10

from functools import wraps

MK Ryu

84573e1

2015-02-18 15:54:09 -0800

[diff] [blame]

11

import inspect

12

import os

13

import sys

showard

3d6ae11

2009-05-02 00:45:48 +0000

[diff] [blame]

14

import django.http

Dan Shi

07e09af

2013-04-12 09:31:29 -0700

[diff] [blame]

15

from autotest_lib.frontend.afe import models, model_logic

Alex Miller

2013-08-21 13:59:01 -0700

[diff] [blame]

16

from autotest_lib.client.common_lib import control_data, error

Jiaxi Luo

421608e

2014-07-07 14:38:00 -0700

[diff] [blame]

17

from autotest_lib.client.common_lib import global_config, priorities

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

18

from autotest_lib.client.common_lib import time_utils

MK Ryu

2015-05-18 12:00:47 -0700

[diff] [blame]

19

from autotest_lib.client.common_lib.cros.graphite import autotest_stats

Prashanth Balasubramanian

2014-12-23 11:26:44 -0800

[diff] [blame]

20

from autotest_lib.server import utils as server_utils

MK Ryu

9651ca5

2015-06-08 17:48:22 -0700

[diff] [blame]

21

from autotest_lib.server.cros import provision

22

from autotest_lib.server.cros.dynamic_suite import frontend_wrappers

mbligh

2008-02-15 16:48:40 +0000

[diff] [blame]

23

showard

a62866b

2008-07-28 21:27:41 +0000

[diff] [blame]

24

# Placeholder objects standing in for "no date". _prepare_data() returns None
# for a value that *is* one of these objects (identity, not equality).
NULL_DATETIME = datetime.datetime.max
NULL_DATE = datetime.date.max

26

mbligh

2008-02-15 16:48:40 +0000

[diff] [blame]

27

def prepare_for_serialization(objects):
    """
    Prepare Python objects to be returned via RPC.

    A non-empty list whose first element is a dict containing an 'id' key is
    first reduced to one dict per distinct id (gather_unique_dicts); the
    result is then converted by _prepare_data.

    @param objects: objects to be prepared.

    @returns The converted data.
    """
    is_list_of_object_dicts = (isinstance(objects, list) and len(objects) and
                               isinstance(objects[0], dict) and
                               'id' in objects[0])
    if is_list_of_object_dicts:
        objects = gather_unique_dicts(objects)
    return _prepare_data(objects)

showard

b8d3424

2008-04-25 18:11:16 +0000

[diff] [blame]

36

37

showard

2009-04-07 18:14:34 +0000

[diff] [blame]

38

def prepare_rows_as_nested_dicts(query, nested_dict_column_names):
    """
    Prepare a Django query to be returned via RPC as a sequence of nested
    dictionaries.

    @param query - A Django model query object with a select_related() method.
    @param nested_dict_column_names - A list of column/attribute names for the
            rows returned by query to expand into nested dictionaries using
            their get_object_dict() method when not None.

    @returns A list suitable to be returned in an RPC.
    """
    expanded_rows = []
    for row in query.select_related():
        as_dict = row.get_object_dict()
        for name in nested_dict_column_names:
            if as_dict[name] is None:
                # Nothing to expand for this row.
                continue
            as_dict[name] = getattr(row, name).get_object_dict()
        expanded_rows.append(as_dict)
    return prepare_for_serialization(expanded_rows)

58

59

showard

b8d3424

2008-04-25 18:11:16 +0000

[diff] [blame]

60

def _prepare_data(data):

jadmanski

2008-06-06 21:10:57 +0000

[diff] [blame]

61

"""

62

Recursively process data structures, performing necessary type

63

conversions to values in data to allow for RPC serialization:

64

-convert datetimes to strings

showard

2b9a88b

2008-06-13 20:55:03 +0000

[diff] [blame]

65

-convert tuples and sets to lists

jadmanski

2008-06-06 21:10:57 +0000

[diff] [blame]

66

"""

67

if isinstance(data, dict):

68

new_data = {}

69

for key, value in data.iteritems():

70

new_data[key] = _prepare_data(value)

71

return new_data

showard

2b9a88b

2008-06-13 20:55:03 +0000

[diff] [blame]

72

elif (isinstance(data, list) or isinstance(data, tuple) or

73

isinstance(data, set)):

jadmanski

2008-06-06 21:10:57 +0000

[diff] [blame]

74

return [_prepare_data(item) for item in data]

showard

9865997

2008-07-17 17:00:07 +0000

[diff] [blame]

75

elif isinstance(data, datetime.date):

showard

a62866b

2008-07-28 21:27:41 +0000

[diff] [blame]

76

if data is NULL_DATETIME or data is NULL_DATE:

77

return None

jadmanski

2008-06-06 21:10:57 +0000

[diff] [blame]

78

return str(data)

79

else:

80

return data

mbligh

2008-02-15 16:48:40 +0000

[diff] [blame]

81

82

Moises Osorio

2dda22e

2014-09-16 15:56:24 -0700

[diff] [blame]

83

def fetchall_as_list_of_dicts(cursor):
    """
    Converts each row in the cursor to a dictionary so that values can be read
    by using the column name.

    @param cursor: The database cursor to read from. Its description
            attribute and fetchall() method are used.

    @returns: A list of each row in the cursor as a dictionary.
    """
    description = cursor.description
    rows = cursor.fetchall()
    if not rows:
        # As before, the description is never inspected when there are no
        # rows to convert.
        return []
    # The column names are the same for every row, so build the list once
    # rather than once per row.
    column_names = [column[0] for column in description]
    return [dict(zip(column_names, row)) for row in rows]

93

94

showard

3d6ae11

2009-05-02 00:45:48 +0000

[diff] [blame]

95

def raw_http_response(response_data, content_type=None):
    """
    Wrap response_data in a django.http.HttpResponse.

    @param response_data: the body handed to HttpResponse.
    @param content_type: handed to HttpResponse as its mimetype argument.

    @returns The HttpResponse, with its Content-length header set to the
            length of the response content.
    """
    http_response = django.http.HttpResponse(response_data,
                                             mimetype=content_type)
    content_length = len(http_response.content)
    http_response['Content-length'] = str(content_length)
    return http_response

showard

2008-06-06 18:08:02 +0000

[diff] [blame]

101

def gather_unique_dicts(dict_iterable):
    """\
    Pick out unique objects (by ID) from an iterable of object dicts.

    @param dict_iterable: iterable of dicts, each with an 'id' key.

    @returns A list holding, in order, the first dict seen for each id.
    """
    seen_ids = set()
    unique_dicts = []
    for entry in dict_iterable:
        entry_id = entry['id']
        if entry_id in seen_ids:
            continue
        seen_ids.add(entry_id)
        unique_dicts.append(entry)
    return unique_dicts

showard

b0dfb9f

2008-06-06 18:08:02 +0000

[diff] [blame]

112

113

Jiaxi Luo

15cbf37

2014-07-01 19:20:20 -0700

[diff] [blame]

114

def extra_job_status_filters(not_yet_run=False, running=False, finished=False):
    """\
    Generate a SQL WHERE clause for job status filtering, and return it in
    a dict of keyword args to pass to query.extra().  No more than one of
    the parameters should be passed as True.
    * not_yet_run: all HQEs are Queued
    * finished: all HQEs are complete
    * running: everything else

    @returns {'where': [clause]} for the requested filter, or {} when no
            filter was requested.
    """
    requested = [flag for flag in (not_yet_run, running, finished) if flag]
    assert len(requested) <= 1, ('Cannot specify more than one '
                                 'filter to this function')

    # Subqueries selecting the ids of jobs having at least one HQE that is
    # not Queued / not complete.
    jobs_with_non_queued_hqe = (
            '(SELECT job_id FROM afe_host_queue_entries '
            'WHERE status != "%s")'
            % models.HostQueueEntry.Status.QUEUED)
    jobs_with_incomplete_hqe = (
            '(SELECT job_id FROM afe_host_queue_entries '
            'WHERE not complete)')

    if not_yet_run:
        clause = 'id NOT IN ' + jobs_with_non_queued_hqe
    elif running:
        clause = '(id IN %s) AND (id IN %s)' % (jobs_with_non_queued_hqe,
                                                jobs_with_incomplete_hqe)
    elif finished:
        clause = 'id NOT IN ' + jobs_with_incomplete_hqe
    else:
        return {}
    return {'where': [clause]}

mbligh

2008-02-15 16:48:40 +0000

[diff] [blame]

143

144

Jiaxi Luo

15cbf37

2014-07-01 19:20:20 -0700

[diff] [blame]

145

def extra_job_type_filters(extra_args, suite=False,
                           sub=False, standalone=False):
    """\
    Generate a SQL WHERE clause for job type filtering, and add it to a
    dict of keyword args to pass to query.extra().

    @param extra_args: a dict of existing extra_args. It is modified in
            place: the clause is appended to its 'where' list, which is
            created if missing.

    No more than one of the parameters should be passed as True:
    * suite: job which is parent of other jobs
    * sub: job with a parent job
    * standalone: job with no child or parent jobs

    @returns extra_args (the same dict), unchanged when no filter was
            requested.
    """
    requested = [flag for flag in (suite, sub, standalone) if flag]
    assert len(requested) <= 1, ('Cannot specify more than one '
                                 'filter to this function')

    where = extra_args.get('where', [])
    if not requested:
        return extra_args

    # %s is the column selected from the jobs that have a parent.
    jobs_with_parent = ('(SELECT %s FROM afe_jobs '
                        'WHERE parent_job_id IS NOT NULL)')
    if suite:
        clause = 'id IN ' + jobs_with_parent % 'DISTINCT parent_job_id'
    elif sub:
        clause = 'id IN ' + jobs_with_parent % 'id'
    else:
        clause = ('NOT EXISTS (SELECT 1 from afe_jobs AS sub_query '
                  'WHERE parent_job_id IS NOT NULL'
                  ' AND (sub_query.parent_job_id=afe_jobs.id'
                  ' OR sub_query.id=afe_jobs.id))')

    where.append(clause)
    extra_args['where'] = where
    return extra_args

showard

2009-08-20 23:37:04 +0000

[diff] [blame]

186

def extra_host_filters(multiple_labels=()):
    """\
    Generate SQL WHERE clauses for matching hosts in an intersection of
    labels.

    @param multiple_labels: the labels to match; each is resolved with
            models.Label.smart_get.

    @returns A dict with 'where' (one clause per label) and 'params' (the
            corresponding label ids), for use as query.extra() arguments.
    """
    label_clause = ('afe_hosts.id in (select host_id from afe_hosts_labels '
                    'where label_id=%s)')
    where_clauses = [label_clause] * len(multiple_labels)
    label_ids = [models.Label.smart_get(label).id
                 for label in multiple_labels]
    return {'where': where_clauses, 'params': label_ids}

showard

8e3aa5e

2008-04-08 19:42:32 +0000

[diff] [blame]

198

199

showard

2009-08-20 23:37:04 +0000

[diff] [blame]

200

def get_host_query(multiple_labels, exclude_only_if_needed_labels,
                   exclude_atomic_group_hosts, valid_only, filter_data):
    """
    Build a host query from label requirements, exclusions and filters.

    @param multiple_labels: labels passed to extra_host_filters.
    @param exclude_only_if_needed_labels: if true, exclude hosts carrying
            any valid label with only_if_needed set.
    @param exclude_atomic_group_hosts: if true, exclude hosts carrying any
            valid label that has an atomic group.
    @param valid_only: if true, start from models.Host.valid_objects
            instead of models.Host.objects.
    @param filter_data: dict passed to models.Host.query_objects. It must
            not contain 'extra_args'; that key is added to it here.

    @returns The resulting query, or an empty query when
            models.Label.DoesNotExist is raised while building it.
    """
    if valid_only:
        host_query = models.Host.valid_objects.all()
    else:
        host_query = models.Host.objects.all()

    if exclude_only_if_needed_labels:
        oin_labels = models.Label.valid_objects.filter(only_if_needed=True)
        if oin_labels.count() > 0:
            oin_label_ids = ','.join(
                    str(row['id']) for row in oin_labels.values('id'))
            oin_condition = ('afe_hosts_labels_exclude_OIN.label_id IN (%s)'
                             % oin_label_ids)
            host_query = models.Host.objects.add_join(
                    host_query, 'afe_hosts_labels', join_key='host_id',
                    join_condition=oin_condition,
                    suffix='_exclude_OIN', exclude=True)

    if exclude_atomic_group_hosts:
        ag_labels = models.Label.valid_objects.filter(
                atomic_group__isnull=False)
        if ag_labels.count() > 0:
            ag_label_ids = ','.join(
                    str(row['id']) for row in ag_labels.values('id'))
            ag_condition = ('afe_hosts_labels_exclude_AG.label_id IN (%s)'
                            % ag_label_ids)
            host_query = models.Host.objects.add_join(
                    host_query, 'afe_hosts_labels', join_key='host_id',
                    join_condition=ag_condition,
                    suffix='_exclude_AG', exclude=True)

    try:
        assert 'extra_args' not in filter_data
        filter_data['extra_args'] = extra_host_filters(multiple_labels)
        return models.Host.query_objects(filter_data,
                                         initial_query=host_query)
    except models.Label.DoesNotExist:
        # A required label could not be found, so no host can match.
        return models.Host.objects.none()

showard

43a3d26

2008-11-12 18:17:05 +0000

[diff] [blame]

239

240

showard

2008-03-10 21:29:07 +0000

[diff] [blame]

241

class InconsistencyException(Exception):
    """
    Raised when a list of objects does not have a consistent value.

    get_consistent_value() raises it with two arguments: the first object of
    the list and the object whose value differs from it.
    """

showard

2008-03-10 21:29:07 +0000

[diff] [blame]

243

244

245

def get_consistent_value(objects, field):
    """
    Return the value of an attribute that all given objects agree on.

    @param objects: indexable sequence of objects.
    @param field: name of the attribute to compare.

    @returns The common value, or None when objects is empty.

    @raises InconsistencyException: with the first object and the first
            object whose value differs from it.
    """
    if not objects:
        # well a list of nothing is consistent
        return None

    reference = objects[0]
    expected = getattr(reference, field)
    for candidate in objects:
        if getattr(candidate, field) != expected:
            raise InconsistencyException(reference, candidate)
    return expected

showard

2008-03-10 21:29:07 +0000

[diff] [blame]

256

257

Matthew Sartori

1043809

2015-06-24 14:30:18 -0700

[diff] [blame]

258

def afe_test_dict_to_test_object(test_dict):
    """
    Turn a dict describing a test into a class exposing it as attributes.

    Values that int() accepts are stored as ints; values for which int()
    raises ValueError or TypeError are stored unchanged.

    @param test_dict: dict mapping attribute names to values. Anything that
            is not a dict is returned as is.

    @returns A new class named 'TestObject' (the class itself, not an
            instance) whose class attributes are the converted dict entries.
    """
    if not isinstance(test_dict, dict):
        return test_dict

    def _int_if_possible(value):
        try:
            return int(value)
        except (ValueError, TypeError):
            return value

    attributes = dict((key, _int_if_possible(value))
                      for key, value in test_dict.items())
    return type('TestObject', (object,), attributes)

270

271

272

def prepare_generate_control_file(tests, kernel, label, profilers,
                                  db_tests=True):
    """
    Resolve the objects and summary information needed to generate a
    control file.

    @param tests: the tests to run. With db_tests each is resolved with
            models.Test.smart_get; otherwise each is passed through
            afe_test_dict_to_test_object.
    @param kernel: not used by this function.
    @param label: if true, resolved with models.Label.smart_get.
    @param profilers: each is resolved with models.Profiler.smart_get.
    @param db_tests: whether tests refer to database tests (see tests).

    @returns (cf_info, test_objects, profiler_objects, label), where cf_info
            is a dict with the keys is_server, synch_count and dependencies.

    @raises model_logic.ValidationError: if the tests do not all have the
            same test_type.
    """
    if db_tests:
        test_objects = [models.Test.smart_get(test) for test in tests]
    else:
        test_objects = [afe_test_dict_to_test_object(test) for test in tests]

    profiler_objects = [models.Profiler.smart_get(profiler)
                        for profiler in profilers]
    # ensure tests are all the same type
    try:
        test_type = get_consistent_value(test_objects, 'test_type')
    except InconsistencyException as exc:
        test1, test2 = exc.args
        raise model_logic.ValidationError(
            {'tests' : 'You cannot run both test_suites and server-side '
             'tests together (tests %s and %s differ' % (
             test1.name, test2.name)})

    is_server = (test_type == control_data.CONTROL_TYPE.SERVER)
    if test_objects:
        synch_count = max(test.sync_count for test in test_objects)
    else:
        synch_count = 1
    if label:
        label = models.Label.smart_get(label)

    if db_tests:
        dependencies = set(
            dependency_label.name for dependency_label
            in models.Label.objects.filter(test__in=test_objects))
    else:
        # Accumulate into an explicit empty set: reduce(set.union, [...])
        # without an initial value raises TypeError when there are no tests.
        dependencies = set()
        for test in test_objects:
            dependencies.update(test.dependencies)

    cf_info = dict(is_server=is_server, synch_count=synch_count,
                   dependencies=list(dependencies))
    return cf_info, test_objects, profiler_objects, label

showard

2008-10-01 11:38:11 +0000

[diff] [blame]

309

310

311

def check_job_dependencies(host_objects, job_dependencies):
    """
    Check that a set of machines satisfies a job's dependencies.

    Dependencies for which provision.is_for_special_action() is true are
    not checked.

    @param host_objects: list of models.Host objects
    @param job_dependencies: list of names of labels

    @raises model_logic.ValidationError: if any of the hosts lacks one of
            the checked labels.
    """
    # check that hosts satisfy dependencies
    requested_ids = [host.id for host in host_objects]
    satisfying_hosts = models.Host.objects.filter(id__in=requested_ids)
    for dependency in job_dependencies:
        if provision.is_for_special_action(dependency):
            continue
        satisfying_hosts = satisfying_hosts.filter(labels__name=dependency)

    requested_names = set(host.hostname for host in host_objects)
    satisfying_names = set(host.hostname for host in satisfying_hosts)
    failing_hosts = requested_names - satisfying_names
    if not failing_hosts:
        return
    raise model_logic.ValidationError(
        {'hosts' : 'Host(s) failed to meet job dependencies (' +
                   (', '.join(job_dependencies)) + '): ' +
                   (', '.join(failing_hosts))})

331

showard

2008-10-01 11:38:11 +0000

[diff] [blame]

332

Alex Miller

2013-08-21 13:59:01 -0700

[diff] [blame]

333

def check_job_metahost_dependencies(metahost_objects, job_dependencies):
    """
    Check that at least one machine within the metahost spec satisfies the job's
    dependencies.

    Dependencies for which provision.is_for_special_action() is true are
    not checked.

    @param metahost_objects A list of label objects representing the metahosts.
    @param job_dependencies A list of strings of the required label names.
    @raises NoEligibleHostException If a metahost cannot run the job.
    """
    for metahost in metahost_objects:
        candidates = models.Host.objects.filter(labels=metahost)
        for label_name in job_dependencies:
            if provision.is_for_special_action(label_name):
                continue
            candidates = candidates.filter(labels__name=label_name)
        if any(candidates):
            continue
        raise error.NoEligibleHostException("No hosts within %s satisfy %s."
                % (metahost.name, ', '.join(job_dependencies)))

350

showard

2bab8f4

2008-11-12 18:15:22 +0000

[diff] [blame]

351

352

def _execution_key_for(host_queue_entry):

353

return (host_queue_entry.job.id, host_queue_entry.execution_subdir)

354

355

356

def check_abort_synchronous_jobs(host_queue_entries):
    """
    Reject an abort that covers only part of a synchronous job execution.

    Entries are grouped by (job id, execution subdir). Entries with an empty
    execution_subdir are not checked.

    @param host_queue_entries: the queue entries to be aborted; iterated
            twice.

    @raises model_logic.ValidationError: if, for some checked entry, fewer
            entries of its execution are included than its job's synch_count.
    """
    # ensure user isn't aborting part of a synchronous autoserv execution
    entries_per_execution = {}
    for entry in host_queue_entries:
        execution = _execution_key_for(entry)
        entries_per_execution[execution] = (
                entries_per_execution.get(execution, 0) + 1)

    for entry in host_queue_entries:
        if not entry.execution_subdir:
            continue
        included = entries_per_execution[_execution_key_for(entry)]
        if included >= entry.job.synch_count:
            continue
        raise model_logic.ValidationError(
            {'' : 'You cannot abort part of a synchronous job execution '
                  '(%d/%s), %d included, %d expected'
                  % (entry.job.id, entry.execution_subdir,
                     included, entry.job.synch_count)})

showard

8fbae65

2009-01-20 23:23:10 +0000

[diff] [blame]

374

375

showard

2009-04-07 18:14:34 +0000

[diff] [blame]

376

def check_atomic_group_create_job(synch_count, host_objects, metahost_objects,
                                  dependencies, atomic_group):
    """
    Attempt to reject create_job requests with an atomic group that
    will be impossible to schedule.  The checks are not perfect but
    should catch the most obvious issues.

    @param synch_count - The job's minimum synch count.
    @param host_objects - A list of models.Host instances.
    @param metahost_objects - A list of models.Label instances.
    @param dependencies - A list of job dependency label names.
    @param atomic_group - The atomic group requested for the job; its
            label_set and name are used.

    @raises model_logic.ValidationError - When an issue is found.
    """
    # If specific host objects were supplied with an atomic group, verify
    # that there are enough to satisfy the synch_count.
    minimum_required = synch_count or 1
    only_specific_hosts = host_objects and not metahost_objects
    if only_specific_hosts and len(host_objects) < minimum_required:
        raise model_logic.ValidationError(
                {'hosts':
                 'only %d hosts provided for job with synch_count = %d' %
                 (len(host_objects), synch_count)})

    # Check that the atomic group has a hope of running this job
    # given any supplied metahosts and dependencies that may limit.

    # Get a set of hostnames in the atomic group.
    possible_hosts = set()
    for group_label in atomic_group.label_set.all():
        possible_hosts.update(
                host.hostname for host in group_label.host_set.all())

    # Filter out hosts that don't match all of the job dependency labels.
    for dependency in models.Label.objects.filter(name__in=dependencies):
        possible_hosts.intersection_update(
                host.hostname for host in dependency.host_set.all())

    if not host_objects and not metahost_objects:
        # No hosts or metahosts are required to queue an atomic group Job.
        # However, if they are given, we respect them below.
        host_set = possible_hosts
    else:
        host_set = set(host.hostname for host in host_objects)
        unusable_host_set = host_set.difference(possible_hosts)
        if unusable_host_set:
            raise model_logic.ValidationError(
                {'hosts': 'Hosts "%s" are not in Atomic Group "%s"' %
                 (', '.join(sorted(unusable_host_set)), atomic_group.name)})

    # Lookup hosts provided by each meta host and merge them into the
    # host_set for final counting.
    for meta_host in metahost_objects:
        hosts_in_meta_host = (host.hostname
                              for host in meta_host.host_set.all())
        # Count all hosts that this meta_host will provide.
        host_set.update(possible_hosts.intersection(hosts_in_meta_host))

    if len(host_set) < minimum_required:
        raise model_logic.ValidationError(
                {'atomic_group_name':
                 'Insufficient hosts in Atomic Group "%s" with the'
                 ' supplied dependencies and meta_hosts.' %
                 (atomic_group.name,)})

443

444

showard

be0d869

2009-08-20 23:42:44 +0000

[diff] [blame]

445

def check_modify_host(update_data):
    """
    Sanity check modify_host* requests.

    @param update_data: A dictionary with the changes to make to a host
            or hosts.

    @raises model_logic.ValidationError: if update_data contains 'status'.
    """
    if 'status' not in update_data:
        return
    # Only the scheduler (monitor_db) is allowed to modify Host status.
    # Otherwise race conditions happen as a hosts state is changed out from
    # beneath tasks being run on a host.
    raise model_logic.ValidationError({
            'status': 'Host status can not be modified by the frontend.'})

458

459

showard

ce7c092

2009-09-11 18:39:24 +0000

[diff] [blame]

460

def check_modify_host_locking(host, update_data):
    """
    Checks when locking/unlocking has been requested if the host is already
    locked/unlocked.

    Nothing is checked when update_data has no 'locked' entry (or it is
    None).

    @param host: models.Host object to be modified
    @param update_data: A dictionary with the changes to make to the host.

    @raises model_logic.ValidationError: if the host is already in the
            requested state, or if a lock is requested without a
            'lock_reason'.
    """
    lock_requested = update_data.get('locked', None)
    reason = update_data.get('lock_reason', None)
    if lock_requested is None:
        return

    if lock_requested:
        if host.locked:
            raise model_logic.ValidationError({
                    'locked': 'Host already locked by %s on %s.' %
                    (host.locked_by, host.lock_time)})
        # The host is known to be unlocked here, so only the reason is left
        # to check.
        if not reason:
            raise model_logic.ValidationError({
                    'locked': 'Please provide a reason for locking'})
    elif not host.locked:
        raise model_logic.ValidationError({
                'locked': 'Host already unlocked.'})

showard

ce7c092

2009-09-11 18:39:24 +0000

[diff] [blame]

481

482

showard

8fbae65

2009-01-20 23:23:10 +0000

[diff] [blame]

483

def get_motd():
    """
    Return the message of the day.

    The text is read from the file motd.txt located two directories above
    the directory containing this module.

    @returns The contents of the file, or '' if it cannot be opened or read.
    """
    dirname = os.path.dirname(__file__)
    filename = os.path.join(dirname, "..", "..", "motd.txt")
    try:
        with open(filename, "r") as motd_file:
            return motd_file.read()
    except EnvironmentError:
        # Best effort: a missing or unreadable file yields an empty message.
        # Only I/O errors are swallowed, so KeyboardInterrupt and SystemExit
        # still propagate.
        return ''

showard

2009-04-29 21:16:24 +0000

[diff] [blame]

497

498

499

def _get_metahost_counts(metahost_objects):

500

metahost_counts = {}

501

for metahost in metahost_objects:

502

metahost_counts.setdefault(metahost, 0)

503

metahost_counts[metahost] += 1

504

return metahost_counts

505

506

showard

a965cef

2009-05-15 23:17:41 +0000

[diff] [blame]

507

def get_job_info(job, preserve_metahosts=False, queue_entry_filter_data=None):
    """
    Collect the hosts, metahosts and related settings a job was queued with.

    @param job: the job to inspect; its hostqueueentry_set,
            dependency_labels and id are used.
    @param preserve_metahosts: if true, an entry that has both a host and a
            metahost is reported by its host rather than by its metahost.
    @param queue_entry_filter_data: optional filter data applied to the
            job's queue entries through models.HostQueueEntry.query_objects.

    @returns A dict with the keys dependencies, hosts, meta_hosts,
            meta_host_counts, one_time_hosts, atomic_group and hostless.
    """
    hosts = []
    one_time_hosts = []
    meta_hosts = []
    atomic_group = None
    hostless = False

    queue_entries = job.hostqueueentry_set.all()
    if queue_entry_filter_data:
        queue_entries = models.HostQueueEntry.query_objects(
            queue_entry_filter_data, initial_query=queue_entries)

    for queue_entry in queue_entries:
        if (queue_entry.host and (preserve_metahosts or
                                  not queue_entry.meta_host)):
            if queue_entry.deleted:
                continue
            # Hosts flagged invalid are reported as one-time hosts.
            if queue_entry.host.invalid:
                one_time_hosts.append(queue_entry.host)
            else:
                hosts.append(queue_entry.host)
        elif queue_entry.meta_host:
            meta_hosts.append(queue_entry.meta_host)
        else:
            hostless = True

        if atomic_group is None:
            if queue_entry.atomic_group is not None:
                atomic_group = queue_entry.atomic_group
        else:
            # NOTE(review): an entry without an atomic group following one
            # with an atomic group fails here with AttributeError rather
            # than with this message -- confirm whether that can occur.
            assert atomic_group.name == queue_entry.atomic_group.name, (
                    'DB inconsistency. HostQueueEntries with multiple atomic'
                    ' groups on job %s: %s != %s' % (
                        job.id, atomic_group.name,
                        queue_entry.atomic_group.name))

    meta_host_counts = _get_metahost_counts(meta_hosts)

    info = dict(dependencies=[label.name for label
                              in job.dependency_labels.all()],
                hosts=hosts,
                meta_hosts=meta_hosts,
                meta_host_counts=meta_host_counts,
                one_time_hosts=one_time_hosts,
                atomic_group=atomic_group,
                hostless=hostless)
    return info

showard

2009-11-19 01:01:19 +0000

[diff] [blame]

555

def check_for_duplicate_hosts(host_objects):
    """
    Reject a host list in which the same host id occurs more than once.

    @param host_objects: iterable of objects with id and hostname.

    @raises model_logic.ValidationError: naming the hostnames of the
            repeated hosts.
    """
    seen_ids = set()
    duplicate_hostnames = set()
    for host in host_objects:
        if host.id in seen_ids:
            duplicate_hostnames.add(host.hostname)
        else:
            seen_ids.add(host.id)

    if not duplicate_hostnames:
        return
    raise model_logic.ValidationError(
            {'hosts' : 'Duplicate hosts: %s'
             % ', '.join(duplicate_hostnames)})

567

568

showard

2009-05-12 17:32:04 +0000

[diff] [blame]

569

def create_new_job(owner, options, host_objects, metahost_objects,
                   atomic_group=None):
    """
    Validate a job request, then create and queue the job.

    @param owner: passed to models.Job.create as the job owner.
    @param options: dict of job options. 'dependencies' (label names),
            'synch_count' and 'is_template' are read here. The dict is
            modified in place: 'dependencies' is replaced by the list of
            matching models.Label objects before the job is created.
    @param host_objects: list of hosts to run on.
    @param metahost_objects: list of labels acting as metahosts.
    @param atomic_group: the atomic group for the job, if any.

    @returns The id of the new job.

    @raises model_logic.ValidationError: if one of the checks below fails.
            The helper checks called here may raise as well.
    """
    all_host_objects = host_objects + metahost_objects
    dependencies = options.get('dependencies', [])
    synch_count = options.get('synch_count')

    if atomic_group:
        check_atomic_group_create_job(
                synch_count, host_objects, metahost_objects,
                dependencies, atomic_group)
    else:
        if synch_count is not None and synch_count > len(all_host_objects):
            raise model_logic.ValidationError(
                    {'hosts':
                     'only %d hosts provided for job with synch_count = %d' %
                     (len(all_host_objects), synch_count)})
        atomic_hosts = models.Host.objects.filter(
                id__in=[host.id for host in host_objects],
                labels__atomic_group=True)
        unusable_host_names = [host.hostname for host in atomic_hosts]
        if unusable_host_names:
            raise model_logic.ValidationError(
                    {'hosts':
                     'Host(s) "%s" are atomic group hosts but no '
                     'atomic group was specified for this job.' %
                     (', '.join(unusable_host_names),)})

    check_for_duplicate_hosts(host_objects)

    for label_name in dependencies:
        if provision.is_for_special_action(label_name):
            # TODO: We could save a few queries
            # if we had a bulk ensure-label-exists function, which used
            # a bulk .get() call. The win is probably very small.
            _ensure_label_exists(label_name)

    # This only checks targeted hosts, not hosts eligible due to the metahost
    check_job_dependencies(host_objects, dependencies)
    check_job_metahost_dependencies(metahost_objects, dependencies)

    options['dependencies'] = list(
            models.Label.objects.filter(name__in=dependencies))

    for label in metahost_objects + options['dependencies']:
        if not label.atomic_group:
            continue
        if not atomic_group:
            raise model_logic.ValidationError(
                    {'atomic_group_name':
                     'Dependency %r requires an atomic group but no '
                     'atomic_group_name or meta_host in an atomic group was '
                     'specified for this job.' % label.name})
        if label.atomic_group.name != atomic_group.name:
            raise model_logic.ValidationError(
                    {'atomic_group_name':
                     'meta_hosts or dependency %r requires atomic group '
                     '%r instead of the supplied atomic_group_name=%r.' %
                     (label.name, label.atomic_group.name, atomic_group.name)})

    job = models.Job.create(owner=owner, options=options,
                            hosts=all_host_objects)
    job.queue(all_host_objects, atomic_group=atomic_group,
              is_template=options.get('is_template', False))
    return job.id

showard

0957a84

2009-05-11 19:25:08 +0000

[diff] [blame]

633

634

Aviv Keshet

2013-07-31 16:13:01 -0700

[diff] [blame]

635

def _ensure_label_exists(name):
    """
    Make sure a label called |name| is present in the Django models.

    Meant to be used from within afe rpcs only, in place of
    server.cros.provision.ensure_label_exists(...). The label is looked up
    and, when missing, created by manipulating the Django models directly
    instead of issuing another create_label rpc call.

    @param name: the label to check for/create.

    @returns True if a label was created, False if it already existed.
    """
    label_manager = models.Label.objects
    try:
        label_manager.get(name=name)
    except models.Label.DoesNotExist:
        created_label = label_manager.create(name=name)
        created_label.save()
        return True
    else:
        return False

showard

2009-07-07 20:54:42 +0000

[diff] [blame]

658

def find_platform_and_atomic_group(host):
    """
    Work out the platform name and the atomic group name of a host.

    @param host: host object; its `label_list` is scanned and each label's
            `name`, `platform` and `atomic_group` attributes are read.

    @raises ValueError: if more than one label of the host is a platform.

    @returns (platform name, atomic group name) for the given host. Either
            element is None when the host has no matching label.
    """
    platform_names = []
    for label in host.label_list:
        if label.platform:
            platform_names.append(label.name)

    if len(platform_names) > 1:
        raise ValueError('Host %s has more than one platform: %s' %
                         (host.hostname, ', '.join(platform_names)))
    platform = platform_names[0] if platform_names else None

    # Don't check for multiple atomic groups on a host here. That is an
    # error but should not trip up the RPC interface. monitor_db_cleanup
    # deals with it. This just returns the first one found.
    atomic_group_name = None
    for label in host.label_list:
        if label.atomic_group:
            atomic_group_name = label.atomic_group.name
            break
    return platform, atomic_group_name

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

683

684

685

# support for get_host_queue_entries_and_special_tasks()

686

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

687

def _common_entry_to_dict(entry, type, job_dict, exec_path, status, started_on):

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

688

return dict(type=type,

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

689

host=entry['host'],

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

690

job=job_dict,

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

691

execution_path=exec_path,

692

status=status,

693

started_on=started_on,

694

id=str(entry['id']) + type,

695

oid=entry['id'])

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

696

697

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

698

def _special_task_to_dict(task, queue_entries):
    """Convert a special task dictionary into the common entry dictionary.

    @param task Special task as a dictionary type
    @param queue_entries Host queue entries as a list of dictionaries; used
            to look up the job detail of the task's queue entry.

    @return Transformed dictionary for a special task.
    """
    job_dict = None
    task_hqe = task['queue_entry']
    if task_hqe:
        # Prefer the job detail carried by the matching host queue entry.
        matching_jobs = (hqe['job'] for hqe in queue_entries
                         if task_hqe['id'] == hqe['id'])
        job_dict = next(matching_jobs, None)
        # If not found, get it from DB.
        if job_dict is None:
            job_dict = models.Job.objects.get(
                    id=task_hqe['job']).get_object_dict()

    exec_path = server_utils.get_special_task_exec_path(
            task['host']['hostname'], task['id'], task['task'],
            time_utils.time_string_to_datetime(task['time_requested']))
    status = server_utils.get_special_task_status(
            task['is_complete'], task['success'], task['is_active'])
    return _common_entry_to_dict(task, task['task'], job_dict,
                                 exec_path, status, task['time_started'])

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

725

726

727

def _queue_entry_to_dict(queue_entry):
    """Convert a host queue entry dictionary into the common entry dictionary.

    @param queue_entry Host queue entry as a dictionary; its 'job',
            'execution_subdir', 'status' and 'started_on' keys are read.

    @return Transformed dictionary for a host queue entry, typed 'Job'.
    """
    job = queue_entry['job']
    job_tag = server_utils.get_job_tag(job['id'], job['owner'])
    return _common_entry_to_dict(
            queue_entry, 'Job', job,
            server_utils.get_hqe_exec_path(job_tag,
                                           queue_entry['execution_subdir']),
            queue_entry['status'], queue_entry['started_on'])

734

735

736

def prepare_host_queue_entries_and_special_tasks(interleaved_entries,
                                                 queue_entries):
    """
    Post-process interleaved host queue entries and special tasks so that
    they can be serialized.

    Every element of interleaved_entries is a dictionary. A special task
    dictionary only carries the id of its job, whereas a host queue entry
    dictionary carries the job detail, so queue_entries is used to look up
    the job detail for special tasks.

    @param interleaved_entries Host queue entries and special tasks as a list
                               of dictionaries.
    @param queue_entries Host queue entries as a list of dictionaries.

    @return A post-processed list of dictionaries that is to be serialized.
    """
    # The two kinds of entries are told apart by the key "task": only special
    # task dictionaries have it.
    converted = [
        _special_task_to_dict(entry, queue_entries) if 'task' in entry
        else _queue_entry_to_dict(entry)
        for entry in interleaved_entries]
    return prepare_for_serialization(converted)

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

762

763

764

def _compute_next_job_for_tasks(queue_entries, special_tasks):

765

"""

766

For each task, try to figure out the next job that ran after that task.

767

This is done using two pieces of information:

768

* if the task has a queue entry, we can use that entry's job ID.

769

* if the task has a time_started, we can try to compare that against the

770

started_on field of queue_entries. this isn't guaranteed to work perfectly

771

since queue_entries may also have null started_on values.

772

* if the task has neither, or if use of time_started fails, just use the

773

last computed job ID.

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

774

775

@param queue_entries Host queue entries as a list of dictionaries.

776

@param special_tasks Special tasks as a list of dictionaries.

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

777

"""

778

next_job_id = None # most recently computed next job

779

hqe_index = 0 # index for scanning by started_on times

780

for task in special_tasks:

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

781

if task['queue_entry']:

782

next_job_id = task['queue_entry']['job']

783

elif task['time_started'] is not None:

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

784

for queue_entry in queue_entries[hqe_index:]:

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

785

if queue_entry['started_on'] is None:

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

786

continue

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

787

t1 = time_utils.time_string_to_datetime(

788

queue_entry['started_on'])

789

t2 = time_utils.time_string_to_datetime(task['time_started'])

790

if t1 < t2:

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

791

break

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

792

next_job_id = queue_entry['job']['id']

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

793

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

794

task['next_job_id'] = next_job_id

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

795

796

# advance hqe_index to just after next_job_id

797

if next_job_id is not None:

798

for queue_entry in queue_entries[hqe_index:]:

MK Ryu

2015-04-30 12:00:55 -0700

[diff] [blame]

799

if queue_entry['job']['id'] < next_job_id:

showard

2009-07-08 21:14:45 +0000

[diff] [blame]

break

hqe_index += 1

def interleave_entries(queue_entries, special_tasks):
    """
    Merge host queue entries and special tasks into one list.

    Both lists should be ordered by descending ID. Each task is first tagged
    with its 'next_job_id' by _compute_next_job_for_tasks().

    @param queue_entries Host queue entries as a list of dictionaries.
    @param special_tasks Special tasks as a list of dictionaries.

    @return List containing every queue entry and the interleaved tasks.
    """
    _compute_next_job_for_tasks(queue_entries, special_tasks)

    # start with all special tasks that've run since the last job
    merged = []
    for task in special_tasks:
        if task['next_job_id'] is not None:
            break
        merged.append(task)

    # now interleave queue entries with the remaining special tasks
    next_task = len(merged)
    task_count = len(special_tasks)
    for hqe in queue_entries:
        merged.append(hqe)
        # add all tasks that ran between this job and the previous one
        while (next_task < task_count and
               not special_tasks[next_task]['next_job_id'] < hqe['job']['id']):
            merged.append(special_tasks[next_task])
            next_task += 1

    return merged

jamesren

2010-07-16 22:33:48 +0000

[diff] [blame]

829

830

Prashanth Balasubramanian

6edaaf9

2014-11-24 16:36:25 -0800

[diff] [blame]

831

def bucket_hosts_by_shard(host_objs, rpc_hostnames=False):
    """Group the hostnames of the given hosts by the shard they are on.

    Hosts without a shard are left out of the result.

    @param host_objs: A list of host objects.
    @param rpc_hostnames: If True, the map is keyed by each shard's
            rpc_hostname() instead of the 'real' shard hostname. This only
            matters for testing environments.

    @return: A map of shard hostname: list of hosts on the shard.
    """
    hostnames_by_shard = {}
    for host_obj in host_objs:
        if not host_obj.shard:
            continue
        if rpc_hostnames:
            shard_key = host_obj.shard.rpc_hostname()
        else:
            shard_key = host_obj.shard.hostname
        if shard_key not in hostnames_by_shard:
            hostnames_by_shard[shard_key] = []
        hostnames_by_shard[shard_key].append(host_obj.hostname)
    return hostnames_by_shard

848

849

jamesren

2010-07-16 22:33:48 +0000

[diff] [blame]

850

def get_create_job_common_args(local_args):
    """
    Pick out of local_args the arguments accepted by create_job_common().

    Note that a string 'priority' in local_args is replaced in place by
    priorities.Priority.DEFAULT before the subset is built.

    @param local_args: Dictionary of argument name: value; must contain
            'priority'.

    @returns a new dict holding only the entries of local_args whose key is
            an argument name of create_job_common().
    """
    # This code is only here to not kill suites scheduling tests when priority
    # becomes an int instead of a string.
    if isinstance(local_args['priority'], str):
        local_args['priority'] = priorities.Priority.DEFAULT
    # </migration hack>
    accepted_names = inspect.getargspec(create_job_common)[0]
    common_args = {}
    for arg_name, arg_value in local_args.iteritems():
        if arg_name in accepted_names:
            common_args[arg_name] = arg_value
    return common_args

864

865

866

def create_job_common(name, priority, control_type, control_file=None,
                      hosts=(), meta_hosts=(), one_time_hosts=(),
                      atomic_group_name=None, synch_count=None,
                      is_template=False, timeout=None, timeout_mins=None,
                      max_runtime_mins=None, run_verify=True, email_list='',
                      dependencies=(), reboot_before=None, reboot_after=None,
                      parse_failed_repair=None, hostless=False, keyvals=None,
                      drone_set=None, parameterized_job=None,
                      parent_job_id=None, test_retry=0, run_reset=True,
                      require_ssp=None):
    #pylint: disable-msg=C0111
    """
    Common code between creating "standard" jobs and creating parameterized jobs

    Validates the host-related arguments, resolves hostnames, meta host
    labels and the atomic group into model objects, and hands everything to
    create_new_job() with the current user as owner.

    @param hosts: Hosts to run on, resolved with models.Host.smart_get_bulk.
    @param meta_hosts: Label names; a name that is not a label but matches an
            atomic group name selects that atomic group instead.
    @param one_time_hosts: Hosts created through
            models.Host.create_one_time_host; not allowed together with an
            atomic group.
    @param atomic_group_name: Atomic group to schedule on. When empty it is
            taken from the first meta host label that has an atomic group.
    @param hostless: If True, no hosts of any kind may be given and
            control_type must be the server control type.
    All remaining arguments are passed through unchanged in the options
    dictionary given to create_new_job().

    @raises model_logic.ValidationError: if the arguments are inconsistent
            (see the individual checks below).
    @raises ValueError: on a non-shard, if the hosts span several shards or
            a shard and the master.

    @returns the return value of create_new_job().
    """
    user = models.User.current_user()
    owner = user.login

    # input validation
    if not (hosts or meta_hosts or one_time_hosts or atomic_group_name
            or hostless):
        raise model_logic.ValidationError({
            'arguments' : "You must pass at least one of 'hosts', "
                          "'meta_hosts', 'one_time_hosts', "
                          "'atomic_group_name', or 'hostless'"
            })

    if hostless:
        if hosts or meta_hosts or one_time_hosts or atomic_group_name:
            raise model_logic.ValidationError({
                    'hostless': 'Hostless jobs cannot include any hosts!'})
        server_type = control_data.CONTROL_TYPE_NAMES.SERVER
        if control_type != server_type:
            raise model_logic.ValidationError({
                    'control_type': 'Hostless jobs cannot use client-side '
                                    'control files'})

    atomic_groups_by_name = dict((ag.name, ag)
                                 for ag in models.AtomicGroup.objects.all())
    label_objects = list(models.Label.objects.filter(name__in=meta_hosts))

    # Schedule on an atomic group automagically if one of the labels given
    # is an atomic group label and no explicit atomic_group_name was supplied.
    if not atomic_group_name:
        for label in label_objects:
            if label and label.atomic_group:
                atomic_group_name = label.atomic_group.name
                break
    # convert hostnames & meta hosts to host/label objects
    host_objects = models.Host.smart_get_bulk(hosts)
    # The shard-spanning check below is skipped when running on a shard.
    if not server_utils.is_shard():
        shard_host_map = bucket_hosts_by_shard(host_objects)
        num_shards = len(shard_host_map)
        if (num_shards > 1 or (num_shards == 1 and
                len(shard_host_map.values()[0]) != len(host_objects))):
            # We disallow the following jobs on master:
            #   num_shards > 1: this is a job spanning across multiple shards.
            #   num_shards == 1 but number of hosts on shard is less
            #   than total number of hosts: this is a job that spans across
            #   one shard and the master.
            raise ValueError(
                    'The following hosts are on shard(s), please create '
                    'seperate jobs for hosts on each shard: %s ' %
                    shard_host_map)
    metahost_objects = []
    meta_host_labels_by_name = {label.name: label for label in label_objects}
    # Walk meta_hosts itself (not label_objects) so that repeated names and
    # their order are kept, and names that matched no label are noticed.
    for label_name in meta_hosts or []:
        if label_name in meta_host_labels_by_name:
            metahost_objects.append(meta_host_labels_by_name[label_name])
        elif label_name in atomic_groups_by_name:
            # If given a metahost name that isn't a Label, check to
            # see if the user was specifying an Atomic Group instead.
            atomic_group = atomic_groups_by_name[label_name]
            if atomic_group_name and atomic_group_name != atomic_group.name:
                raise model_logic.ValidationError({
                        'meta_hosts': (
                                'Label "%s" not found. If assumed to be an '
                                'atomic group it would conflict with the '
                                'supplied atomic group "%s".' % (
                                        label_name, atomic_group_name))})
            atomic_group_name = atomic_group.name
        else:
            raise model_logic.ValidationError(
                {'meta_hosts' : 'Label "%s" not found' % label_name})

    # Create and sanity check an AtomicGroup object if requested.
    if atomic_group_name:
        if one_time_hosts:
            raise model_logic.ValidationError(
                    {'one_time_hosts':
                     'One time hosts cannot be used with an Atomic Group.'})
        atomic_group = models.AtomicGroup.smart_get(atomic_group_name)
        if synch_count and synch_count > atomic_group.max_number_of_machines:
            raise model_logic.ValidationError(
                    {'atomic_group_name' :
                     'You have requested a synch_count (%d) greater than the '
                     'maximum machines in the requested Atomic Group (%d).' %
                     (synch_count, atomic_group.max_number_of_machines)})
    else:
        atomic_group = None

    # One time hosts are created here and scheduled like the regular hosts.
    for host in one_time_hosts or []:
        this_host = models.Host.create_one_time_host(host)
        host_objects.append(this_host)

    options = dict(name=name,
                   priority=priority,
                   control_file=control_file,
                   control_type=control_type,
                   is_template=is_template,
                   timeout=timeout,
                   timeout_mins=timeout_mins,
                   max_runtime_mins=max_runtime_mins,
                   synch_count=synch_count,
                   run_verify=run_verify,
                   email_list=email_list,
                   dependencies=dependencies,
                   reboot_before=reboot_before,
                   reboot_after=reboot_after,
                   parse_failed_repair=parse_failed_repair,
                   keyvals=keyvals,
                   drone_set=drone_set,
                   parameterized_job=parameterized_job,
                   parent_job_id=parent_job_id,
                   test_retry=test_retry,
                   run_reset=run_reset,
                   require_ssp=require_ssp)
    return create_new_job(owner=owner,
                          options=options,
                          host_objects=host_objects,
                          metahost_objects=metahost_objects,
                          atomic_group=atomic_group)

Simran Basi

b6ec8ae

2014-04-23 12:05:08 -0700

[diff] [blame]

997

998

999

def encode_ascii(control_file):
    """Force a control file to only contain ascii characters.

    @param control_file: Control file to encode.

    @returns the control file in an ascii encoding.

    @raises error.ControlFileMalformed: if encoding fails.
    """
    try:
        return control_file.encode('ascii')
    except UnicodeError as e:
        # UnicodeError covers both failure modes: a unicode object with
        # non-ascii characters raises UnicodeEncodeError, while a byte string
        # with non-ascii bytes raises UnicodeDecodeError (python 2 decodes it
        # implicitly before encoding).
        raise error.ControlFileMalformed(str(e))

1012

1013

1014

def get_wmatrix_url():
    """Read the wmatrix url from the global configuration.

    @returns the 'wmatrix_url' value of the AUTOTEST_WEB section; an empty
            string is passed as the default.
    """
    config = global_config.global_config
    return config.get_config_value('AUTOTEST_WEB', 'wmatrix_url', default='')

Jiaxi Luo

57bc195

2014-07-22 15:27:30 -0700

[diff] [blame]

1022

1023

1024

def inject_times_to_filter(start_time_key=None, end_time_key=None,
                           start_time_value=None, end_time_value=None,
                           **filter_data):
    """Add the start and end time key/value pairs to a filter if provided.

    A pair is only added when its value is truthy.

    @param start_time_key: A string represents the filter key of start_time.
    @param end_time_key: A string represents the filter key of end_time.
    @param start_time_value: Start_time value.
    @param end_time_value: End_time value.
    @param filter_data: The remaining filter entries, as keyword arguments.

    @returns the injected filter_data.
    """
    time_pairs = ((start_time_key, start_time_value),
                  (end_time_key, end_time_value))
    for time_key, time_value in time_pairs:
        if time_value:
            filter_data[time_key] = time_value
    return filter_data

def inject_times_to_hqe_special_tasks_filters(filter_data_common,
                                              start_time, end_time):
    """Build the hqe and special tasks filters with start and end time added.

    The hqe filter uses the keys started_on__gte / started_on__lte and the
    special tasks filter uses time_started__gte / time_started__lte.

    @param filter_data_common: Common filter for hqe and special tasks.
    @param start_time: Start time value to inject, if any.
    @param end_time: End time value to inject, if any.

    @returns a pair of hqe and special tasks filters.
    """
    special_tasks_filter = filter_data_common.copy()
    hqe_filter = inject_times_to_filter(
            'started_on__gte', 'started_on__lte', start_time, end_time,
            **filter_data_common)
    special_tasks_filter = inject_times_to_filter(
            'time_started__gte', 'time_started__lte', start_time, end_time,
            **special_tasks_filter)
    return hqe_filter, special_tasks_filter

1059

1060

1061

def retrieve_shard(shard_hostname):
    """
    Look up the shard with the given hostname in the database.

    The lookup runs inside the 'shard_heartbeat.retrieve_shard' stats timer.

    @param shard_hostname: Hostname of the shard to retrieve

    @raises models.Shard.DoesNotExist, if no shard with this hostname was
            found (as raised by models.Shard.smart_get; not verifiable from
            this function alone).

    @returns: Shard object
    """
    with autotest_stats.Timer('shard_heartbeat.retrieve_shard'):
        return models.Shard.smart_get(shard_hostname)

Jakob Juelich

2014-09-02 16:37:46 -0700

[diff] [blame]

1074

1075

Jakob Juelich

1b52574

2014-09-30 13:08:07 -0700

[diff] [blame]

1076

def find_records_for_shard(shard, known_job_ids, known_host_ids):
    """Collect the records that should be sent to a shard.

    Each of the three lookups is timed under its own 'shard_heartbeat'
    stats client.

    @param shard: Shard to find records for.
    @param known_job_ids: List of ids of jobs the shard already has.
    @param known_host_ids: List of ids of hosts the shard already has.

    @returns: Tuple of hosts, jobs, and suite job keyvals:
              (hosts, jobs, suite_job_keyvals). The keyvals are those of the
              parent jobs of the returned jobs.
    """
    heartbeat_timer = autotest_stats.Timer('shard_heartbeat')

    with heartbeat_timer.get_client('find_hosts'):
        hosts = models.Host.assign_to_shard(shard, known_host_ids)

    with heartbeat_timer.get_client('find_jobs'):
        jobs = models.Job.assign_to_shard(shard, known_job_ids)

    with heartbeat_timer.get_client('find_suite_job_keyvals'):
        parent_job_ids = []
        for job in jobs:
            parent_job_ids.append(job.parent_job_id)
        suite_job_keyvals = models.JobKeyval.objects.filter(
                job_id__in=parent_job_ids)

    return hosts, jobs, suite_job_keyvals

Jakob Juelich

2014-09-18 16:02:49 -0700

[diff] [blame]

1096

1097

1098

def _persist_records_with_type_sent_from_shard(

1099

shard, records, record_type, *args, **kwargs):

1100

"""

1101

Handle records of a specified type that were sent to the shard master.

1102

1103

@param shard: The shard the records were sent from.

1104

@param records: The records sent in their serialized format.

1105

@param record_type: Type of the objects represented by records.

1106

@param args: Additional arguments that will be passed on to the sanity

1107

checks.

1108

@param kwargs: Additional arguments that will be passed on to the sanity

1109

checks.

1110

1111

@raises error.UnallowedRecordsSentToMaster if any of the sanity checks fail.

1112

1113

@returns: List of primary keys of the processed records.

1114

"""

1115

pks = []

1116

for serialized_record in records:

1117

pk = serialized_record['id']

1118

try:

1119

current_record = record_type.objects.get(pk=pk)

1120

except record_type.DoesNotExist:

1121

raise error.UnallowedRecordsSentToMaster(

1122

'Object with pk %s of type %s does not exist on master.' % (

1123

pk, record_type))

1124

1125

current_record.sanity_check_update_from_shard(

1126

shard, serialized_record, *args, **kwargs)

1127

1128

current_record.update_from_serialized(serialized_record)

pks.append(pk)

return pks

def persist_records_sent_from_shard(shard, jobs, hqes):
    """
    Sanity check and then save serialized records a shard sent to master.

    During heartbeats shards upload jobs and hostqueueentries. The jobs are
    persisted first; the ids of the jobs sent are then handed to the
    hostqueueentry sanity checks as job_ids_sent.

    The sanity checks include:
    - Checking if the objects sent already exist on the master.
    - Checking if the objects sent were assigned to this shard.
    - hostqueueentries must be sent together with their jobs.

    @param shard: The shard the records were sent from.
    @param jobs: The jobs the shard sent.
    @param hqes: The hostqueueentries the shard sent.

    @raises error.UnallowedRecordsSentToMaster if any of the sanity checks fail.
    """
    heartbeat_timer = autotest_stats.Timer('shard_heartbeat')

    with heartbeat_timer.get_client('persist_jobs'):
        sent_job_ids = _persist_records_with_type_sent_from_shard(
                shard, jobs, models.Job)

    with heartbeat_timer.get_client('persist_hqes'):
        _persist_records_with_type_sent_from_shard(
                shard, hqes, models.HostQueueEntry, job_ids_sent=sent_job_ids)

Jakob Juelich

2014-10-01 12:43:23 -0700

[diff] [blame]

1160

1161

Jakob Juelich

2014-10-01 12:43:23 -0700

[diff] [blame]

1162

def forward_single_host_rpc_to_shard(func):
    """This decorator forwards rpc calls that modify a host to a shard.

    If a host is assigned to a shard, rpcs that change its attributes should
    be forwarded to the shard. The rpc is then also run locally.

    This assumes the decorated function takes the host id as the keyword
    argument 'id'.

    @param func: The function to decorate

    @returns: The function to replace func with.
    """
    # wraps keeps func's name and docstring on the replacement, so another
    # decorator stacked on top still forwards the rpc under its real name.
    @wraps(func)
    def replacement(**kwargs):
        # Only keyword arguments can be accepted here, as we need the argument
        # names to send the rpc. serviceHandler always provides arguments with
        # their keywords, so this is not a problem.
        host = models.Host.smart_get(kwargs['id'])
        if host.shard and not server_utils.is_shard():
            run_rpc_on_multiple_hostnames(func.__name__,
                                          [host.shard.rpc_hostname()],
                                          **kwargs)
        return func(**kwargs)

    return replacement

Prashanth Balasubramanian

5949b4a

2014-11-23 12:58:30 -0800

[diff] [blame]

1188

def forward_multi_host_rpc_to_shards(func):
    """This decorator forwards rpc calls that modify multiple hosts.

    If a host is assigned to a shard, rpcs that change its attributes should
    be forwarded to the shard. Some calls however, take a list of hosts and a
    single id to modify, eg: label_add_hosts. This wrapper will sift through
    the list of hosts, find each of their shards, and forward the rpc for
    those hosts to that shard before calling the local version of the given
    rpc.

    This assumes:
        1. The rpc call uses `smart_get` to retrieve host objects, not the
           stock django `get` call. This is true for most, if not all rpcs in
           the rpc_interface.
        2. The kwargs to the function contain either a list of host ids or
           hostnames, keyed under 'hosts'. This is true for all the rpc
           functions that use 'smart_get'.

    @param func: The function to decorate

    @returns: The function to replace func with.
    """
    # wraps keeps func's name and docstring on the replacement, so another
    # decorator stacked on top still forwards the rpc under its real name.
    @wraps(func)
    def replacement(**kwargs):
        fanout_rpc(
                models.Host.smart_get_bulk(kwargs['hosts']),
                func.__name__, **kwargs)
        return func(**kwargs)

    return replacement

MK Ryu

2015-07-01 12:21:20 -0700

[diff] [blame^]

1218

def fanout_rpc(host_objs, rpc_name, include_hostnames=True, **kwargs):

1219

"""Fanout the given rpc to shards of given hosts.

1220

1221

@param host_objs: Host objects for the rpc.

1222

@param rpc_name: The name of the rpc.

1223

@param include_hostnames: If True, include the hostnames in the kwargs.

1224

Hostnames are not always necessary, this functions is designed to

1225

send rpcs to the shard a host is on, the rpcs themselves could be

1226

related to labels, acls etc.

1227

@param kwargs: The kwargs for the rpc.

1228

"""

1229

# Figure out which hosts are on which shards.

1230

shard_host_map = bucket_hosts_by_shard(

1231

host_objs, rpc_hostnames=True)

1232

1233

# Execute the rpc against the appropriate shards.

1234

for shard, hostnames in shard_host_map.iteritems():

1235

if include_hostnames:

1236

kwargs['hosts'] = hostnames

1237

try:

1238

run_rpc_on_multiple_hostnames(rpc_name, [shard], **kwargs)

1239

except:

1240

ei = sys.exc_info()

1241

new_exc = error.RPCException('RPC %s failed on shard %s due to '

1242

'%s: %s' % (rpc_name, shard, ei[0].__name__, ei[1]))

1243

raise new_exc.__class__, new_exc, ei[2]

1244

1245

Jakob Juelich

2014-10-01 12:43:23 -0700

[diff] [blame]

1246

def run_rpc_on_multiple_hostnames(rpc_call, shard_hostnames, **kwargs):
    """Runs an rpc to multiple AFEs

    This is e.g. used to propagate changes made to hosts after they are
    assigned to a shard. The rpc is run against each hostname in turn through
    a frontend_wrappers.RetryingAFE.

    @param rpc_call: Name of the rpc endpoint to call.
    @param shard_hostnames: List of hostnames to run the rpcs on.
    @param **kwargs: Keyword arguments to pass in the rpcs.
    """
    # Make sure this function is not called on shards but only on master.
    assert not server_utils.is_shard()
    for hostname in shard_hostnames:
        frontend_wrappers.RetryingAFE(server=hostname).run(rpc_call, **kwargs)

MK Ryu

9c5fbbe

2015-02-11 15:46:22 -0800

[diff] [blame]

def get_label(name):
    """Gets a label object using a given name.

    @param name: Label name.

    @return: a label object matching the given name, or None when
             models.Label.smart_get raises models.Label.DoesNotExist.
    """
    try:
        return models.Label.smart_get(name)
    except models.Label.DoesNotExist:
        return None

def get_global_afe_hostname():
    """Read the hostname of the global AFE from the global configuration.

    @returns the 'global_afe_hostname' value of the SHARD section.
    """
    config = global_config.global_config
    return config.get_config_value('SHARD', 'global_afe_hostname')

1282

1283

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

1284

def route_rpc_to_master(func):

J. Richard Barnette

fdfcd66

2015-04-13 17:20:29 -0700

[diff] [blame]

1285

"""Route RPC to master AFE.

MK Ryu

2d10756

2015-02-24 17:45:02 -0800

[diff] [blame]

1286

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

1287

@param func: The function to decorate

J. Richard Barnette

fdfcd66

2015-04-13 17:20:29 -0700

[diff] [blame]

1288

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

1289

@returns: The function to replace func with.

MK Ryu

2d10756

2015-02-24 17:45:02 -0800

[diff] [blame]

1290

"""

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

1291

@wraps(func)

MK Ryu

f6ab8a7

2015-07-06 10:19:48 -0700

[diff] [blame]

1292

def replacement(*args, **kwargs):

1293

kwargs = inspect.getcallargs(func, *args, **kwargs)

MK Ryu

2015-06-08 14:13:16 -0700

[diff] [blame]

1294

if server_utils.is_shard():

MK Ryu

9651ca5

2015-06-08 17:48:22 -0700

[diff] [blame]

1295

afe = frontend_wrappers.RetryingAFE(

1296

server=get_global_afe_hostname())

1297

return afe.run(func.func_name, **kwargs)

MK Ryu