Ahmad Sharif | 0dcbc4b | 2012-02-02 16:37:18 -0800 | [diff] [blame] | 1 | #!/usr/bin/python |
| 2 | |
Yunlian Jiang | e5b673f | 2013-05-23 11:42:53 -0700 | [diff] [blame] | 3 | # Copyright (c) 2013 The Chromium OS Authors. All rights reserved. |
| 4 | # Use of this source code is governed by a BSD-style license that can be |
| 5 | # found in the LICENSE file. |
Ahmad Sharif | 0dcbc4b | 2012-02-02 16:37:18 -0800 | [diff] [blame] | 6 | |
| 7 | import datetime |
| 8 | import os |
Ahmad Sharif | 0dcbc4b | 2012-02-02 16:37:18 -0800 | [diff] [blame] | 9 | import threading |
| 10 | import time |
| 11 | import traceback |
Ahmad Sharif | fd356fb | 2012-05-07 12:02:16 -0700 | [diff] [blame] | 12 | |
Ahmad Sharif | 4467f00 | 2012-12-20 12:09:49 -0800 | [diff] [blame] | 13 | from utils import command_executer |
| 14 | from utils import timeline |
| 15 | |
Yunlian Jiang | 04dc5dc | 2013-04-23 15:05:05 -0700 | [diff] [blame] | 16 | from suite_runner import SuiteRunner |
Ahmad Sharif | f395c26 | 2012-10-09 17:48:09 -0700 | [diff] [blame] | 17 | from results_cache import Result |
| 18 | from results_cache import ResultsCache |
Yunlian Jiang | 04dc5dc | 2013-04-23 15:05:05 -0700 | [diff] [blame] | 19 | from results_cache import TelemetryResult |
| 20 | |
Ahmad Sharif | 0dcbc4b | 2012-02-02 16:37:18 -0800 | [diff] [blame] | 21 | |
# Status strings recorded on a BenchmarkRun's timeline, listed in the order a
# run normally moves through them.
STATUS_PENDING = 'PENDING'      # Recorded when the run object is constructed.
STATUS_WAITING = 'WAITING'      # Cache miss; about to acquire a machine.
STATUS_IMAGING = 'IMAGING'      # Recorded just before the machine is imaged.
STATUS_RUNNING = 'RUNNING'      # Recorded just before the suite is run.
STATUS_SUCCEEDED = 'SUCCEEDED'  # The result's return value was zero/falsy.
STATUS_FAILED = 'FAILED'        # Non-zero retval, exception, or termination.
| 28 | |
class BenchmarkRun(threading.Thread):
  """Thread that produces the result of one iteration of one benchmark.

  The result is read from the results cache when available; otherwise a
  machine is acquired from the machine manager, imaged with the label, the
  suite is run on it, and the fresh result is stored back into the cache.
  Progress is recorded on self.timeline using the STATUS_* strings.
  """

  def __init__(self, name, benchmark,
               label,
               iteration,
               cache_conditions,
               machine_manager,
               logger_to_use,
               share_users):
    """Initializes the run and records STATUS_PENDING on its timeline.

    Args:
      name: Name given to this thread; also used as a prefix in log messages.
      benchmark: Benchmark description; test_name, test_args, perf_args and
        suite are read from it.
      label: Label description; chromeos_image, chromeos_root and board are
        read from it.
      iteration: Iteration identifier, forwarded to the results cache.
      cache_conditions: Cache conditions, forwarded to the results cache.
      machine_manager: Object used to acquire, image, release and remove
        machines.
      logger_to_use: Logger providing LogOutput and LogError.
      share_users: Forwarded to the results cache.

    Raises:
      Exception: If benchmark.perf_args is set but does not start with
        "record" or "stat".
    """
    threading.Thread.__init__(self)
    self.name = name
    self._logger = logger_to_use
    self.benchmark = benchmark
    self.iteration = iteration
    self.label = label
    self.result = None
    self.terminated = False
    self.retval = None
    self.run_completed = False
    self.machine_manager = machine_manager
    self.suite_runner = SuiteRunner(self._logger)
    self.machine = None
    self.cache_conditions = cache_conditions
    self.runs_complete = 0
    self.cache_hit = False
    self.failure_reason = ""
    # _GetExtraAutotestArgs reads self.benchmark and self._logger, so it must
    # be called after both have been assigned above.
    self.test_args = "%s %s" % (benchmark.test_args,
                                self._GetExtraAutotestArgs())
    self._ce = command_executer.GetCommandExecuter(self._logger)
    self.timeline = timeline.Timeline()
    self.timeline.Record(STATUS_PENDING)
    self.share_users = share_users

  def ReadCache(self):
    """Creates self.cache and tries to read a cached result from it.

    Sets self.result to whatever the cache returns and self.cache_hit to
    whether that value is not None.
    """
    # Just use the first machine for running the cached version,
    # without locking it.
    self.cache = ResultsCache()
    self.cache.Init(self.label.chromeos_image,
                    self.label.chromeos_root,
                    self.benchmark.test_name,
                    self.iteration,
                    self.test_args,
                    self.machine_manager,
                    self.label.board,
                    self.cache_conditions,
                    self._logger,
                    self.label,
                    self.share_users,
                    self.benchmark.suite)

    self.result = self.cache.ReadResult()
    self.cache_hit = (self.result is not None)

  def run(self):
    """Thread body: obtains the result and records the final status.

    Any exception is logged and turned into STATUS_FAILED with the exception
    text as failure_reason. A machine that was acquired is always released,
    and is first removed from the machine manager if it is not reachable.
    """
    try:
      self.ReadCache()

      if self.result:
        self._logger.LogOutput("%s: Cache hit." % self.name)
        self._logger.LogOutput(self.result.out, print_to_console=False)
        self._logger.LogError(self.result.err, print_to_console=False)
      else:
        self._logger.LogOutput("%s: No cache hit." % self.name)
        self.timeline.Record(STATUS_WAITING)
        # Try to acquire a machine now.
        self.machine = self.AcquireMachine()
        self.result = self.RunTest(self.machine)

        self.cache.remote = self.machine.name
        self.cache.StoreResult(self.result)

      # Terminate() has already recorded the failure; do not overwrite it.
      if self.terminated:
        return

      if not self.result.retval:
        self.timeline.Record(STATUS_SUCCEEDED)
      elif self.timeline.GetLastEvent() != STATUS_FAILED:
        self.failure_reason = "Return value of test suite was non-zero."
        self.timeline.Record(STATUS_FAILED)

    except Exception as e:
      self._logger.LogError("Benchmark run: '%s' failed: %s" % (self.name, e))
      traceback.print_exc()
      # Keep the first recorded failure and its reason.
      if self.timeline.GetLastEvent() != STATUS_FAILED:
        self.timeline.Record(STATUS_FAILED)
        self.failure_reason = str(e)
    finally:
      if self.machine:
        if not self.machine.IsReachable():
          # The placeholder must be %s: a bare "% i" is parsed as an integer
          # conversion and raises TypeError for a machine name, which would
          # skip the release below.
          self._logger.LogOutput("Machine %s is not reachable, removing it."
                                 % self.machine.name)
          self.machine_manager.RemoveMachine(self.machine.name)
        self._logger.LogOutput("Releasing machine: %s" % self.machine.name)
        self.machine_manager.ReleaseMachine(self.machine)
        self._logger.LogOutput("Released machine: %s" % self.machine.name)

  def Terminate(self):
    """Marks the run as terminated and asks the suite runner to stop.

    Records STATUS_FAILED with reason "Thread terminated." unless a failure
    has already been recorded.
    """
    self.terminated = True
    self.suite_runner.Terminate()
    if self.timeline.GetLastEvent() != STATUS_FAILED:
      self.timeline.Record(STATUS_FAILED)
      self.failure_reason = "Thread terminated."

  def AcquireMachine(self):
    """Polls the machine manager until it hands out a machine.

    Returns:
      The machine object returned by machine_manager.AcquireMachine.

    Raises:
      Exception: If the run is terminated before a machine is acquired.
    """
    sleep_duration = 10
    while True:
      if self.terminated:
        raise Exception("Thread terminated while trying to acquire machine.")
      machine = self.machine_manager.AcquireMachine(self.label.chromeos_image,
                                                    self.label)
      if machine:
        self._logger.LogOutput("%s: Machine %s acquired at %s" %
                               (self.name,
                                machine.name,
                                datetime.datetime.now()))
        return machine
      # Nothing available yet; wait before asking again.
      time.sleep(sleep_duration)

  def _GetExtraAutotestArgs(self):
    """Builds the extra test arguments that enable the perf profiler.

    Returns:
      "" when benchmark.perf_args is empty; otherwise the profiler flags with
      "-a" inserted right after the perf sub-command.

    Raises:
      Exception: If perf_args does not start with "record" or "stat".
    """
    if self.benchmark.perf_args and self.benchmark.suite == "telemetry":
      self._logger.LogError("Telemetry benchmark does not support profiler.")

    if not self.benchmark.perf_args:
      return ""

    perf_args_list = self.benchmark.perf_args.split(" ")
    if perf_args_list[0] not in ("record", "stat"):
      raise Exception("perf_args must start with either record or stat")
    perf_args_list = [perf_args_list[0]] + ["-a"] + perf_args_list[1:]
    perf_args = " ".join(perf_args_list)
    extra_test_args = ["--profiler=custom_perf",
                       ("--profiler_args='perf_options=\"%s\"'" %
                        perf_args)]
    return " ".join(extra_test_args)

  def RunTest(self, machine):
    """Images the machine, runs the suite on it and builds the Result.

    Args:
      machine: Machine object previously returned by AcquireMachine.

    Returns:
      The object produced by Result.CreateFromRun for this run's output.
    """
    self.timeline.Record(STATUS_IMAGING)
    self.machine_manager.ImageMachine(machine,
                                      self.label)
    self.timeline.Record(STATUS_RUNNING)
    retval, out, err = self.suite_runner.Run(machine.name,
                                             self.label,
                                             self.benchmark,
                                             self.test_args)
    self.run_completed = True
    return Result.CreateFromRun(self._logger,
                                self.label,
                                out,
                                err,
                                retval,
                                self.benchmark.suite)

  def SetCacheConditions(self, cache_conditions):
    """Replaces the cache conditions used by subsequent ReadCache calls."""
    self.cache_conditions = cache_conditions
Ahmad Sharif | 4467f00 | 2012-12-20 12:09:49 -0800 | [diff] [blame] | 188 | |
| 189 | |
class MockBenchmarkRun(BenchmarkRun):
  """Inherited from BenchmarkRun, just override RunTest for testing."""

  def RunTest(self, machine):
    """Same as BenchmarkRun.RunTest but without Result.CreateFromRun.

    Args:
      machine: Machine object to image and run the suite on.

    Returns:
      A Result whose out, err and retval are those returned by the suite
      runner.
    """
    self.timeline.Record(STATUS_IMAGING)
    self.machine_manager.ImageMachine(machine,
                                      self.label)
    self.timeline.Record(STATUS_RUNNING)
    # Call the suite runner with the same arguments as BenchmarkRun.RunTest;
    # both classes share the SuiteRunner created in BenchmarkRun.__init__.
    retval, out, err = self.suite_runner.Run(machine.name,
                                             self.label,
                                             self.benchmark,
                                             self.test_args)
    self.run_completed = True
    # NOTE(review): Result is built here from three positional arguments,
    # while BenchmarkRun.RunTest goes through Result.CreateFromRun(logger,
    # label, ...) -- confirm this still matches Result's constructor.
    rr = Result("Results placed in /tmp/test", "", 0)
    rr.out = out
    rr.err = err
    rr.retval = retval
    return rr
| 210 | |