Nicolas Noble | ddef246 | 2015-01-06 18:08:25 -0800 | [diff] [blame] | 1 | """Run a group of subprocesses and then finish.""" |
| 2 | |
| 3 | import multiprocessing |
| 4 | import random |
| 5 | import subprocess |
| 6 | import sys |
ctiller | 3040cb7 | 2015-01-07 12:13:17 -0800 | [diff] [blame] | 7 | import tempfile |
| 8 | import time |
Nicolas Noble | ddef246 | 2015-01-06 18:08:25 -0800 | [diff] [blame] | 9 | |
ctiller | 3040cb7 | 2015-01-07 12:13:17 -0800 | [diff] [blame] | 10 | |
# Default cap on concurrently running jobs, used by run() when the caller does
# not pass maxjobs: sixteen jobs per CPU reported by multiprocessing.
_DEFAULT_MAX_JOBS = multiprocessing.cpu_count() * 16
Nicolas Noble | ddef246 | 2015-01-06 18:08:25 -0800 | [diff] [blame] | 12 | |
| 13 | |
def shuffle_iteratable(it):
    """Yield every element of `it` exactly once, in a randomised order.

    The input is consumed lazily.  While walking it, an element is emitted
    straight away with a chance of 1 in (limit + 1), where `limit` starts at 1
    and doubles (capped at 100) each time an element is emitted.  This gives a
    somewhat random stream of early values without having to compute ALL of the
    input up front, so consumers (tests) can start a little earlier.  Every
    element that was not emitted on the first pass is held back, shuffled, and
    yielded once the input is exhausted.
    """
    held_back = []
    limit = 1
    for item in it:
        # randint is inclusive on both ends, so 0 comes up 1 time in limit + 1.
        if random.randint(0, limit) != 0:
            held_back.append(item)
            continue
        # Each early pick makes the next one less likely.
        limit = min(limit * 2, 100)
        yield item
    # Everything skipped above is emitted last, in shuffled order.
    random.shuffle(held_back)
    for item in held_back:
        yield item
| 34 | |
| 35 | |
# Sentinels describing the lifecycle state of a Job.  Each is a distinct,
# featureless object, so they are compared by identity.
_SUCCESS = object()
_FAILURE = object()
_RUNNING = object()
_KILLED = object()


class Job(object):
    """Manages one job.

    A job is a single command run as a subprocess.  Its stdout and stderr are
    captured together in an anonymous temporary file; the captured output is
    only printed if the command exits with a non-zero status.  Progress lines
    (START / PASSED / FAILED) are written to sys.stdout.
    """

    def __init__(self, cmdline):
        """Launch `cmdline` (a sequence of argument strings) immediately.

        Raises whatever subprocess.Popen raises if the command cannot be
        started; the capture file is closed first so it does not leak.
        """
        self._cmdline = ' '.join(cmdline)
        self._tempfile = tempfile.TemporaryFile()
        try:
            self._process = subprocess.Popen(args=cmdline,
                                             stderr=subprocess.STDOUT,
                                             stdout=self._tempfile)
        except Exception:
            self._tempfile.close()
            raise
        self._state = _RUNNING
        # The leading escape sequences reposition to the start of the terminal
        # line and erase it, so successive status messages overwrite each other.
        sys.stdout.write('\x1b[0G\x1b[2K\x1b[33mSTART\x1b[0m: %s' %
                         self._cmdline)
        sys.stdout.flush()

    def state(self):
        """Poll current state of the job. Prints messages at completion.

        Returns one of the module-level sentinels _RUNNING, _SUCCESS, _FAILURE
        or _KILLED.  The completion message is printed only once, on the call
        that first observes the process has exited.
        """
        if self._state is _RUNNING and self._process.poll() is not None:
            if self._process.returncode != 0:
                self._state = _FAILURE
                self._tempfile.seek(0)
                output = self._tempfile.read()
                # The capture file is binary.  Where bytes and str differ
                # (Python 3), decode so the log shows the text rather than a
                # b'...' repr; where they are the same type this is a no-op.
                if not isinstance(output, str):
                    output = output.decode('utf-8', 'replace')
                sys.stdout.write('\x1b[0G\x1b[2K\x1b[31mFAILED\x1b[0m: %s'
                                 ' [ret=%d]\n'
                                 '%s\n' % (
                                     self._cmdline, self._process.returncode,
                                     output))
            else:
                self._state = _SUCCESS
                sys.stdout.write('\x1b[0G\x1b[2K\x1b[32mPASSED\x1b[0m: %s' %
                                 self._cmdline)
            sys.stdout.flush()
            # The output is no longer needed; release the descriptor now
            # instead of waiting for garbage collection.
            self._tempfile.close()
        return self._state

    def kill(self):
        """Terminate the job if it is still running; otherwise do nothing."""
        if self._state is _RUNNING:
            self._state = _KILLED
            self._process.terminate()
            # Output of a killed job is never reported, so drop our handle.
            # The child keeps its own copy of the descriptor.
            self._tempfile.close()
| 79 | |
| 80 | |
class Jobset(object):
    """Manages one run of jobs.

    Keeps at most `maxjobs` Job objects running at a time, counts the ones
    that fail, and kills whatever is still running once the caller-supplied
    `check_cancelled` callable reports cancellation.
    """

    def __init__(self, check_cancelled, maxjobs):
        """Create an empty job set.

        Args:
          check_cancelled: zero-argument callable; a true result means the run
            has been cancelled.
          maxjobs: maximum number of jobs allowed to run concurrently.

        Raises:
          ValueError: if maxjobs is less than 1 (start() could never make
            progress with such a limit).
        """
        if maxjobs < 1:
            raise ValueError('maxjobs must be at least 1, got %r' % (maxjobs,))
        self._running = set()
        self._check_cancelled = check_cancelled
        self._cancelled = False
        self._failures = 0
        self._maxjobs = maxjobs

    def start(self, cmdline):
        """Start a job. Return True on success, False on failure.

        Waits for a free slot while the set is at capacity.  Returns False,
        without starting anything, if the run has been cancelled.
        """
        while len(self._running) >= self._maxjobs:
            if self.cancelled():
                return False
            self.reap()
        if self.cancelled():
            return False
        self._running.add(Job(cmdline))
        return True

    def reap(self):
        """Collect the dead jobs.

        Makes a single pass over the running jobs, dropping every one that is
        no longer running and counting the failures.  If nothing had finished
        and jobs are still running, sleeps briefly before returning so that
        callers looping on reap() do not spin the CPU, while still getting
        control back often enough to poll for cancellation.
        """
        dead = set()
        for job in self._running:
            st = job.state()
            if st is _RUNNING:
                continue
            if st is _FAILURE:
                self._failures += 1
            dead.add(job)
        self._running -= dead
        if self._running and not dead:
            time.sleep(0.1)

    def cancelled(self):
        """Poll for cancellation.

        The first time cancellation is observed, every running job is killed.
        After that the result is remembered and the callback is not consulted
        again.
        """
        if self._cancelled:
            return True
        if not self._check_cancelled():
            return False
        for job in self._running:
            job.kill()
        self._cancelled = True
        return True

    def finish(self):
        """Wait until no jobs are running.

        Returns True only if the run was not cancelled and no job failed.
        """
        while self._running:
            self.cancelled()  # poll so running jobs get killed on cancellation
            self.reap()
        return not self.cancelled() and self._failures == 0
Nicolas Noble | ddef246 | 2015-01-06 18:08:25 -0800 | [diff] [blame] | 128 | |
| 129 | |
def _never_cancelled():
    """Cancellation predicate that always answers "not cancelled"."""
    return False
| 132 | |
| 133 | |
def run(cmdlines, check_cancelled=_never_cancelled, maxjobs=None):
    """Run every command in `cmdlines` and wait for all of them to finish.

    Commands are started in the order produced by shuffle_iteratable().

    Args:
      cmdlines: iterable of command lines, each passed to Jobset.start().
      check_cancelled: zero-argument callable polled for cancellation.
      maxjobs: concurrency limit; None selects _DEFAULT_MAX_JOBS.

    Returns:
      The result of Jobset.finish().
    """
    if maxjobs is None:
        maxjobs = _DEFAULT_MAX_JOBS
    jobset = Jobset(check_cancelled, maxjobs)
    for cmdline in shuffle_iteratable(cmdlines):
        started = jobset.start(cmdline)
        if not started:
            # start() refuses new work once the run is cancelled.
            break
    return jobset.finish()