Merge pull request #1886 from dgquintas/run_tests_shuffling Improvements to the way we randomize test runs.

commit: 82c8d6de1ee065deb0330a101287e91583e35fbe [log] [tgz]
author: Craig Tiller <craig.tiller@gmail.com> Wed Jun 03 08:00:59 2015 -0700
committer: Craig Tiller <craig.tiller@gmail.com> Wed Jun 03 08:00:59 2015 -0700
tree: 86e6b60f30878fd4694a6f14f44ba588b19f8f3c
parent: 669c139a4a41eaca7bff52071510258e65274de7 [diff]
parent: 79e389f4318fa7b729d52363cd3566e477f7691e [diff]
diff --git a/tools/run_tests/jobset.py b/tools/run_tests/jobset.py
index 51d61db..985b7a7 100755
--- a/tools/run_tests/jobset.py
+++ b/tools/run_tests/jobset.py

@@ -33,7 +33,6 @@
 import multiprocessing
 import os
 import platform
-import random
 import signal
 import subprocess
 import sys
@@ -59,40 +58,6 @@
   signal.signal(signal.SIGALRM, alarm_handler)
 
 
-def shuffle_iteratable(it):
-  """Return an iterable that randomly walks it"""
-  # take a random sampling from the passed in iterable
-  # we take an element with probability 1/p and rapidly increase
-  # p as we take elements - this gives us a somewhat random set of values before
-  # we've seen all the values, but starts producing values without having to
-  # compute ALL of them at once, allowing tests to start a little earlier
-  LARGE_THRESHOLD = 1000
-  nextit = []
-  p = 1
-  for val in it:
-    if random.randint(0, p) == 0:
-      p = min(p*2, 100)
-      yield val
-    else:
-      nextit.append(val)
-      # if the input iterates over a large number of values (potentially
-      # infinite, we'd be in the loop for a while (again, potentially forever).
-      # We need to reset "nextit" every so often to, in the case of an infinite
-      # iterator, avoid growing "nextit" without ever freeing it.
-      if len(nextit) > LARGE_THRESHOLD:
-        random.shuffle(nextit)
-        for val in nextit:
-          yield val
-        nextit = []
-        p = 1
-
-  # after taking a random sampling, we shuffle the rest of the elements and
-  # yield them
-  random.shuffle(nextit)
-  for val in nextit:
-    yield val
-
-
 _SUCCESS = object()
 _FAILURE = object()
 _RUNNING = object()
@@ -358,11 +323,6 @@
               maxjobs if maxjobs is not None else _DEFAULT_MAX_JOBS,
               newline_on_success, travis, stop_on_failure,
               cache if cache is not None else NoCache())
-  # We can't sort an infinite sequence of runs.
-  if not travis or infinite_runs:
-    cmdlines = shuffle_iteratable(cmdlines)
-  else:
-    cmdlines = sorted(cmdlines, key=lambda x: x.shortname)
   for cmdline in cmdlines:
     if not js.start(cmdline):
       break

diff --git a/tools/run_tests/run_tests.py b/tools/run_tests/run_tests.py
index c00d794..3240567 100755
--- a/tools/run_tests/run_tests.py
+++ b/tools/run_tests/run_tests.py

@@ -36,16 +36,16 @@
 import json
 import multiprocessing
 import os
+import platform
+import random
 import re
+import subprocess
 import sys
 import time
-import platform
-import subprocess
 
 import jobset
 import watch_dirs
 
-
 ROOT = os.path.abspath(os.path.join(os.path.dirname(sys.argv[0]), '../..'))
 os.chdir(ROOT)
 
@@ -488,13 +488,21 @@
     return 1
 
   # start antagonists
-  antagonists = [subprocess.Popen(['tools/run_tests/antagonist.py']) 
+  antagonists = [subprocess.Popen(['tools/run_tests/antagonist.py'])
                  for _ in range(0, args.antagonists)]
   try:
     infinite_runs = runs_per_test == 0
-    # run all the tests
-    runs_sequence = (itertools.repeat(one_run) if infinite_runs
-                     else itertools.repeat(one_run, runs_per_test))
+    # When running on travis, we want our test runs to be as similar as possible
+    # for reproducibility purposes.
+    if travis:
+      massaged_one_run = sorted(one_run, key=lambda x: x.shortname)
+    else:
+      # whereas otherwise, we want to shuffle things up to give all tests a
+      # chance to run.
+      massaged_one_run = list(one_run)  # random.shuffle needs an indexable seq.
+      random.shuffle(massaged_one_run)  # which it modifies in-place.
+    runs_sequence = (itertools.repeat(massaged_one_run) if infinite_runs
+                     else itertools.repeat(massaged_one_run, runs_per_test))
     all_runs = itertools.chain.from_iterable(runs_sequence)
     if not jobset.run(all_runs, check_cancelled,
                       newline_on_success=newline_on_success, travis=travis,
commit	82c8d6de1ee065deb0330a101287e91583e35fbe	[log] [tgz]
author	Craig Tiller <craig.tiller@gmail.com>	Wed Jun 03 08:00:59 2015 -0700
committer	Craig Tiller <craig.tiller@gmail.com>	Wed Jun 03 08:00:59 2015 -0700
tree	86e6b60f30878fd4694a6f14f44ba588b19f8f3c
parent	669c139a4a41eaca7bff52071510258e65274de7 [diff]
parent	79e389f4318fa7b729d52363cd3566e477f7691e [diff]