Autotest: Add additional logging to autotestd_monitor In order to help determine what is happening on autotestd_monitor, we have added additional logging so that we can tell where it gets stuck in the situations where the client-side test never exits. BUG=chromium-os:37608 TEST=ensured the log output is recorder and did not impact status or status.log Change-Id: I4ee96831ab458a9e4d4400e88b6cb2daf46cc10d Reviewed-on: https://gerrit.chromium.org/gerrit/41983 Reviewed-by: Simran Basi <sbasi@chromium.org> Tested-by: Simran Basi <sbasi@chromium.org> Commit-Queue: Simran Basi <sbasi@chromium.org>

commit: bca10a6fc4527d43199f4ad7f489127662fe6c29 [log] [tgz]
author: Simran Basi <sbasi@chromium.org> Thu Jan 24 15:52:35 2013 -0800
committer: ChromeBot <chrome-bot@google.com> Fri Jan 25 11:19:31 2013 -0800
tree: 1dbbdcec7a8acaa0438d3d918d55bdd7a0e89af8
parent: d35e6c4c767abb12b47fddbf6822ab757a28f619 [diff] [blame]
diff --git a/client/bin/autotestd_monitor b/client/bin/autotestd_monitor
index a3217af..a94c966 100755
--- a/client/bin/autotestd_monitor
+++ b/client/bin/autotestd_monitor

@@ -6,7 +6,10 @@
 logdir = sys.argv[1]
 stdout_start = int(sys.argv[2])  # number of bytes we can skip on stdout
 stderr_start = int(sys.argv[3])  # nubmer of bytes we can skip on stderr
+# TODO (crosbug.com/38224)- sbasi: Remove extra logging.
+stderr = open(os.path.join(logdir, 'stderr'), 'a', 0)
 
+print >> stderr, 'Entered autotestd_monitor.'
 # if any of our tail processes die, the monitor should die too
 def kill_self(signum, frame):
     os.kill(os.getpid(), signal.SIGTERM)
@@ -26,6 +29,8 @@
 stdout_pump = launch_tail('stdout', sys.stdout, stdout_start)
 stderr_pump = launch_tail('stderr', sys.stderr, stderr_start)
 
+print >> stderr, 'Finished launching tail subprocesses.'
+
 # wait for logdir/started to exist to be sure autotestd is started
 start_time = time.time()
 started_file_path = os.path.join(logdir, 'started')
@@ -34,9 +39,12 @@
     if time.time() - start_time >= 30:
         raise Exception("autotestd failed to start in %s" % logdir)
 
+print >> stderr, 'Finished waiting on autotestd to start.'
+
 # watch the exit code file for an exit
 exit_code_file = open(os.path.join(logdir, 'exit_code'))
 fcntl.flock(exit_code_file, fcntl.LOCK_EX)
+print >> stderr, 'Got lock of exit_code_file.'
 try:
     exit_code = exit_code_file.read()
     if len(exit_code) != 4:
@@ -46,9 +54,12 @@
 finally:
     fcntl.flock(exit_code_file, fcntl.LOCK_UN)
     exit_code_file.close()
+    print >> stderr, 'Released lock of exit_code_file and closed it.'
 
 # tail runs in 1s polling loop, so give them a chance to finish
 time.sleep(2)
+
+print >> stderr, 'Killing child processes.'
 # clear the SIGCHLD handler so that killing the tails doesn't kill us
 signal.signal(signal.SIGCHLD, signal.SIG_DFL)
 os.kill(stdout_pump.pid, signal.SIGTERM)
commit	bca10a6fc4527d43199f4ad7f489127662fe6c29	[log] [tgz]
author	Simran Basi <sbasi@chromium.org>	Thu Jan 24 15:52:35 2013 -0800
committer	ChromeBot <chrome-bot@google.com>	Fri Jan 25 11:19:31 2013 -0800
tree	1dbbdcec7a8acaa0438d3d918d55bdd7a0e89af8
parent	d35e6c4c767abb12b47fddbf6822ab757a28f619 [diff] [blame]