Convert the parser into an embeddable library. This includes a major
re-organization of the existing code.

Signed-off-by: John Admanski <jadmanski@google.com>



git-svn-id: http://test.kernel.org/svn/autotest/trunk@1447 592f7852-d20e-0410-864c-8624ca9c26a4
diff --git a/tko/db.py b/tko/db.py
index 14e7c1b..7d2345b 100644
--- a/tko/db.py
+++ b/tko/db.py
@@ -1,5 +1,8 @@
-import re, os, sys, types
-from common import global_config
+import re, os, sys, types, time
+
+import common
+from autotest_lib.client.common_lib import global_config
+
 
 class MySQLTooManyRows(Exception):
 	pass
@@ -10,26 +13,28 @@
 				database = None, user = None, password = None):
 		self.debug = debug
 		self.autocommit = autocommit
-		
-		path = os.path.dirname(__file__)
-		
+
+		self.host = host
+		self.database = database
+		self.user = user
+		self.password = password
+
 		# grab the global config
 		c = global_config.global_config
-		
+
 		# grab the host, database
-		if not host:
-			host = c.get_config_value("TKO", "host")
-		if not database:
-			database = c.get_config_value("TKO", "database")
-		
+		if not self.host:
+			self.host = c.get_config_value("TKO", "host")
+		if not self.database:
+			self.database = c.get_config_value("TKO", "database")
+
 		# grab the user and password
-		if not user:
-			user = c.get_config_value("TKO", "user")
-		if not password:
-			password = c.get_config_value("TKO", "password")
-			
-		self.con = self.connect(host, database, user, password)
-		self.cur = self.con.cursor()
+		if not self.user:
+			self.user = c.get_config_value("TKO", "user")
+		if not self.password:
+			self.password = c.get_config_value("TKO", "password")
+
+		self._init_db()
 
 		# if not present, insert statuses
 		self.status_idx = {}
@@ -39,8 +44,8 @@
 			self.status_idx[s[1]] = s[0]
 			self.status_word[s[0]] = s[1]
 
-		dir = os.path.dirname(__file__)
-		machine_map = os.path.join(dir, 'machines')
+		machine_map = os.path.join(os.path.dirname(__file__),
+					   'machines')
 		if os.path.exists(machine_map):
 			self.machine_map = machine_map
 		else:
@@ -48,6 +53,41 @@
 		self.machine_group = {}
 
 
+	def _init_db(self):
+		# create the db connection and cursor
+		self.con = self.connect(self.host, self.database,
+					self.user, self.password)
+		self.cur = self.con.cursor()
+
+
+	def _run_with_retry(self, function, *args, **dargs):
+		"""Call function(*args, **dargs) until either it passes
+		without an operational error, or a timeout is reached. This
+		is intended for internal use with database functions, not
+		for generic use."""
+		OperationalError = _get_error_class("OperationalError")
+		# TODO: make this configurable
+		TIMEOUT = 3600 # one hour
+		success = False
+		start_time = time.time()
+		while not success:
+			try:
+				result = function(*args, **dargs)
+			except OperationalError:
+				stop_time = time.time()
+				elapsed_time = stop_time - start_time
+				if elapsed_time > TIMEOUT:
+					raise
+				else:
+					try:
+						self._init_db()
+					except OperationalError:
+						pass
+			else:
+				success = True
+		return result
+
+
 	def dprint(self, value):
 		if self.debug:
 			sys.stdout.write('SQL: ' + str(value) + '\n')
@@ -103,20 +143,26 @@
 
 		# TODO: this assumes there's a where clause...bad
 		if wherein and isinstance(wherein, types.DictionaryType):
-			keys_in = []
-			for field_in in wherein.keys():
-				keys_in += [field_in + ' in (' + ','.join(wherein[field_in])+') '] 
-			
+			keys_in = ["%s in (%s) " % (field, ','.join(where))
+				   for field, where in wherein.iteritems()]
 			cmd.append(' and '+' and '.join(keys_in))
+
 		if group_by:
 			cmd.append(' GROUP BY ' + group_by)
 
 		self.dprint('%s %s' % (' '.join(cmd), values))
-		numRec = self.cur.execute(' '.join(cmd), values)
-		if max_rows != None and numRec > max_rows:
-			msg = 'Exceeded allowed number of records'
-			raise MySQLTooManyRows(msg)
-		return self.cur.fetchall()
+
+		# create a re-runable function for executing the query
+		def exec_sql():
+			sql = ' '.join(cmd)
+			numRec = self.cur.execute(sql, values)
+			if max_rows != None and numRec > max_rows:
+				msg = 'Exceeded allowed number of records'
+				raise MySQLTooManyRows(msg)
+			return self.cur.fetchall()
+
+		# run the query, re-trying after operational errors
+		return self._run_with_retry(exec_sql)
 
 
 	def select_sql(self, fields, table, sql, values):
@@ -125,8 +171,28 @@
 		"""
 		cmd = 'select %s from %s %s' % (fields, table, sql)
 		self.dprint(cmd)
-		self.cur.execute(cmd, values)
-		return self.cur.fetchall()
+
+		# create a re-runable function for executing the query
+		def exec_sql():
+			self.cur.execute(cmd, values)
+			return self.cur.fetchall()
+
+		# run the query, re-trying after operational errors
+		return self._run_with_retry(exec_sql)
+
+
+	def _exec_sql_with_commit(self, sql, values, commit):
+		if self.autocommit:
+			# re-run the query until it succeeds
+			def exec_sql():
+				self.cur.execute(sql, values)
+				self.con.commit()
+			self._run_with_retry(exec_sql)
+		else:
+			# take one shot at running the query
+			self.cur.execute(sql, values)
+			if commit:
+				self.con.commit()
 
 
 	def insert(self, table, data, commit = None):
@@ -136,18 +202,14 @@
 			data:
 				dictionary of fields and data
 		"""
-		if commit == None:
-			commit = self.autocommit
 		fields = data.keys()
 		refs = ['%s' for field in fields]
 		values = [data[field] for field in fields]
 		cmd = 'insert into %s (%s) values (%s)' % \
 				(table, ','.join(fields), ','.join(refs))
+		self.dprint('%s %s' % (cmd, values))
 
-		self.dprint('%s %s' % (cmd,values))
-		self.cur.execute(cmd, values)
-		if commit:
-			self.con.commit()
+		self._exec_sql_with_commit(cmd, values, commit)
 
 
 	def delete(self, table, where, commit = None):
@@ -158,11 +220,11 @@
 			keys = [field + '=%s' for field in where.keys()]
 			values = [where[field] for field in where.keys()]
 			cmd += ['where', ' and '.join(keys)]
-		self.dprint('%s %s' % (' '.join(cmd),values))
-		self.cur.execute(' '.join(cmd), values)
-		if commit:
-			self.con.commit()
-		
+		sql = ' '.join(cmd)
+		self.dprint('%s %s' % (sql, values))
+
+		self._exec_sql_with_commit(sql, values, commit)
+
 
 	def update(self, table, data, where, commit = None):
 		"""\
@@ -183,10 +245,10 @@
 		where_values = [where[field] for field in where.keys()]
 		cmd += ' where ' + ' and '.join(where_keys)
 
-		print '%s %s' % (cmd, data_values + where_values)
-		self.cur.execute(cmd, data_values + where_values)
-		if commit:
-			self.con.commit()
+		values = data_values + where_values
+		print '%s %s' % (cmd, values)
+
+		self._exec_sql_with_commit(cmd, values, commit)
 
 
 	def delete_job(self, tag, commit = None):
@@ -237,8 +299,10 @@
 				self.insert('iteration_result',
                                             data,
                                             commit=commit)
-		data = {'test_idx':test_idx, 'attribute':'version', 'value':test.version}
-		self.insert('test_attributes', data, commit=commit)
+
+		for key, value in test.attributes.iteritems():
+			data = {'test_idx': test_idx, 'attribute': key, 'value': value}
+			self.insert('test_attributes', data, commit=commit)
 
 
 	def read_machine_map(self):
@@ -354,16 +418,26 @@
 			return None
 
 
-# Use a class method as a class factory, generating a relevant database object.
-def db(*args, **dargs):
-	path = os.path.dirname(__file__)
-	db_type = None
-	
-	# read db_type from global config
-	c = global_config.global_config
-	db_type = c.get_config_value("TKO", "db_type", default="mysql")
-	db_type = 'db_' + db_type
-	exec ('import %s; db = %s.%s(*args, **dargs)'
-	      % (db_type, db_type, db_type))
+def _get_db_type():
+	"""Get the database type name to use from the global config."""
+	get_value = global_config.global_config.get_config_value
+	return "db_" + get_value("TKO", "db_type", default="mysql")
 
+
+def _get_error_class(class_name):
+	"""Retrieves the appropriate error class by name from the database
+	module."""
+	db_module = __import__("autotest_lib.tko." + _get_db_type(),
+			       globals(), locals(), ["driver"])
+	return getattr(db_module.driver, class_name)
+
+
+def db(*args, **dargs):
+	"""Creates an instance of the database class with the arguments
+	provided in args and dargs, using the database type specified by
+	the global configuration (defaulting to mysql)."""
+	db_type = _get_db_type()
+	db_module = __import__("autotest_lib.tko." + db_type, globals(),
+			       locals(), [db_type])
+	db = getattr(db_module, db_type)(*args, **dargs)
 	return db
diff --git a/tko/db_mysql.py b/tko/db_mysql.py
index 37c216b..da59ecd 100644
--- a/tko/db_mysql.py
+++ b/tko/db_mysql.py
@@ -1,7 +1,7 @@
-import MySQLdb
+import MySQLdb as driver
 import db
 
 class db_mysql(db.db_sql):
 	def connect(self, host, database, user, password):
-		return MySQLdb.connect(host=host, user=user,
-			passwd=password, db=database)
+		return driver.connect(host=host, user=user,
+				      passwd=password, db=database)
diff --git a/tko/db_postgres.py b/tko/db_postgres.py
index 816d358..166ee02 100644
--- a/tko/db_postgres.py
+++ b/tko/db_postgres.py
@@ -1,7 +1,7 @@
-import psycopg2.psycopg1 as postgres
+import psycopg2.psycopg1 as driver
 import db
 
 class db_postgres(db.db_sql):
 	def connect(self, host, database, user, password):
-		return postgres.connect("dbname=%s user=%s password=%s" % \
-				(database, user, password))
+		return driver.connect("dbname=%s user=%s password=%s" % \
+				      (database, user, password))
diff --git a/tko/parse b/tko/parse
index a8741bf..8379db3 100755
--- a/tko/parse
+++ b/tko/parse
@@ -1,164 +1,9 @@
 #!/usr/bin/python -u
-import os, re, parse, frontend, db, sys, socket, fcntl
-from optparse import OptionParser
-from traceback import format_exception
 
-def format_error():
-	t, o, tb = sys.exc_info()
-	trace = format_exception(t, o, tb)
-	# Clear the backtrace to prevent a circular reference
-	# in the heap -- as per tutorial
-	tb = ''
+import os, sys
 
-	return ''.join(trace)
+# this is a stub that just execs into parse.py
+mypath = os.path.dirname(os.path.abspath(__file__))
+parse_py = os.path.join(mypath, "parse.py")
 
-parser = OptionParser()
-parser.add_option('-m', help='Send mail for FAILED tests', dest='mailit',
-							action='store_true')
-parser.add_option('-r', help='Reparse the results of a job', dest='reparse',
-							action='store_true')
-parser.add_option('-o', help='one: parse a single results directory',
-					dest='singledir', action='store_true')
-parser.add_option('-l', help='levels of subdirectories to include in job name',
-					type='int', dest='level', default=1)
-parser.add_option('-n', help='no blocking on an existing parse',
-		  dest='noblock', action='store_true')
-parser.add_option('-s', help='Database server hostname',
-					dest='db_host', action='store')
-parser.add_option('-u', help='Database username',
-					dest='db_user', action='store')
-parser.add_option('-p', help='Database password',
-					dest='db_pass', action='store')
-parser.add_option('-d', help='Database name',
-					dest='db_name', action='store')
-(options, args) = parser.parse_args()
-
-if len(args) == 0:
-	print "ERROR: You need to at least provide a directory to parse\n"
-	parser.print_help()
-	sys.exit(1)
-
-dir = os.path.abspath(args[0])
-assert os.path.exists(dir)
-
-if options.singledir:
-	jobs_list = [dir]
-else:
-	jobs_list = [os.path.join(dir, subdir) for subdir in os.listdir(dir)]
-
-debug = True
-
-failcc = ""
-# The user to notify on job failures - TOOD, pull into the config file
-notify_user = None
-# do commits transactionally
-db = db.db(autocommit=False, host=options.db_host,
-           user=options.db_user, password=options.db_pass,
-           database=options.db_name)
-
-
-def mailfailure(jobname, job, mesgtxt):
-	# XXX: Need to insert URL here too (frontend.test.url?)
-	link = "http://" + socket.gethostname() + "/results/" + jobname
-
-	# This looks pretty good on fixed-width-font email reader.
-	message_header = "\n%s\n%s\n\n%-12s %-20s %-12s %-10s %s\n" % \
-				("The following tests FAILED for this job:",
-				link, "Job name", "Kernel", "Test name",
-				"FAIL/WARN", "Failure Reason")
-	message_header += "%-12s %-20s %-12s %-10s %s\n" % \
-					("========", "======", "=========",
-					 "=========", "==============")
-
-	subject = "AUTOTEST: FAILED tests from " + " job " + jobname
-	parse.mail(notify_user, job.user, failcc, subject,
-						message_header + mesgtxt)
-
-
-def dprint(string):
-	if debug:
-		print string
-
-
-def do_parse(jobname, path):
-	"""
-	Parse a single job. Optionally send email on failure, etc.
-	"""
-	dprint('\nScanning %s (%s)' % (jobname, path))
-	if options.reparse and db.find_job(jobname):
-		dprint('! Deleting old copy of job results, to reparse it')
-		db.delete_job(jobname)
-	if db.find_job(jobname):		# Job has already been parsed
-		dprint('! Already processed')
-		return
-	job = parse.job(path)
-	if not job:
-		dprint('! Failed to parse job (no status file?)')
-		return
-	if not job.kernel:
-		dprint('! Failed to find kernel for job')
-		return
-	print '+ Parsing ' + path
-	print '* jobname, kernel version: %s %s' % (jobname, job.kernel.base)
-	mesgtxt = "\n"
-	for test in job.tests:
-		if not test.subdir:
-			continue
-		print "* testname, status, reason: %s %s %s" % \
-					(test.subdir, test.status, test.reason)
-		if re.match(r'(FAIL|WARN)',test.status):
-			mesgtxt += "%-12s %-20s %-12s %-10s %s" % \
-					(jobname, job.kernel.base, test.subdir,
-					 test.status, test.reason)
-
-	if len(mesgtxt) > 2 and options.mailit:
-		print "Sending email report of FAILURES on %s to %s" % \
-							(jobname, job.user)
-		mailfailure(jobname, job, mesgtxt)
-	db.insert_job(jobname, job)
-	print "COMMITING"
-	db.commit()
-
-
-def parse_path(path):
-	job_elements = path.split('/')[-options.level:]
-					# last 'level' elements of path
-	jobname = '/'.join(job_elements)
-	machine_list = os.path.join(path, '.machines')
-	if os.path.exists(machine_list):
-		# This is a multi-machine job
-		for m in open(machine_list):
-			machine = m.rstrip()
-			if not machine:
-				continue
-			jobpath = os.path.join(path, machine)
-			jobname = os.path.join(os.path.basename(path), machine)
-			try:
-				do_parse(jobname, jobpath)
-			except:
-				print format_error()
-				continue
-	else:
-		# This is a single-machine job
-		try:
-			do_parse(jobname, path)
-		except:
-			print format_error()
-
-
-for path in jobs_list:
-	lockfile = open(os.path.join(path, ".parse.lock"), "w")
-	try:
-		flags = fcntl.LOCK_EX
-		if options.noblock:
-			flags |= fcntl.LOCK_NB
-		fcntl.flock(lockfile, flags)
-	except IOError:
-		# only happens when non-blocking if the lock is already held
-		lockfile.close()
-		continue   # a parse is already running here, skip it
-	try:
-		parse_path(path)
-	finally:
-		fcntl.flock(lockfile, fcntl.LOCK_UN)
-		lockfile.close()
+os.execv(parse_py, [parse_py] + sys.argv[1:])
diff --git a/tko/parse.py b/tko/parse.py
index ec5f1e4..f18b076 100755
--- a/tko/parse.py
+++ b/tko/parse.py
@@ -1,416 +1,188 @@
-#!/usr/bin/python
-import os, re, md5, sys, email.Message, smtplib, datetime
+#!/usr/bin/python -u
 
-client_bin = os.path.join(os.path.dirname(__file__), '../client/bin')
-sys.path.insert(0, os.path.abspath(client_bin))
-from autotest_utils import read_keyval
+import os, sys, optparse, fcntl, errno, socket, traceback
 
-user = re.compile(r'user(\s*)=')
-label = re.compile(r'label(\s*)=')
-
-debug = True
-
-# XXX: these mail bits came almost verbatim from mirror/mirror and this should
-# probably be refactored into another file and used by both.
-def mail(from_address, to_addresses, cc_addresses, subject, message_text):
-	# if passed a string for the to_addresses convert it to a tuple
-	if type(to_addresses) is str:
-		to_addresses = (to_addresses,)
-
-	message = email.Message.Message()
-	message["To"] = ", ".join(to_addresses)
-	message["Cc"] = ", ".join(cc_addresses)
-	message["From"] = from_address
-	message["Subject"] = subject
-	message.set_payload(message_text)
-
-	try:
-		sendmail(message.as_string())
-	except SendmailException, e:
-		server = smtplib.SMTP("localhost")
-		server.sendmail(from_address, to_addresses, cc_addresses, message.as_string())
-		server.quit()
+import common
+from autotest_lib.client.common_lib import mail as common_mail
+from autotest_lib.tko import db as tko_db, utils, status_lib
 
 
-MAIL = "sendmail"
+def parse_args():
+	# build up our options parser and parse sys.argv
+	parser = optparse.OptionParser()
+	parser.add_option("-m", help="Send mail for FAILED tests",
+			  dest="mailit", action="store_true")
+	parser.add_option("-r", help="Reparse the results of a job",
+			  dest="reparse", action="store_true")
+	parser.add_option("-o", help="Parse a single results directory",
+			  dest="singledir", action="store_true")
+	parser.add_option("-l", help=("Levels of subdirectories to include "
+				      "in the job name"),
+			  type="int", dest="level", default=1)
+	parser.add_option("-n", help="No blocking on an existing parse",
+			  dest="noblock", action="store_true")
+	parser.add_option("-s", help="Database server hostname",
+			  dest="db_host", action="store")
+	parser.add_option("-u", help="Database username", dest="db_user",
+			  action="store")
+	parser.add_option("-p", help="Database password", dest="db_pass",
+			  action="store")
+	parser.add_option("-d", help="Database name", dest="db_name",
+			  action="store")
+	options, args = parser.parse_args()
 
-class SendmailException(Exception):
-	pass
+	# we need a results directory
+	if len(args) == 0:
+		utils.dprint("ERROR: at least one results directory must "
+			     "be provided")
+		parser.print_help()
+		sys.exit(1)
 
-def sendmail(message):
-	"""Send an email using sendmail"""
-	# open a pipe to the mail program and
-	# write the data to the pipe
-	p = os.popen("%s -t" % MAIL, 'w')
-	p.write(message)
-	exitcode = p.close()
-	if exitcode:
-		raise SendmailException("Exit code: %s" % exitcode)
-
-# XXX: End of code from mirror/mirror
+	# pass the options back
+	return options, args
 
 
-def shorten_patch(long):
-	short = os.path.basename(long)
-	short = re.sub(r'^patch-', '', short)
-	short = re.sub(r'\.(bz2|gz)$', '', short)
-	short = re.sub(r'\.patch$', '', short)
-	short = re.sub(r'\+', '_', short)
-	return short
+def format_failure_message(jobname, kernel, testname, status, reason):
+	format_string = "%-12s %-20s %-12s %-10s %s"
+	return format_string % (jobname, kernel, testname, status, reason)
 
 
-def dprint(info):
-	if debug:
-		sys.stderr.write(str(info) + '\n')
+def mailfailure(jobname, job, message):
+	message_lines = [""]
+	message_lines.append("The following tests FAILED for this job")
+	message_lines.append("http://%s/results/%s" %
+			     (socket.gethostname(), jobname))
+	message_lines.append("")
+	message_lines.append(format_failure_message("Job name", "Kernel",
+						    "Test name", "FAIL/WARN",
+						    "Failure reason"))
+	message_lines.append(format_failure_message("=" * 8, "=" * 6, "=" * 8,
+						    "=" * 8, "=" * 14))
+	message_header = "\n".join(message_lines)
+
+	subject = "AUTOTEST: FAILED tests from job %s" % jobname
+	common_mail.send("", job.user, "", subject, message_header + message)
 
 
-def get_timestamp(mapping, field):
-	val = mapping.get(field, None)
-	if val is not None:
-		val = datetime.datetime.fromtimestamp(int(val))
-	return val
+def parse_one(db, jobname, path, reparse, mail_on_failure):
+	"""
+	Parse a single job. Optionally send email on failure.
+	"""
+	utils.dprint("\nScanning %s (%s)" % (jobname, path))
+	if reparse and db.find_job(jobname):
+		utils.dprint("! Deleting old copy of job results to "
+				 "reparse it")
+		db.delete_job(jobname)
+	if db.find_job(jobname):
+		utils.dprint("! Job is already parsed, done")
+		return
+
+	# parse out the job
+	parser = status_lib.parser(0)
+	job = parser.make_job(path)
+	status_log = os.path.join(path, "status.log")
+	if not os.path.exists(status_log):
+		status_log = os.path.join(path, "status")
+	if not os.path.exists(status_log):
+		utils.dprint("! Unable to parse job, no status file")
+		return
+
+	# parse the status logs
+	utils.dprint("+ Parsing dir=%s, jobname=%s" % (path, jobname))
+	status_lines = open(status_log).readlines()
+	parser.start(job)
+	tests = parser.end(status_lines)
+	job.tests = tests
+
+	# check for failures
+	message_lines = [""]
+	for test in job.tests:
+		if not test.subdir:
+			continue
+		utils.dprint("* testname, status, reason: %s %s %s"
+			     % (test.subdir, test.status, test.reason))
+		if test.status in ("FAIL", "WARN"):
+			message_lines.append(format_failure_message(
+			    jobname, test.kernel.base, test.subdir,
+			    test.status, test.reason))
+	message = "\n".join(message_lines)
+
+	# send out a email report of failure
+	if len(message) > 2 and mail_on_failure:
+		utils.dprint("Sending email report of failure on %s to %s"
+			     % (jobname, job.user))
+		mailfailure(jobname, job, message)
+
+	# write the job into the database
+	db.insert_job(jobname, job)
+	db.commit()
 
 
-class status_stack:
-	def __init__(self, job):
-		self.job = job
-		self.status_stack = [self.job.statuses[-1]]
-
-
-	def current_status(self):
-		return self.status_stack[-1]
-
-
-	def update(self, new_status):
-		if new_status not in self.job.statuses:
-			return
-		old = self.job.statuses.index(self.current_status())
-		new = self.job.statuses.index(new_status)
-		if new < old:
-			self.status_stack[-1] = new_status
-
-
-	def start(self):
-		self.status_stack.append(self.job.statuses[-1])
-
-
-	def end(self):
-		result = self.status_stack.pop()
-		if len(self.status_stack) == 0:
-			self.status_stack.append(self.job.statuses[-1])
-		return result
-
-
-
-class job:
-	statuses = ['NOSTATUS', 'ERROR', 'ABORT', 'FAIL', 'WARN', 'GOOD',
-		    'ALERT']
-
-	def __init__(self, dir):
-		self.dir = dir
-		self.control = os.path.join(dir, "control")
-		self.status = os.path.join(dir, "status.log")
-		if not os.path.exists(self.status):
-			self.status = os.path.join(dir, "status")
-		self.variables = {}
-		self.tests = []
-		self.kernel = None
-
-		# Get the user + tag info from the keyval file.
+def parse_path(db, path, level, reparse, mail_on_failure):
+	machine_list = os.path.join(path, ".machines")
+	if os.path.exists(machine_list):
+		# multi-machine job
+		for m in file(machine_list):
+			machine = m.rstrip()
+			if not machine:
+				continue
+			jobpath = os.path.join(path, machine)
+			jobname = "%s/%s" % (os.path.basename(path), machine)
+			try:
+				parse_one(db, jobname, jobpath, reparse,
+					  mail_on_failure)
+			except Exception:
+				traceback.print_exc()
+				continue
+	else:
+		# single machine job
+		job_elements = path.split("/")[-level:]
+		jobname = "/".join(job_elements)
 		try:
-			keyval = read_keyval(dir)
-			print keyval
-		except:
-			keyval = {}
-		self.user = keyval.get('user', None)
-		self.label = keyval.get('label', None)
-		self.machine = keyval.get('hostname', None)
-		if self.machine:
-			assert ',' not in self.machine
-		self.queued_time = get_timestamp(keyval, 'job_queued')
-		self.started_time = get_timestamp(keyval, 'job_started')
-		self.finished_time = get_timestamp(keyval, 'job_finished')
-		self.machine_owner = keyval.get('owner', None)
-
-		if not self.machine:
-			self.get_machine()
-
-		print 'MACHINE NAME: ' + self.machine
-		if not os.path.exists(self.status):
-			return None
-
-		self.grope_status()
+			parse_one(db, jobname, path, reparse, mail_on_failure)
+		except Exception:
+			traceback.print_exc()
 
 
-	def get_machine(self):
+def main():
+	options, args = parse_args()
+	results_dir = os.path.abspath(args[0])
+	assert os.path.exists(results_dir)
+
+	# build up the list of job dirs to parse
+	if options.singledir:
+		jobs_list = [results_dir]
+	else:
+		jobs_list = [os.path.join(results_dir, subdir)
+			     for subdir in os.listdir(results_dir)]
+
+	# build up the database
+	db = tko_db.db(autocommit=False, host=options.db_host,
+		       user=options.db_user, password=options.db_pass,
+		       database=options.db_name)
+
+	# parse all the jobs
+	for path in jobs_list:
+		lockfile = open(os.path.join(path, ".parse.lock"), "w")
+		flags = fcntl.LOCK_EX
+		if options.noblock:
+			flags |= fcntl.LOCK_NB
 		try:
-			hostname = os.path.join(self.dir, "sysinfo/hostname")
-			self.machine = open(hostname, 'r').readline().rstrip()
-			return
-		except:
-			pass
+			fcntl.flock(lockfile, flags)
+		except IOError, e:
+			# was this because the lock is unavailable?
+			if e.errno == errno.EWOULDBLOCK:
+				lockfile.close()
+				continue
+			else:
+				raise # something unexpected happened
 		try:
-			uname = os.path.join(self.dir, "sysinfo/uname_-a")
-			self.machine = open(uname, 'r').readline().split()[1]
-			return
-		except:
-			pass
-		raise "Could not figure out machine name"
+			parse_path(db, path, options.level, options.reparse,
+				   options.mailit)
+		finally:
+			fcntl.flock(lockfile, fcntl.LOCK_UN)
+			lockfile.close()
 
 
-	def grope_status(self):
-		"""
-		Note that what we're looking for here is level 1 groups
-		(ie end markers with 1 tab in front)
-
-		For back-compatiblity, we also count level 0 groups that
-		are not job-level events, if there's no start/end job level
-		markers: "START   ----    ----"
-		"""
-		dprint('=====================================================')
-		dprint(self.dir)
-		dprint('=====================================================')
-		self.kernel = kernel(self.dir)
-
-		reboot_inprogress = 0	# Saw reboot start and not finish
-		boot_count = 0
-		alert_pending = None	# Saw an ALERT for this test
-		group_subdir = None
-		group_status = status_stack(self)
-		sought_level = 0        # we log events at indent level 0
-		current_kernel = self.kernel
-		for line in open(self.status, 'r').readlines():
-			dprint('\nSTATUS: ' + line.rstrip())
-			if not re.search(r'^\t*\S', line):
-				dprint('Continuation line, ignoring')
-				continue	# ignore continuation lines
-			if re.search(r'^START\t----\t----', line):
-				sought_level = 1
-				# we now log events at indent level 1
-				dprint('Found job level start marker. Looking for level 1 groups now')
-				continue
-			if re.search(r'^END [^\t]*\t----\t----', line):
-				sought_level = 0
-				# the job is ended
-				dprint('Found job level end marker. Loocking for level 0 lines now')
-			indent = re.search('^(\t*)', line).group(0).count('\t')
-			line = line.lstrip()
-			line = line.rstrip('\n')
-			if line.startswith('START\t'):
-				group_subdir = None
-				group_status.start()
-				dprint('start line, ignoring')
-				continue	# ignore start lines
-			reason = None
-			if line.startswith('END '):
-				elements = line.split('\t')
-				elements[0] = elements[0][4:] # remove 'END '
-				end = True
-			else:
-				elements = line.split('\t')
-				end = False
-			(status, subdir, testname, reason) = elements[0:4]
-			status, subdir, testname = elements[:3]
-			reason = elements[-1]
-			optional_fields = dict(element.split('=', 1)
-					       for element in elements[3:-1])
-			group_status.update(status)
-			dprint('GROPE_STATUS: ' +
-			       str([group_status.current_status(), status,
-				    subdir, testname, reason]))
-			if status == 'ALERT':
-				dprint('job level alert, recording')
-				alert_pending = reason
-				continue
-			if testname == 'Autotest.install' and status == 'GOOD':
-				dprint('Sucessful autotest install, ignoring')
-				continue
-			if testname == '----':
-				if status == 'ABORT' and not end:
-					testname = 'JOB'
-				else:
-					dprint('job level event, ignoring')
-					# This is a job level event, not a test
-					continue
-			################################################
-			# REMOVE THIS SECTION ONCE OLD FORMAT JOBS ARE GONE
-			################################################
-			if re.search(r'^(GOOD|FAIL|WARN) ', line):
-				status, testname, reason = line.split(None, 2)
-
-				if testname.startswith('kernel.'):
-					subdir = 'build'
-				else:
-					subdir = testname
-			if testname.startswith('completed'):
-				raise 'testname is crap'
-			################################################
-			if subdir == '----':
-				subdir = None
-			if line.startswith('END'):
-				subdir = group_subdir
-			if (indent != sought_level and status != 'ABORT' and
-			    not testname.startswith('reboot.')):
-				# we're in a block group
-				if subdir:
-					dprint('set group_subdir: %s' % subdir)
-					group_subdir = subdir
-				dprint('incorrect indent level %d != %d, ignoring' % (indent, sought_level))
-				continue
-			if not re.search(r'^(boot(\.\d+)?$|kernel\.)', testname):
-				# This is a real test
-				if subdir and subdir.count('.'):
-					# eg dbench.ext3
-					testname = subdir
-			if testname == 'reboot.start':
-				dprint('reboot start event, ignoring')
-				reboot_inprogress = 1
-				continue
-			if testname == 'reboot.verify':
-				testname = 'boot.%d' % boot_count
-				dprint('reboot verified')
-				reboot_inprogress = 0
-				verify_ident = reason.strip()
-				current_kernel = kernel(self.dir, verify_ident)
-				boot_count += 1
-			if alert_pending:
-				status = 'ALERT'
-				reason = alert_pending
-				alert_pending = None
-			if status in self.statuses:
-				dprint('Adding: %s\nSubdir:%s\nTestname:%s\n%s'
-				       % (group_status.current_status(),
-					  subdir, testname, reason))
-			else:
-				dprint('WARNING: Invalid status code. Ignoring')
-				continue
-
-			finished_time = get_timestamp(optional_fields,
-						      'timestamp')
-			test_status = group_status.end()
-			self.tests.append(test(subdir, testname, test_status,
-					       reason, current_kernel, self,
-					       finished_time))
-			dprint('')
-
-		if reboot_inprogress:
-			testname = 'boot.%d' % boot_count
-			dprint('Adding: %s\nSubdir:%s\nTestname:%s\n%s' %
-					('----', subdir, testname, reason))
-			self.tests.append(test('----', testname, 'ABORT', 
-				'machine did not return from reboot',
-				current_kernel, self))
-			dprint('')
-
-
-class kernel:
-	def __init__(self, topdir, verify_ident=None):
-		self.base = 'UNKNOWN'
-		self.patches = []
-		patch_hashes = []
-		# HACK. we don't have proper build tags in the status file yet
-		# so we hardcode build/ and do it at the start of the job
-		build_log = os.path.join(topdir, 'build/debug/build_log')
-
-		if os.path.exists(build_log):
-			for line in open(build_log, 'r'):
-				print line
-				(type, rest) = line.split(': ', 1)
-				words = rest.split()
-				if type == 'BASE':
-					self.base = words[0]
-				if type == 'PATCH':
-					print words
-					self.patches.append(patch(*words[0:]))
-					patch_hashes.append(words[2])
-		elif verify_ident:
-			self.base = verify_ident
-		else:
-			for sysinfo in ['sysinfo/reboot1', 'sysinfo']:
-				uname_file = os.path.join(topdir, sysinfo, 'uname_-a')
-				if not os.path.exists(uname_file):
-					continue
-				uname = open(uname_file, 'r').readline().split()
-				self.base = uname[2]
-				re.sub(r'-autotest$', '', self.base)
-				break
-		print 'kernel.__init__() found kernel version %s' % self.base
-		if self.base == 'UNKNOWN':
-			self.kernel_hash = 'UNKNOWN'
-		else:
-			self.kernel_hash = self.get_kver_hash(self.base, patch_hashes)
-
-
-	def get_kver_hash(self, base, patch_hashes):
-		"""\
-		Calculate a hash representing the unique combination of
-		the kernel base version plus 
-		"""
-		key_string = ','.join([base] + patch_hashes)
-		return md5.new(key_string).hexdigest()
-
-
-class patch:
-	def __init__(self, spec, reference=None, hash=None):
-		# NEITHER OF THE ABOVE SHOULD HAVE DEFAULTS!!!! HACK HACK
-		if not reference:
-			reference = spec
-		print 'PATCH::%s %s %s' % (spec, reference, hash)
-		self.spec = spec
-		self.reference = reference
-		self.hash = hash
-
-
-class test:
-	def __init__(self, subdir, testname, status, reason, kernel, job,
-		     finished_time=None):
-		# NOTE: subdir may be none here for lines that aren't an
-		# actual test
-		self.subdir = subdir
-		self.testname = testname
-		self.status = status
-		self.reason = reason
-		self.version = None
-		self.keyval = None
-
-		if subdir:
-			keyval = os.path.join(job.dir, subdir, 'results/keyval')
-			if os.path.exists(keyval):
-				self.keyval = keyval
-			keyval2 = os.path.join(job.dir, subdir, 'keyval')
-			if os.path.exists(keyval2):
-				self.version = open(keyval2, 'r').readline().split('=')[1]
-		else:
-			self.keyval = None
-		self.iterations = []
-		self.kernel = kernel
-		self.machine = job.machine
-		self.finished_time = finished_time
-
-		dprint("PARSING TEST %s %s %s" % (subdir, testname, self.keyval))
-
-		if not self.keyval:
-			return
-		count = 1
-		lines = []
-		for line in open(self.keyval, 'r').readlines():
-			if not re.search('\S', line):		# blank line
-				self.iterations.append(iteration(count, lines))
-				lines = []
-				count += 1
-			else:
-				lines.append(line)
-		if lines:
-			self.iterations.append(iteration(count, lines))
-
-
-class iteration:
-	def __init__(self, index, lines):
-		self.index = index
-		self.keyval = {}
-
-		dprint("ADDING ITERATION %d" % index)
-		for line in lines:
-			line = line.rstrip();
-			(key, value) = line.split('=', 1)
-			self.keyval[key] = value
+if __name__ == "__main__":
+	main()