| #! /usr/bin/env python | 
 |  | 
 | # Extract statistics from ftp daemon log. | 
 |  | 
 | # Usage: | 
 | # ftpstats [-m maxitems] [-s search] [file] | 
 | # -m maxitems: restrict number of items in "top-N" lists, default 25. | 
 | # -s string:   restrict statistics to lines containing this string. | 
 | # Default file is /usr/adm/ftpd;  a "-" means read stdandard input. | 
 |  | 
 | # The script must be run on the host where the ftp daemon runs. | 
 | # (At CWI this is currently buizerd.) | 
 |  | 
 | import os | 
 | import sys | 
 | import regex | 
 | import string | 
 | import getopt | 
 |  | 
 | pat = '^\([a-zA-Z0-9 :]*\)!\(.*\)!\(.*\)!\([<>].*\)!\([0-9]+\)!\([0-9]+\)$' | 
 | prog = regex.compile(pat) | 
 |  | 
 | def main(): | 
 | 	maxitems = 25 | 
 | 	search = None | 
 | 	try: | 
 | 		opts, args = getopt.getopt(sys.argv[1:], 'm:s:') | 
 | 	except getopt.error, msg: | 
 | 		print msg | 
 | 		print 'usage: ftpstats [-m maxitems] [file]' | 
 | 		sys.exit(2) | 
 | 	for o, a in opts: | 
 | 		if o == '-m': | 
 | 			maxitems = string.atoi(a) | 
 | 		if o == '-s': | 
 | 			search = a | 
 | 	file = '/usr/adm/ftpd' | 
 | 	if args: file = args[0] | 
 | 	if file == '-': | 
 | 		f = sys.stdin | 
 | 	else: | 
 | 		try: | 
 | 			f = open(file, 'r') | 
 | 		except IOError, msg: | 
 | 			print file, ':', msg | 
 | 			sys.exit(1) | 
 | 	bydate = {} | 
 | 	bytime = {} | 
 | 	byfile = {} | 
 | 	bydir = {} | 
 | 	byhost = {} | 
 | 	byuser = {} | 
 | 	bytype = {} | 
 | 	lineno = 0 | 
 | 	try: | 
 | 		while 1: | 
 | 			line = f.readline() | 
 | 			if not line: break | 
 | 			lineno = lineno + 1 | 
 | 			if search and string.find(line, search) < 0: | 
 | 				continue | 
 | 			if prog.match(line) < 0: | 
 | 				print 'Bad line', lineno, ':', `line` | 
 | 				continue | 
 | 			items = prog.group(1, 2, 3, 4, 5, 6) | 
 | 			(logtime, loguser, loghost, logfile, logbytes, | 
 | 			 logxxx2) = items | 
 | ## 			print logtime | 
 | ## 			print '-->', loguser | 
 | ## 			print '--> -->', loghost | 
 | ## 			print '--> --> -->', logfile | 
 | ## 			print '--> --> --> -->', logbytes | 
 | ## 			print '--> --> --> --> -->', logxxx2 | 
 | ## 			for i in logtime, loghost, logbytes, logxxx2: | 
 | ## 				if '!' in i: print '???', i | 
 | 			add(bydate, logtime[-4:] + ' ' + logtime[:6], items) | 
 | 			add(bytime, logtime[7:9] + ':00-59', items) | 
 | 			direction, logfile = logfile[0], logfile[1:] | 
 | 			# The real path probably starts at the last //... | 
 | 			while 1: | 
 | 				i = string.find(logfile, '//') | 
 | 				if i < 0: break | 
 | 				logfile = logfile[i+1:] | 
 | 			add(byfile, logfile + ' ' + direction, items) | 
 | 			logdir = os.path.dirname(logfile) | 
 | ##		logdir = os.path.normpath(logdir) + '/.' | 
 | 			while 1: | 
 | 				add(bydir, logdir + ' ' + direction, items) | 
 | 				dirhead = os.path.dirname(logdir) | 
 | 				if dirhead == logdir: break | 
 | 				logdir = dirhead | 
 | 			add(byhost, loghost, items) | 
 | 			add(byuser, loguser, items) | 
 | 			add(bytype, direction, items) | 
 | 	except KeyboardInterrupt: | 
 | 		print 'Interrupted at line', lineno | 
 | 	show(bytype, 'by transfer direction', maxitems) | 
 | 	show(bydir, 'by directory', maxitems) | 
 | 	show(byfile, 'by file', maxitems) | 
 | 	show(byhost, 'by host', maxitems) | 
 | 	show(byuser, 'by user', maxitems) | 
 | 	showbar(bydate, 'by date') | 
 | 	showbar(bytime, 'by time of day') | 
 |  | 
 | def showbar(dict, title): | 
 | 	n = len(title) | 
 | 	print '='*((70-n)/2), title, '='*((71-n)/2) | 
 | 	list = [] | 
 | 	keys = dict.keys() | 
 | 	keys.sort() | 
 | 	for key in keys: | 
 | 		n = len(str(key)) | 
 | 		list.append((len(dict[key]), key)) | 
 | 	maxkeylength = 0 | 
 | 	maxcount = 0 | 
 | 	for count, key in list: | 
 | 		maxkeylength = max(maxkeylength, len(key)) | 
 | 		maxcount = max(maxcount, count) | 
 | 	maxbarlength = 72 - maxkeylength - 7 | 
 | 	for count, key in list: | 
 | 		barlength = int(round(maxbarlength*float(count)/maxcount)) | 
 | 		bar = '*'*barlength | 
 | 		print '%5d %-*s %s' % (count, maxkeylength, key, bar) | 
 |  | 
 | def show(dict, title, maxitems): | 
 | 	if len(dict) > maxitems: | 
 | 		title = title + ' (first %d)'%maxitems | 
 | 	n = len(title) | 
 | 	print '='*((70-n)/2), title, '='*((71-n)/2) | 
 | 	list = [] | 
 | 	keys = dict.keys() | 
 | 	for key in keys: | 
 | 		list.append((-len(dict[key]), key)) | 
 | 	list.sort() | 
 | 	for count, key in list[:maxitems]: | 
 | 		print '%5d %s' % (-count, key) | 
 |  | 
 | def add(dict, key, item): | 
 | 	if dict.has_key(key): | 
 | 		dict[key].append(item) | 
 | 	else: | 
 | 		dict[key] = [item] | 
 |  | 
 | main() |