| #! /usr/bin/env python | 
 |  | 
 | """Mirror a remote ftp subtree into a local directory tree. | 
 |  | 
 | usage: ftpmirror [-v] [-q] [-i] [-m] [-n] [-r] [-s pat] | 
 |                  [-l username [-p passwd [-a account]]] | 
 | 		 hostname [remotedir [localdir]] | 
 | -v: verbose | 
 | -q: quiet | 
 | -i: interactive mode | 
 | -m: macintosh server (NCSA telnet 2.4) (implies -n -s '*.o') | 
 | -n: don't log in | 
 | -r: remove local files/directories no longer pertinent | 
 | -l username [-p passwd [-a account]]: login info (default anonymous ftp) | 
 | -s pat: skip files matching pattern | 
 | hostname: remote host | 
 | remotedir: remote directory (default initial) | 
 | localdir: local directory (default current) | 
 | """ | 
 |  | 
 | import os | 
 | import sys | 
 | import time | 
 | import getopt | 
 | import string | 
 | import ftplib | 
 | from fnmatch import fnmatch | 
 |  | 
 | # Print usage message and exit | 
 | def usage(*args): | 
 | 	sys.stdout = sys.stderr | 
 | 	for msg in args: print msg | 
 | 	print __doc__ | 
 | 	sys.exit(2) | 
 |  | 
 | verbose = 1 # 0 for -q, 2 for -v | 
 | interactive = 0 | 
 | mac = 0 | 
 | rmok = 0 | 
 | nologin = 0 | 
 | skippats = ['.', '..', '.mirrorinfo'] | 
 |  | 
 | # Main program: parse command line and start processing | 
 | def main(): | 
 | 	global verbose, interactive, mac, rmok, nologin | 
 | 	try: | 
 | 		opts, args = getopt.getopt(sys.argv[1:], 'a:bil:mnp:qrs:v') | 
 | 	except getopt.error, msg: | 
 | 		usage(msg) | 
 | 	login = '' | 
 | 	passwd = '' | 
 | 	account = '' | 
 | 	for o, a in opts: | 
 | 		if o == '-l': login = a | 
 | 		if o == '-p': passwd = a | 
 | 		if o == '-a': account = a | 
 | 		if o == '-v': verbose = verbose + 1 | 
 | 		if o == '-q': verbose = 0 | 
 | 		if o == '-i': interactive = 1 | 
 | 		if o == '-m': mac = 1; nologin = 1; skippats.append('*.o') | 
 | 		if o == '-n': nologin = 1 | 
 | 		if o == '-r': rmok = 1 | 
 | 		if o == '-s': skippats.append(a) | 
 | 	if not args: usage('hostname missing') | 
 | 	host = args[0] | 
 | 	remotedir = '' | 
 | 	localdir = '' | 
 | 	if args[1:]: | 
 | 		remotedir = args[1] | 
 | 		if args[2:]: | 
 | 			localdir = args[2] | 
 | 			if args[3:]: usage('too many arguments') | 
 | 	# | 
 | 	f = ftplib.FTP() | 
 | 	if verbose: print 'Connecting to %s...' % `host` | 
 | 	f.connect(host) | 
 | 	if not nologin: | 
 | 		if verbose: | 
 | 			print 'Logging in as %s...' % `login or 'anonymous'` | 
 | 		f.login(login, passwd, account) | 
 | 	if verbose: print 'OK.' | 
 | 	pwd = f.pwd() | 
 | 	if verbose > 1: print 'PWD =', `pwd` | 
 | 	if remotedir: | 
 | 		if verbose > 1: print 'cwd(%s)' % `remotedir` | 
 | 		f.cwd(remotedir) | 
 | 		if verbose > 1: print 'OK.' | 
 | 		pwd = f.pwd() | 
 | 		if verbose > 1: print 'PWD =', `pwd` | 
 | 	# | 
 | 	mirrorsubdir(f, localdir) | 
 |  | 
 | # Core logic: mirror one subdirectory (recursively) | 
 | def mirrorsubdir(f, localdir): | 
 | 	pwd = f.pwd() | 
 | 	if localdir and not os.path.isdir(localdir): | 
 | 		if verbose: print 'Creating local directory', `localdir` | 
 | 		try: | 
 | 		    makedir(localdir) | 
 | 		except os.error, msg: | 
 | 		    print "Failed to establish local directory", `localdir` | 
 | 		    return | 
 | 	infofilename = os.path.join(localdir, '.mirrorinfo') | 
 | 	try: | 
 | 		text = open(infofilename, 'r').read() | 
 | 	except IOError, msg: | 
 | 		text = '{}' | 
 | 	try: | 
 | 		info = eval(text) | 
 | 	except (SyntaxError, NameError): | 
 | 		print 'Bad mirror info in %s' % `infofilename` | 
 | 		info = {} | 
 | 	subdirs = [] | 
 | 	listing = [] | 
 | 	if verbose: print 'Listing remote directory %s...' % `pwd` | 
 | 	f.retrlines('LIST', listing.append) | 
 | 	filesfound = [] | 
 | 	for line in listing: | 
 | 		if verbose > 1: print '-->', `line` | 
 | 		if mac: | 
 | 			# Mac listing has just filenames; | 
 | 			# trailing / means subdirectory | 
 | 			filename = string.strip(line) | 
 | 			mode = '-' | 
 | 			if filename[-1:] == '/': | 
 | 				filename = filename[:-1] | 
 | 				mode = 'd' | 
 | 			infostuff = '' | 
 | 		else: | 
 | 			# Parse, assuming a UNIX listing | 
 | 			words = string.split(line, None, 8) | 
 | 			if len(words) < 6: | 
 | 				if verbose > 1: print 'Skipping short line' | 
 | 				continue | 
 | 			filename = string.lstrip(words[-1]) | 
 | 			i = string.find(filename, " -> ") | 
 | 			if i >= 0: | 
 | 				# words[0] had better start with 'l'... | 
 | 				if verbose > 1: | 
 | 				    print 'Found symbolic link %s' % `filename` | 
 | 				linkto = filename[i+4:] | 
 | 				filename = filename[:i] | 
 | 			infostuff = words[-5:-1] | 
 | 			mode = words[0] | 
 | 		skip = 0 | 
 | 		for pat in skippats: | 
 | 			if fnmatch(filename, pat): | 
 | 				if verbose > 1: | 
 | 					print 'Skip pattern', `pat`, | 
 | 					print 'matches', `filename` | 
 | 				skip = 1 | 
 | 				break | 
 | 		if skip: | 
 | 			continue | 
 | 		if mode[0] == 'd': | 
 | 			if verbose > 1: | 
 | 				print 'Remembering subdirectory', `filename` | 
 | 			subdirs.append(filename) | 
 | 			continue | 
 | 		filesfound.append(filename) | 
 | 		if info.has_key(filename) and info[filename] == infostuff: | 
 | 			if verbose > 1: | 
 | 				print 'Already have this version of',`filename` | 
 | 			continue | 
 | 		fullname = os.path.join(localdir, filename) | 
 | 		tempname = os.path.join(localdir, '@'+filename) | 
 | 		if interactive: | 
 | 			doit = askabout('file', filename, pwd) | 
 | 			if not doit: | 
 | 				if not info.has_key(filename): | 
 | 					info[filename] = 'Not retrieved' | 
 | 				continue | 
 | 		try: | 
 | 			os.unlink(tempname) | 
 | 		except os.error: | 
 | 			pass | 
 | 		if mode[0] == 'l': | 
 | 			if verbose: | 
 | 				print "Creating symlink %s -> %s" % ( | 
 | 					`filename`, `linkto`) | 
 | 			try: | 
 | 				os.symlink(linkto, tempname) | 
 | 			except IOError, msg: | 
 | 				print "Can't create %s: %s" % ( | 
 | 					`tempname`, str(msg)) | 
 | 				continue | 
 | 		else: | 
 | 			try: | 
 | 				fp = open(tempname, 'wb') | 
 | 			except IOError, msg: | 
 | 				print "Can't create %s: %s" % ( | 
 | 					`tempname`, str(msg)) | 
 | 				continue | 
 | 			if verbose: | 
 | 				print 'Retrieving %s from %s as %s...' % \ | 
 | 					  (`filename`, `pwd`, `fullname`) | 
 | 			if verbose: | 
 | 				fp1 = LoggingFile(fp, 1024, sys.stdout) | 
 | 			else: | 
 | 				fp1 = fp | 
 | 			t0 = time.time() | 
 | 			try: | 
 | 				f.retrbinary('RETR ' + filename, | 
 | 					     fp1.write, 8*1024) | 
 | 			except ftplib.error_perm, msg: | 
 | 				print msg | 
 | 			t1 = time.time() | 
 | 			bytes = fp.tell() | 
 | 			fp.close() | 
 | 			if fp1 != fp: | 
 | 				fp1.close() | 
 | 		try: | 
 | 			os.unlink(fullname) | 
 | 		except os.error: | 
 | 			pass		# Ignore the error | 
 | 		try: | 
 | 			os.rename(tempname, fullname) | 
 | 		except os.error, msg: | 
 | 			print "Can't rename %s to %s: %s" % (`tempname`, | 
 | 							     `fullname`, | 
 | 							     str(msg)) | 
 | 			continue | 
 | 		info[filename] = infostuff | 
 | 		writedict(info, infofilename) | 
 | 		if verbose and mode[0] != 'l': | 
 | 			dt = t1 - t0 | 
 | 			kbytes = bytes / 1024.0 | 
 | 			print int(round(kbytes)), | 
 | 			print 'Kbytes in', | 
 | 			print int(round(dt)), | 
 | 			print 'seconds', | 
 | 			if t1 > t0: | 
 | 				print '(~%d Kbytes/sec)' % \ | 
 | 					  int(round(kbytes/dt),) | 
 | 			print | 
 | 	# | 
 | 	# Remove files from info that are no longer remote | 
 | 	deletions = 0 | 
 | 	for filename in info.keys(): | 
 | 		if filename not in filesfound: | 
 | 			if verbose: | 
 | 				print "Removing obsolete info entry for", | 
 | 				print `filename`, "in", `localdir or "."` | 
 | 			del info[filename] | 
 | 			deletions = deletions + 1 | 
 | 	if deletions: | 
 | 		writedict(info, infofilename) | 
 | 	# | 
 | 	# Remove local files that are no longer in the remote directory | 
 | 	try: | 
 | 	    if not localdir: names = os.listdir(os.curdir) | 
 | 	    else: names = os.listdir(localdir) | 
 | 	except os.error: | 
 | 	    names = [] | 
 | 	for name in names: | 
 | 		if name[0] == '.' or info.has_key(name) or name in subdirs: | 
 | 			continue | 
 | 		skip = 0 | 
 | 		for pat in skippats: | 
 | 			if fnmatch(name, pat): | 
 | 				if verbose > 1: | 
 | 					print 'Skip pattern', `pat`, | 
 | 					print 'matches', `name` | 
 | 				skip = 1 | 
 | 				break | 
 | 		if skip: | 
 | 			continue | 
 | 		fullname = os.path.join(localdir, name) | 
 | 		if not rmok: | 
 | 			if verbose: | 
 | 				print 'Local file', `fullname`, | 
 | 				print 'is no longer pertinent' | 
 | 			continue | 
 | 		if verbose: print 'Removing local file/dir', `fullname` | 
 | 		remove(fullname) | 
 | 	# | 
 | 	# Recursively mirror subdirectories | 
 | 	for subdir in subdirs: | 
 | 		if interactive: | 
 | 			doit = askabout('subdirectory', subdir, pwd) | 
 | 			if not doit: continue | 
 | 		if verbose: print 'Processing subdirectory', `subdir` | 
 | 		localsubdir = os.path.join(localdir, subdir) | 
 | 		pwd = f.pwd() | 
 | 		if verbose > 1: | 
 | 			print 'Remote directory now:', `pwd` | 
 | 			print 'Remote cwd', `subdir` | 
 | 		try: | 
 | 			f.cwd(subdir) | 
 | 		except ftplib.error_perm, msg: | 
 | 			print "Can't chdir to", `subdir`, ":", `msg` | 
 | 		else: | 
 | 			if verbose: print 'Mirroring as', `localsubdir` | 
 | 			mirrorsubdir(f, localsubdir) | 
 | 			if verbose > 1: print 'Remote cwd ..' | 
 | 			f.cwd('..') | 
 | 		newpwd = f.pwd() | 
 | 		if newpwd != pwd: | 
 | 			print 'Ended up in wrong directory after cd + cd ..' | 
 | 			print 'Giving up now.' | 
 | 			break | 
 | 		else: | 
 | 			if verbose > 1: print 'OK.' | 
 |  | 
 | # Helper to remove a file or directory tree | 
 | def remove(fullname): | 
 | 	if os.path.isdir(fullname) and not os.path.islink(fullname): | 
 | 		try: | 
 | 			names = os.listdir(fullname) | 
 | 		except os.error: | 
 | 			names = [] | 
 | 		ok = 1 | 
 | 		for name in names: | 
 | 			if not remove(os.path.join(fullname, name)): | 
 | 				ok = 0 | 
 | 		if not ok: | 
 | 			return 0 | 
 | 		try: | 
 | 			os.rmdir(fullname) | 
 | 		except os.error, msg: | 
 | 			print "Can't remove local directory %s: %s" % \ | 
 | 			      (`fullname`, str(msg)) | 
 | 			return 0 | 
 | 	else: | 
 | 		try: | 
 | 			os.unlink(fullname) | 
 | 		except os.error, msg: | 
 | 			print "Can't remove local file %s: %s" % \ | 
 | 			      (`fullname`, str(msg)) | 
 | 			return 0 | 
 | 	return 1 | 
 |  | 
 | # Wrapper around a file for writing to write a hash sign every block. | 
 | class LoggingFile: | 
 | 	def __init__(self, fp, blocksize, outfp): | 
 | 		self.fp = fp | 
 | 		self.bytes = 0 | 
 | 		self.hashes = 0 | 
 | 		self.blocksize = blocksize | 
 | 		self.outfp = outfp | 
 | 	def write(self, data): | 
 | 		self.bytes = self.bytes + len(data) | 
 | 		hashes = int(self.bytes) / self.blocksize | 
 | 		while hashes > self.hashes: | 
 | 			self.outfp.write('#') | 
 | 			self.outfp.flush() | 
 | 			self.hashes = self.hashes + 1 | 
 | 		self.fp.write(data) | 
 | 	def close(self): | 
 | 		self.outfp.write('\n') | 
 |  | 
 | # Ask permission to download a file. | 
 | def askabout(filetype, filename, pwd): | 
 | 	prompt = 'Retrieve %s %s from %s ? [ny] ' % (filetype, filename, pwd) | 
 | 	while 1: | 
 | 		reply = string.lower(string.strip(raw_input(prompt))) | 
 | 		if reply in ['y', 'ye', 'yes']: | 
 | 			return 1 | 
 | 		if reply in ['', 'n', 'no', 'nop', 'nope']: | 
 | 			return 0 | 
 | 		print 'Please answer yes or no.' | 
 |  | 
 | # Create a directory if it doesn't exist.  Recursively create the | 
 | # parent directory as well if needed. | 
 | def makedir(pathname): | 
 | 	if os.path.isdir(pathname): | 
 | 		return | 
 | 	dirname = os.path.dirname(pathname) | 
 | 	if dirname: makedir(dirname) | 
 | 	os.mkdir(pathname, 0777) | 
 |  | 
 | # Write a dictionary to a file in a way that can be read back using | 
# eval() but is still somewhat readable (i.e. not a single long line).
 | # Also creates a backup file. | 
 | def writedict(dict, filename): | 
 | 	dir, file = os.path.split(filename) | 
 | 	tempname = os.path.join(dir, '@' + file) | 
 | 	backup = os.path.join(dir, file + '~') | 
 | 	try: | 
 | 		os.unlink(backup) | 
 | 	except os.error: | 
 | 		pass | 
 | 	fp = open(tempname, 'w') | 
 | 	fp.write('{\n') | 
 | 	for key, value in dict.items(): | 
 | 		fp.write('%s: %s,\n' % (`key`, `value`)) | 
 | 	fp.write('}\n') | 
 | 	fp.close() | 
 | 	try: | 
 | 		os.rename(filename, backup) | 
 | 	except os.error: | 
 | 		pass | 
 | 	os.rename(tempname, filename) | 
 |  | 
 | main() |