Benjamin Peterson | 90f5ba5 | 2010-03-11 22:53:45 +0000 | [diff] [blame] | 1 | #! /usr/bin/env python3 |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 2 | |
| 3 | """Python utility to print MD5 checksums of argument files. |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 4 | """ |
| 5 | |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 6 | |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 7 | bufsize = 8096 |
| 8 | fnfilter = None |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 9 | rmode = 'rb' |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 10 | |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 11 | usage = """ |
Berker Peksag | 7aee3ec | 2014-07-11 20:42:18 +0300 | [diff] [blame] | 12 | usage: md5sum.py [-b] [-t] [-l] [-s bufsize] [file ...] |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 13 | -b : read files in binary mode (default) |
| 14 | -t : read files in text mode (you almost certainly don't want this!) |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 15 | -l : print last pathname component only |
| 16 | -s bufsize: read buffer size (default %d) |
| 17 | file ... : files to sum; '-' or no files means stdin |
| 18 | """ % bufsize |
| 19 | |
Berker Peksag | 7aee3ec | 2014-07-11 20:42:18 +0300 | [diff] [blame] | 20 | import io |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 21 | import sys |
| 22 | import os |
| 23 | import getopt |
R David Murray | 54ac832 | 2012-04-04 21:28:14 -0400 | [diff] [blame] | 24 | from hashlib import md5 |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 25 | |
| 26 | def sum(*files): |
| 27 | sts = 0 |
Berker Peksag | 7aee3ec | 2014-07-11 20:42:18 +0300 | [diff] [blame] | 28 | if files and isinstance(files[-1], io.IOBase): |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 29 | out, files = files[-1], files[:-1] |
| 30 | else: |
| 31 | out = sys.stdout |
| 32 | if len(files) == 1 and not isinstance(files[0], str): |
| 33 | files = files[0] |
| 34 | for f in files: |
| 35 | if isinstance(f, str): |
| 36 | if f == '-': |
| 37 | sts = printsumfp(sys.stdin, '<stdin>', out) or sts |
| 38 | else: |
| 39 | sts = printsum(f, out) or sts |
| 40 | else: |
| 41 | sts = sum(f, out) or sts |
| 42 | return sts |
| 43 | |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 44 | def printsum(filename, out=sys.stdout): |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 45 | try: |
| 46 | fp = open(filename, rmode) |
Guido van Rossum | b940e11 | 2007-01-10 16:19:56 +0000 | [diff] [blame] | 47 | except IOError as msg: |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 48 | sys.stderr.write('%s: Can\'t open: %s\n' % (filename, msg)) |
| 49 | return 1 |
| 50 | if fnfilter: |
| 51 | filename = fnfilter(filename) |
| 52 | sts = printsumfp(fp, filename, out) |
| 53 | fp.close() |
| 54 | return sts |
| 55 | |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 56 | def printsumfp(fp, filename, out=sys.stdout): |
Berker Peksag | 7aee3ec | 2014-07-11 20:42:18 +0300 | [diff] [blame] | 57 | m = md5() |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 58 | try: |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 59 | while 1: |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 60 | data = fp.read(bufsize) |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 61 | if not data: |
| 62 | break |
Berker Peksag | 7aee3ec | 2014-07-11 20:42:18 +0300 | [diff] [blame] | 63 | if isinstance(data, str): |
| 64 | data = data.encode(fp.encoding) |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 65 | m.update(data) |
Guido van Rossum | b940e11 | 2007-01-10 16:19:56 +0000 | [diff] [blame] | 66 | except IOError as msg: |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 67 | sys.stderr.write('%s: I/O error: %s\n' % (filename, msg)) |
| 68 | return 1 |
| 69 | out.write('%s %s\n' % (m.hexdigest(), filename)) |
| 70 | return 0 |
Guido van Rossum | 9966e2c | 2001-06-22 16:05:48 +0000 | [diff] [blame] | 71 | |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 72 | def main(args = sys.argv[1:], out=sys.stdout): |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 73 | global fnfilter, rmode, bufsize |
| 74 | try: |
| 75 | opts, args = getopt.getopt(args, 'blts:') |
Guido van Rossum | b940e11 | 2007-01-10 16:19:56 +0000 | [diff] [blame] | 76 | except getopt.error as msg: |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 77 | sys.stderr.write('%s: %s\n%s' % (sys.argv[0], msg, usage)) |
| 78 | return 2 |
| 79 | for o, a in opts: |
| 80 | if o == '-l': |
| 81 | fnfilter = os.path.basename |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 82 | elif o == '-b': |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 83 | rmode = 'rb' |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 84 | elif o == '-t': |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 85 | rmode = 'r' |
Tim Peters | 1a3abcb | 2003-08-18 23:52:09 +0000 | [diff] [blame] | 86 | elif o == '-s': |
Andrew M. Kuchling | 4693d46 | 2003-05-13 17:39:26 +0000 | [diff] [blame] | 87 | bufsize = int(a) |
| 88 | if not args: |
| 89 | args = ['-'] |
| 90 | return sum(args, out) |
| 91 | |
| 92 | if __name__ == '__main__' or __name__ == sys.argv[0]: |
| 93 | sys.exit(main(sys.argv[1:], sys.stdout)) |