Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 1 | """Recognize image file formats based on their first few bytes.""" |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 2 | |
Berker Peksag | ef223a1 | 2016-10-01 05:01:54 +0300 | [diff] [blame] | 3 | from os import PathLike |
| 4 | |
Skip Montanaro | 17ab123 | 2001-01-24 06:27:27 +0000 | [diff] [blame] | 5 | __all__ = ["what"] |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 6 | |
| 7 | #-------------------------# |
Guido van Rossum | 45ac47c | 1997-10-08 15:22:32 +0000 | [diff] [blame] | 8 | # Recognize image headers # |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 9 | #-------------------------# |
| 10 | |
def what(file, h=None):
    """Return a string naming the image type, or None if unrecognized.

    file -- a filename (str, bytes or os.PathLike) or an already-open
            binary file object supporting tell(), read() and seek().
            It is only consulted when h is None.
    h    -- optional bytes holding the start of the image data.  When
            given, nothing is read from file.

    When h is None the first 32 bytes are read.  A filename is opened
    and closed here; a file object is left open with its position
    restored to where it was before the read.

    Each function in the module-level ``tests`` list is called as
    tf(h, f) in order, where f is the file opened here (or None); the
    first truthy result is returned.  Errors from open()/read()
    propagate to the caller.
    """
    f = None
    try:
        if h is None:
            # open() accepts bytes paths as well, so treat them as
            # filenames rather than as file objects.
            if isinstance(file, (str, bytes, PathLike)):
                f = open(file, 'rb')
                h = f.read(32)
            else:
                location = file.tell()
                h = file.read(32)
                file.seek(location)
        for tf in tests:
            res = tf(h, f)
            if res:
                return res
    finally:
        if f is not None:
            f.close()
    return None
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 29 | |
| 30 | |
| 31 | #---------------------------------# |
| 32 | # Subroutines per image file type # |
| 33 | #---------------------------------# |
| 34 | |
# Registry of detector functions tried in order by what().  Each one is
# called as tf(h, f); the first truthy return value becomes the result.
tests = []
| 36 | |
Benjamin Peterson | 0b95290 | 2008-08-16 16:48:16 +0000 | [diff] [blame] | 37 | def test_jpeg(h, f): |
| 38 | """JPEG data in JFIF or Exif format""" |
| 39 | if h[6:10] in (b'JFIF', b'Exif'): |
| 40 | return 'jpeg' |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 41 | |
# Register the JPEG detector.
tests.append(test_jpeg)
| 43 | |
| 44 | def test_png(h, f): |
| 45 | if h.startswith(b'\211PNG\r\n\032\n'): |
| 46 | return 'png' |
| 47 | |
# Register the PNG detector.
tests.append(test_png)
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 49 | |
| 50 | def test_gif(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 51 | """GIF ('87 and '89 variants)""" |
Barry Warsaw | 72937f3 | 2007-08-12 14:37:20 +0000 | [diff] [blame] | 52 | if h[:6] in (b'GIF87a', b'GIF89a'): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 53 | return 'gif' |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 54 | |
# Register the GIF detector.
tests.append(test_gif)
| 56 | |
Benjamin Peterson | 0b95290 | 2008-08-16 16:48:16 +0000 | [diff] [blame] | 57 | def test_tiff(h, f): |
| 58 | """TIFF (can be in Motorola or Intel byte order)""" |
| 59 | if h[:2] in (b'MM', b'II'): |
| 60 | return 'tiff' |
| 61 | |
# Register the TIFF detector.
tests.append(test_tiff)
| 63 | |
| 64 | def test_rgb(h, f): |
| 65 | """SGI image library""" |
| 66 | if h.startswith(b'\001\332'): |
| 67 | return 'rgb' |
| 68 | |
# Register the SGI RGB detector.
tests.append(test_rgb)
| 70 | |
Guido van Rossum | 2db9135 | 1992-10-18 17:09:59 +0000 | [diff] [blame] | 71 | def test_pbm(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 72 | """PBM (portable bitmap)""" |
| 73 | if len(h) >= 3 and \ |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 74 | h[0] == ord(b'P') and h[1] in b'14' and h[2] in b' \t\n\r': |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 75 | return 'pbm' |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 76 | |
# Register the PBM detector.
tests.append(test_pbm)
| 78 | |
| 79 | def test_pgm(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 80 | """PGM (portable graymap)""" |
| 81 | if len(h) >= 3 and \ |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 82 | h[0] == ord(b'P') and h[1] in b'25' and h[2] in b' \t\n\r': |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 83 | return 'pgm' |
Guido van Rossum | 2db9135 | 1992-10-18 17:09:59 +0000 | [diff] [blame] | 84 | |
# Register the PGM detector.
tests.append(test_pgm)
| 86 | |
| 87 | def test_ppm(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 88 | """PPM (portable pixmap)""" |
| 89 | if len(h) >= 3 and \ |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 90 | h[0] == ord(b'P') and h[1] in b'36' and h[2] in b' \t\n\r': |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 91 | return 'ppm' |
Guido van Rossum | 2db9135 | 1992-10-18 17:09:59 +0000 | [diff] [blame] | 92 | |
# Register the PPM detector.
tests.append(test_ppm)
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 94 | |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 95 | def test_rast(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 96 | """Sun raster file""" |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 97 | if h.startswith(b'\x59\xA6\x6A\x95'): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 98 | return 'rast' |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 99 | |
# Register the Sun raster detector.
tests.append(test_rast)
| 101 | |
Guido van Rossum | 05b55e7 | 1992-06-03 16:48:44 +0000 | [diff] [blame] | 102 | def test_xbm(h, f): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 103 | """X bitmap (X10 or X11)""" |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 104 | if h.startswith(b'#define '): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 105 | return 'xbm' |
Guido van Rossum | 05b55e7 | 1992-06-03 16:48:44 +0000 | [diff] [blame] | 106 | |
# Register the XBM detector.
tests.append(test_xbm)
| 108 | |
Guido van Rossum | 9e33074 | 1997-04-11 18:59:38 +0000 | [diff] [blame] | 109 | def test_bmp(h, f): |
Guido van Rossum | c934128 | 2007-08-13 17:50:00 +0000 | [diff] [blame] | 110 | if h.startswith(b'BM'): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 111 | return 'bmp' |
Tim Peters | 07e99cb | 2001-01-14 23:47:14 +0000 | [diff] [blame] | 112 | |
# Register the BMP detector.
tests.append(test_bmp)
| 114 | |
Serhiy Storchaka | 2f8dca7 | 2014-05-25 11:45:37 +0300 | [diff] [blame] | 115 | def test_webp(h, f): |
| 116 | if h.startswith(b'RIFF') and h[8:12] == b'WEBP': |
| 117 | return 'webp' |
| 118 | |
# Register the WebP detector.
tests.append(test_webp)
| 120 | |
R David Murray | 2f60820 | 2014-06-26 12:27:57 -0400 | [diff] [blame] | 121 | def test_exr(h, f): |
| 122 | if h.startswith(b'\x76\x2f\x31\x01'): |
| 123 | return 'exr' |
| 124 | |
# Register the OpenEXR detector.
tests.append(test_exr)
| 126 | |
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 127 | #--------------------# |
| 128 | # Small test program # |
| 129 | #--------------------# |
| 130 | |
def test():
    """Command-line driver: print the detected type of each argument.

    A leading '-r' argument is removed from sys.argv and turns on
    recursion into subdirectories.  With no remaining arguments the
    current directory ('.') is examined.  On KeyboardInterrupt a notice
    is written to stderr and the process exits with status 1.
    """
    import sys

    argv = sys.argv
    recursive = 0
    if len(argv) > 1 and argv[1] == '-r':
        # Drop the flag in place so only file names remain after argv[0].
        del argv[1:2]
        recursive = 1
    try:
        targets = argv[1:] or ['.']
        testall(targets, recursive, 1)
    except KeyboardInterrupt:
        sys.stderr.write('\n[Interrupted]\n')
        sys.exit(1)
Guido van Rossum | 1c34fc7 | 1992-05-27 14:06:59 +0000 | [diff] [blame] | 145 | |
| 146 | def testall(list, recursive, toplevel): |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 147 | import sys |
| 148 | import os |
| 149 | for filename in list: |
| 150 | if os.path.isdir(filename): |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 151 | print(filename + '/:', end=' ') |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 152 | if recursive or toplevel: |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 153 | print('recursing down:') |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 154 | import glob |
| 155 | names = glob.glob(os.path.join(filename, '*')) |
| 156 | testall(names, recursive, 0) |
| 157 | else: |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 158 | print('*** directory (use -r) ***') |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 159 | else: |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 160 | print(filename + ':', end=' ') |
Guido van Rossum | 54f22ed | 2000-02-04 15:10:34 +0000 | [diff] [blame] | 161 | sys.stdout.flush() |
| 162 | try: |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 163 | print(what(filename)) |
Andrew Svetlov | f7a17b4 | 2012-12-25 16:47:37 +0200 | [diff] [blame] | 164 | except OSError: |
Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 165 | print('*** not found ***') |
Barry Warsaw | 72937f3 | 2007-08-12 14:37:20 +0000 | [diff] [blame] | 166 | |
# Run the small test program when the module is executed as a script.
if __name__ == '__main__':
    test()