Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 1 | # Copyright (C) 2001-2004 Python Software Foundation |
| 2 | # Author: barry@python.org (Barry Warsaw) |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 3 | |
Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 4 | """Encodings and related functions.""" |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 5 | |
| 6 | import base64 |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 7 | |
| 8 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 9 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 10 | # Helpers |
Barry Warsaw | 8c1aac2 | 2002-05-19 23:44:19 +0000 | [diff] [blame] | 11 | try: |
| 12 | from quopri import encodestring as _encodestring |
| 13 | |
| 14 | def _qencode(s): |
| 15 | enc = _encodestring(s, quotetabs=1) |
| 16 | # Must encode spaces, which quopri.encodestring() doesn't do |
| 17 | return enc.replace(' ', '=20') |
| 18 | except ImportError: |
| 19 | # Python 2.1 doesn't have quopri.encodestring() |
| 20 | from cStringIO import StringIO |
| 21 | import quopri as _quopri |
| 22 | |
| 23 | def _qencode(s): |
| 24 | if not s: |
| 25 | return s |
| 26 | hasnewline = (s[-1] == '\n') |
| 27 | infp = StringIO(s) |
| 28 | outfp = StringIO() |
| 29 | _quopri.encode(infp, outfp, quotetabs=1) |
| 30 | # Python 2.x's encode() doesn't encode spaces even when quotetabs==1 |
| 31 | value = outfp.getvalue().replace(' ', '=20') |
| 32 | if not hasnewline and value[-1] == '\n': |
| 33 | return value[:-1] |
| 34 | return value |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 35 | |
Barry Warsaw | 6f70c41 | 2001-09-26 05:26:22 +0000 | [diff] [blame] | 36 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 37 | def _bencode(s): |
| 38 | # We can't quite use base64.encodestring() since it tacks on a "courtesy |
| 39 | # newline". Blech! |
| 40 | if not s: |
| 41 | return s |
| 42 | hasnewline = (s[-1] == '\n') |
| 43 | value = base64.encodestring(s) |
| 44 | if not hasnewline and value[-1] == '\n': |
| 45 | return value[:-1] |
| 46 | return value |
| 47 | |
| 48 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 49 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 50 | def encode_base64(msg): |
| 51 | """Encode the message's payload in Base64. |
| 52 | |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 53 | Also, add an appropriate Content-Transfer-Encoding header. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 54 | """ |
| 55 | orig = msg.get_payload() |
| 56 | encdata = _bencode(orig) |
| 57 | msg.set_payload(encdata) |
| 58 | msg['Content-Transfer-Encoding'] = 'base64' |
| 59 | |
| 60 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 61 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 62 | def encode_quopri(msg): |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 63 | """Encode the message's payload in quoted-printable. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 64 | |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 65 | Also, add an appropriate Content-Transfer-Encoding header. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 66 | """ |
| 67 | orig = msg.get_payload() |
| 68 | encdata = _qencode(orig) |
| 69 | msg.set_payload(encdata) |
| 70 | msg['Content-Transfer-Encoding'] = 'quoted-printable' |
| 71 | |
| 72 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 73 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 74 | def encode_7or8bit(msg): |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 75 | """Set the Content-Transfer-Encoding header to 7bit or 8bit.""" |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 76 | orig = msg.get_payload() |
Barry Warsaw | 409a4c0 | 2002-04-10 21:01:31 +0000 | [diff] [blame] | 77 | if orig is None: |
| 78 | # There's no payload. For backwards compatibility we use 7bit |
| 79 | msg['Content-Transfer-Encoding'] = '7bit' |
| 80 | return |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 81 | # We play a trick to make this go fast. If encoding to ASCII succeeds, we |
| 82 | # know the data must be 7bit, otherwise treat it as 8bit. |
| 83 | try: |
| 84 | orig.encode('ascii') |
| 85 | except UnicodeError: |
Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 86 | # iso-2022-* is non-ASCII but still 7-bit |
| 87 | charset = msg.get_charset() |
| 88 | output_cset = charset and charset.output_charset |
| 89 | if output_cset and output_cset.lower().startswith('iso-2202-'): |
| 90 | msg['Content-Transfer-Encoding'] = '7bit' |
| 91 | else: |
| 92 | msg['Content-Transfer-Encoding'] = '8bit' |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 93 | else: |
| 94 | msg['Content-Transfer-Encoding'] = '7bit' |
| 95 | |
| 96 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 97 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 98 | def encode_noop(msg): |
| 99 | """Do nothing.""" |