Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 1 | # Copyright (C) 2001-2004 Python Software Foundation |
Barry Warsaw | bb11386 | 2004-10-03 03:16:19 +0000 | [diff] [blame] | 2 | # Author: Barry Warsaw |
| 3 | # Contact: email-sig@python.org |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 4 | |
Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 5 | """Encodings and related functions.""" |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 6 | |
| 7 | import base64 |
Barry Warsaw | bb11386 | 2004-10-03 03:16:19 +0000 | [diff] [blame] | 8 | from quopri import encodestring as _encodestring |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 9 | |
Barry Warsaw | bb11386 | 2004-10-03 03:16:19 +0000 | [diff] [blame] | 10 | def _qencode(s): |
| 11 | enc = _encodestring(s, quotetabs=True) |
| 12 | # Must encode spaces, which quopri.encodestring() doesn't do |
| 13 | return enc.replace(' ', '=20') |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 14 | |
Barry Warsaw | 6f70c41 | 2001-09-26 05:26:22 +0000 | [diff] [blame] | 15 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 16 | def _bencode(s): |
| 17 | # We can't quite use base64.encodestring() since it tacks on a "courtesy |
| 18 | # newline". Blech! |
| 19 | if not s: |
| 20 | return s |
| 21 | hasnewline = (s[-1] == '\n') |
| 22 | value = base64.encodestring(s) |
| 23 | if not hasnewline and value[-1] == '\n': |
| 24 | return value[:-1] |
| 25 | return value |
| 26 | |
| 27 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 28 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 29 | def encode_base64(msg): |
| 30 | """Encode the message's payload in Base64. |
| 31 | |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 32 | Also, add an appropriate Content-Transfer-Encoding header. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 33 | """ |
| 34 | orig = msg.get_payload() |
| 35 | encdata = _bencode(orig) |
| 36 | msg.set_payload(encdata) |
| 37 | msg['Content-Transfer-Encoding'] = 'base64' |
| 38 | |
| 39 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 40 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 41 | def encode_quopri(msg): |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 42 | """Encode the message's payload in quoted-printable. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 43 | |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 44 | Also, add an appropriate Content-Transfer-Encoding header. |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 45 | """ |
| 46 | orig = msg.get_payload() |
| 47 | encdata = _qencode(orig) |
| 48 | msg.set_payload(encdata) |
| 49 | msg['Content-Transfer-Encoding'] = 'quoted-printable' |
| 50 | |
| 51 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 52 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 53 | def encode_7or8bit(msg): |
Barry Warsaw | 12272a2 | 2002-10-01 00:05:24 +0000 | [diff] [blame] | 54 | """Set the Content-Transfer-Encoding header to 7bit or 8bit.""" |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 55 | orig = msg.get_payload() |
Barry Warsaw | 409a4c0 | 2002-04-10 21:01:31 +0000 | [diff] [blame] | 56 | if orig is None: |
| 57 | # There's no payload. For backwards compatibility we use 7bit |
| 58 | msg['Content-Transfer-Encoding'] = '7bit' |
| 59 | return |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 60 | # We play a trick to make this go fast. If encoding to ASCII succeeds, we |
| 61 | # know the data must be 7bit, otherwise treat it as 8bit. |
| 62 | try: |
| 63 | orig.encode('ascii') |
| 64 | except UnicodeError: |
Barry Warsaw | 61e5616 | 2004-05-13 22:50:12 +0000 | [diff] [blame] | 65 | # iso-2022-* is non-ASCII but still 7-bit |
| 66 | charset = msg.get_charset() |
| 67 | output_cset = charset and charset.output_charset |
| 68 | if output_cset and output_cset.lower().startswith('iso-2202-'): |
| 69 | msg['Content-Transfer-Encoding'] = '7bit' |
| 70 | else: |
| 71 | msg['Content-Transfer-Encoding'] = '8bit' |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 72 | else: |
| 73 | msg['Content-Transfer-Encoding'] = '7bit' |
| 74 | |
| 75 | |
Barry Warsaw | e968ead | 2001-10-04 17:05:11 +0000 | [diff] [blame] | 76 | |
Barry Warsaw | ba92580 | 2001-09-23 03:17:28 +0000 | [diff] [blame] | 77 | def encode_noop(msg): |
| 78 | """Do nothing.""" |