blob: 9c15752fe3123520ba236be27f3ad06953304707 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossumaa925a51997-04-02 05:47:39 +00002
Barry Warsaw4c904d12004-01-04 01:12:26 +00003"""RFC 3548: Base16, Base32, Base64 Data Encodings"""
Guido van Rossum4acc25b2000-02-02 15:10:15 +00004
Barry Warsaw4c904d12004-01-04 01:12:26 +00005# Modified 04-Oct-1995 by Jack Jansen to use binascii module
6# Modified 30-Dec-2003 by Barry Warsaw to add full RFC 3548 support
Guido van Rossum4581ae52007-05-22 21:56:47 +00007# Modified 22-May-2007 by Guido van Rossum to use bytes everywhere
Jack Jansen951213e1995-10-04 16:39:20 +00008
Barry Warsaw4c904d12004-01-04 01:12:26 +00009import re
10import struct
Jack Jansen951213e1995-10-04 16:39:20 +000011import binascii
12
Barry Warsaw4c904d12004-01-04 01:12:26 +000013
# Public names exported by ``from base64 import *``.
__all__ = [
    # Legacy interface exports traditional RFC 1521 Base64 encodings
    'encode', 'decode', 'encodebytes', 'decodebytes',
    # Generalized interface for other encodings
    'b64encode', 'b64decode', 'b32encode', 'b32decode',
    'b16encode', 'b16decode',
    # Standard Base64 encoding
    'standard_b64encode', 'standard_b64decode',
    # Some common Base64 alternatives.  As referenced by RFC 3548, see thread
    # starting at:
    #
    # http://zgp.org/pipermail/p2p-hackers/2001-September/000316.html
    'urlsafe_b64encode', 'urlsafe_b64decode',
    ]
28
Barry Warsaw4c904d12004-01-04 01:12:26 +000029
Guido van Rossum254348e2007-11-21 19:29:53 +000030bytes_types = (bytes, bytearray) # Types acceptable as binary data
Guido van Rossum98297ee2007-11-06 21:34:58 +000031
Antoine Pitrouea6b4d52012-02-20 19:30:23 +010032def _bytes_from_decode_data(s):
33 if isinstance(s, str):
34 try:
35 return s.encode('ascii')
36 except UnicodeEncodeError:
37 raise ValueError('string argument should contain only ASCII characters')
38 elif isinstance(s, bytes_types):
39 return s
40 else:
41 raise TypeError("argument should be bytes or ASCII string, not %s" % s.__class__.__name__)
Guido van Rossum98297ee2007-11-06 21:34:58 +000042
Barry Warsaw4c904d12004-01-04 01:12:26 +000043
Antoine Pitroufd036452008-08-19 17:56:33 +000044
Barry Warsaw4c904d12004-01-04 01:12:26 +000045# Base64 encoding/decoding uses binascii
46
def b64encode(s, altchars=None):
    """Encode a bytes-like object using Base64.

    s is the data to encode.  Optional altchars must be a bytes-like
    object of length 2 which specifies an alternative alphabet for the
    '+' and '/' characters.  This allows an application to e.g. generate
    url or filesystem safe Base64 strings.

    The encoded data is returned as a bytes object.

    Raises TypeError if s or altchars is not a bytes-like object (for
    example a str), and ValueError if altchars does not have length 2.
    """
    # binascii rejects anything that is not bytes-like with a TypeError, so
    # no separate type check is needed.  b2a_base64() always appends a
    # newline; strip it off.
    encoded = binascii.b2a_base64(s)[:-1]
    if altchars is None:
        return encoded
    # Validate explicitly instead of with ``assert`` so that the check is
    # still performed when Python runs with -O.
    if len(altchars) != 2:
        raise ValueError("altchars must be of length 2, not %r" % (altchars,))
    return encoded.translate(bytes.maketrans(b'+/', altchars))
68
69
def b64decode(s, altchars=None, validate=False):
    """Decode Base64 encoded data.

    s is the data to decode: an ASCII string or binary data, as accepted
    by _bytes_from_decode_data().  Optional altchars must be a string or
    binary data of length 2 which specifies the alternative alphabet used
    instead of the '+' and '/' characters.

    The decoded data is returned.  A binascii.Error is raised if s is
    incorrectly padded.

    If validate is False (the default), non-base64-alphabet characters are
    discarded prior to the padding check.  If validate is True,
    non-base64-alphabet characters in the input (including a trailing
    newline) result in a binascii.Error.

    Raises ValueError if altchars does not have length 2.
    """
    s = _bytes_from_decode_data(s)
    if altchars is not None:
        altchars = _bytes_from_decode_data(altchars)
        # Validate explicitly instead of with ``assert`` so that the check
        # is still performed when Python runs with -O.
        if len(altchars) != 2:
            raise ValueError(
                "altchars must be of length 2, not %r" % (altchars,))
        s = s.translate(bytes.maketrans(altchars, b'+/'))
    # Use fullmatch() rather than match() with a '$' anchor: '$' also
    # matches just before a trailing newline, which would let b'YWJj\n'
    # slip through strict validation.
    if validate and not re.fullmatch(b'[A-Za-z0-9+/]*={0,2}', s):
        raise binascii.Error('Non-base64 digit found')
    return binascii.a2b_base64(s)
Barry Warsaw4c904d12004-01-04 01:12:26 +000092
93
def standard_b64encode(s):
    """Encode a byte string using the standard Base64 alphabet.

    s is the byte string to encode; the Base64 encoded byte string is
    returned.  This is b64encode() without an alternative alphabet.
    """
    encoded = b64encode(s)
    return encoded
100
def standard_b64decode(s):
    """Decode a byte string encoded with the standard Base64 alphabet.

    s is the byte string to decode.  The decoded byte string is
    returned.

    This delegates to b64decode() with its default arguments (no
    altchars, validate=False).  As documented there, binascii.Error is
    raised if the input is incorrectly padded, while characters outside
    the Base64 alphabet are discarded prior to the padding check rather
    than reported as an error.
    """
    return b64decode(s)
110
Guido van Rossum95c1c482012-06-22 15:16:09 -0700111
# Translation tables between the standard alphabet characters '+' and '/'
# and their url-safe replacements '-' and '_'.
_urlsafe_encode_translation = bytes.maketrans(b'+/', b'-_')
_urlsafe_decode_translation = bytes.maketrans(b'-_', b'+/')


def urlsafe_b64encode(s):
    """Encode a byte string using a url-safe Base64 alphabet.

    s is the byte string to encode.  It is first encoded with the
    standard alphabet and then '+' is replaced by '-' and '/' by '_'.
    The encoded byte string is returned.
    """
    standard = b64encode(s)
    return standard.translate(_urlsafe_encode_translation)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000123
def urlsafe_b64decode(s):
    """Decode a byte string encoded with the url-safe Base64 alphabet.

    s is the byte string (or ASCII string) to decode.  The decoded byte
    string is returned.

    The alphabet uses '-' instead of '+' and '_' instead of '/'.  These
    two characters are translated back to the standard alphabet and the
    result is passed to b64decode() with its default arguments, so
    binascii.Error is raised if the input is incorrectly padded, while
    other non-alphabet characters are discarded rather than reported
    (validate defaults to False).
    """
    # Normalize to binary data first so that .translate() gets bytes.
    s = _bytes_from_decode_data(s)
    s = s.translate(_urlsafe_decode_translation)
    return b64decode(s)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000137
138
Antoine Pitroufd036452008-08-19 17:56:33 +0000139
Barry Warsaw4c904d12004-01-04 01:12:26 +0000140# Base32 encoding/decoding must be done in Python
_b32alphabet = b'ABCDEFGHIJKLMNOPQRSTUVWXYZ234567'
# Single encoded characters, indexed by their 5-bit value.
_b32tab = [bytes([i]) for i in _b32alphabet]
# Pairs of encoded characters, indexed by a 10-bit value.
_b32tab2 = [a + b for a in _b32tab for b in _b32tab]
# Reverse mapping: byte value of an alphabet character -> 5-bit value.
_b32rev = {v: k for k, v in enumerate(_b32alphabet)}


def b32encode(s):
    """Encode a bytes-like object using Base32.

    s is the data to encode; any object supporting the buffer protocol
    (bytes, bytearray, memoryview, ...) is accepted.  The encoded data is
    returned as a bytes object, padded with '=' to a multiple of 8
    characters.

    Raises TypeError if s is not a bytes-like object (for example a str).
    """
    try:
        # Work on a private bytes copy: this accepts every bytes-like
        # object and guarantees the caller's buffer is never modified by
        # the zero padding below.
        s = memoryview(s).tobytes()
    except TypeError:
        raise TypeError("expected bytes-like object, not %s"
                        % s.__class__.__name__) from None
    leftover = len(s) % 5
    # Pad the last quantum with zero bits if necessary
    if leftover:
        s = s + bytes(5 - leftover)
    encoded = bytearray()
    from_bytes = int.from_bytes
    b32tab2 = _b32tab2
    for i in range(0, len(s), 5):
        # Each 5-byte quantum is a 40-bit number encoded as four 10-bit
        # lookups of two characters each.
        c = from_bytes(s[i: i + 5], 'big')
        encoded += (b32tab2[c >> 30] +           # bits 1 - 10
                    b32tab2[(c >> 20) & 0x3ff] + # bits 11 - 20
                    b32tab2[(c >> 10) & 0x3ff] + # bits 21 - 30
                    b32tab2[c & 0x3ff]           # bits 31 - 40
                   )
    # Adjust for any leftover partial quanta: the characters produced
    # purely by the zero padding are replaced with '='.  The tuple is
    # indexed by the number of leftover input bytes.
    npad = (0, 6, 4, 3, 1)[leftover]
    if npad:
        encoded[-npad:] = b'=' * npad
    return bytes(encoded)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000177
def b32decode(s, casefold=False, map01=None):
    """Decode a Base32 encoded byte string.

    s is the byte string (or ASCII string) to decode.  Optional casefold
    is a flag specifying whether a lowercase alphabet is acceptable as
    input.  For security purposes, the default is False.

    RFC 3548 allows for optional mapping of the digit 0 (zero) to the
    letter O (oh), and for optional mapping of the digit 1 (one) to
    either the letter I (eye) or letter L (el).  The optional argument
    map01 when not None, specifies which letter the digit 1 should be
    mapped to (when map01 is not None, the digit 0 is always mapped to
    the letter O).  For security purposes the default is None, so that
    0 and 1 are not allowed in the input.

    The decoded byte string is returned.  binascii.Error is raised if
    the input is incorrectly padded or if there are non-alphabet
    characters present in the input.  ValueError is raised if map01 does
    not have length 1.
    """
    s = _bytes_from_decode_data(s)
    if len(s) % 8:
        raise binascii.Error('Incorrect padding')
    # Handle section 2.4 zero and one mapping.  map01 is either None, or
    # the character to map the digit 1 (one) to.  It should be either
    # L (el) or I (eye).
    if map01 is not None:
        map01 = _bytes_from_decode_data(map01)
        # Validate explicitly instead of with ``assert`` so that the check
        # is still performed when Python runs with -O.
        if len(map01) != 1:
            raise ValueError("map01 must be of length 1, not %r" % (map01,))
        s = s.translate(bytes.maketrans(b'01', b'O' + map01))
    if casefold:
        s = s.upper()
    # Strip off pad characters from the right.  We need to count the pad
    # characters because this will tell us how many null bytes to remove
    # from the end of the decoded string.
    padded_len = len(s)
    s = s.rstrip(b'=')
    padchars = padded_len - len(s)
    # Only these pad counts can be produced by an encoder.  Rejecting the
    # others up front also guarantees that, whenever padchars is non-zero,
    # at least one quantum is decoded below (so ``acc`` is bound) and that
    # shifting ``acc`` cannot overflow 40 bits.
    if padchars not in (0, 1, 3, 4, 6):
        raise binascii.Error('Incorrect padding')
    # Now decode the full quanta
    decoded = bytearray()
    b32rev = _b32rev
    for i in range(0, len(s), 8):
        quanta = s[i: i + 8]
        acc = 0
        try:
            for c in quanta:
                acc = (acc << 5) + b32rev[c]
        except KeyError:
            raise binascii.Error('Non-base32 digit found') from None
        decoded += acc.to_bytes(5, 'big')
    # Process the last, partial quanta
    if padchars:
        # The final quantum was accumulated from fewer than 8 characters;
        # shift it into place and keep only the bytes that carry data.
        acc <<= 5 * padchars
        last = acc.to_bytes(5, 'big')
        data_bytes = {1: 4, 3: 3, 4: 2, 6: 1}[padchars]
        decoded[-5:] = last[:data_bytes]
    return bytes(decoded)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000242
243
Antoine Pitroufd036452008-08-19 17:56:33 +0000244
Barry Warsaw4c904d12004-01-04 01:12:26 +0000245# RFC 3548, Base 16 Alphabet specifies uppercase, but hexlify() returns
246# lowercase. The RFC also recommends against accepting input case
247# insensitively.
def b16encode(s):
    """Encode a bytes-like object using Base16.

    s is the data to encode; any object supporting the buffer protocol
    is accepted.  The encoded data is returned as a bytes object using
    the uppercase hexadecimal alphabet.

    Raises TypeError if s is not a bytes-like object (for example a str).
    """
    # hexlify() itself rejects non bytes-like arguments with a TypeError,
    # and returns lowercase digits, hence the upper().
    return binascii.hexlify(s).upper()
Barry Warsaw4c904d12004-01-04 01:12:26 +0000256
257
def b16decode(s, casefold=False):
    """Decode a Base16 encoded byte string.

    s is the byte string (or ASCII string) to decode.  When the optional
    casefold flag is true, lowercase hexadecimal digits are accepted as
    well; for security purposes it defaults to False.

    The decoded byte string is returned.  binascii.Error is raised if s
    contains characters outside the Base16 alphabet or cannot be
    converted by binascii.unhexlify().
    """
    data = _bytes_from_decode_data(s)
    if casefold:
        data = data.upper()
    bad_digit = re.search(b'[^0-9A-F]', data)
    if bad_digit is not None:
        raise binascii.Error('Non-base16 digit found')
    return binascii.unhexlify(data)
275
276
Antoine Pitroufd036452008-08-19 17:56:33 +0000277
Barry Warsaw4c904d12004-01-04 01:12:26 +0000278# Legacy interface. This code could be cleaned up since I don't believe
279# binascii has any line length limitations. It just doesn't seem worth it
Guido van Rossum4581ae52007-05-22 21:56:47 +0000280# though. The files should be opened in binary mode.
Skip Montanaroe99d5ea2001-01-20 19:54:20 +0000281
MAXLINESIZE = 76  # Excluding the CRLF
MAXBINSIZE = (MAXLINESIZE//4)*3  # Input bytes that fit on one output line


def encode(input, output):
    """Encode a file; input and output are binary files.

    The input is consumed in chunks of MAXBINSIZE bytes and every chunk
    is written to output as one newline-terminated line of Base64 data.
    """
    chunk = input.read(MAXBINSIZE)
    while chunk:
        # A read may return fewer bytes than requested; keep reading until
        # the chunk is full or the input is exhausted.
        while len(chunk) < MAXBINSIZE:
            more = input.read(MAXBINSIZE - len(chunk))
            if not more:
                break
            chunk += more
        output.write(binascii.b2a_base64(chunk))
        chunk = input.read(MAXBINSIZE)
Guido van Rossumf1945461995-06-14 23:43:44 +0000298
Barry Warsaw4c904d12004-01-04 01:12:26 +0000299
def decode(input, output):
    """Decode a file; input and output are binary files.

    The input is read line by line; each line is Base64-decoded and the
    resulting bytes are written to output.
    """
    line = input.readline()
    while line:
        output.write(binascii.a2b_base64(line))
        line = input.readline()
Guido van Rossumf1945461995-06-14 23:43:44 +0000308
Barry Warsaw4c904d12004-01-04 01:12:26 +0000309
def encodebytes(s):
    """Encode a bytestring into a bytestring containing multiple lines
    of base-64 data.

    The input is split into chunks of MAXBINSIZE bytes; each chunk is
    encoded as one newline-terminated line.  TypeError is raised if s is
    not a bytes or bytearray object.
    """
    if not isinstance(s, bytes_types):
        raise TypeError("expected bytes, not %s" % s.__class__.__name__)
    return b"".join(
        binascii.b2a_base64(s[start:start + MAXBINSIZE])
        for start in range(0, len(s), MAXBINSIZE)
    )
Guido van Rossumf1945461995-06-14 23:43:44 +0000320
def encodestring(s):
    """Legacy alias of encodebytes().

    Emits a DeprecationWarning attributed to the caller and then
    delegates to encodebytes().
    """
    import warnings
    message = "encodestring() is a deprecated alias, use encodebytes()"
    warnings.warn(message, category=DeprecationWarning, stacklevel=2)
    return encodebytes(s)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000327
Guido van Rossum54a40cb2007-08-27 22:27:41 +0000328
def decodebytes(s):
    """Decode a bytestring of base-64 data into a bytestring.

    TypeError is raised if s is not a bytes or bytearray object.
    """
    if isinstance(s, bytes_types):
        return binascii.a2b_base64(s)
    raise TypeError("expected bytes, not %s" % s.__class__.__name__)
Guido van Rossumf1945461995-06-14 23:43:44 +0000334
def decodestring(s):
    """Legacy alias of decodebytes().

    Emits a DeprecationWarning attributed to the caller and then
    delegates to decodebytes().
    """
    import warnings
    message = "decodestring() is a deprecated alias, use decodebytes()"
    warnings.warn(message, category=DeprecationWarning, stacklevel=2)
    return decodebytes(s)
Barry Warsaw4c904d12004-01-04 01:12:26 +0000341
Antoine Pitroufd036452008-08-19 17:56:33 +0000342
Guido van Rossum4581ae52007-05-22 21:56:47 +0000343# Usable as a script...
def main():
    """Small main program.

    Parses the command line in sys.argv: -e encodes (the default), -d or
    -u decodes, and -t runs the built-in self test and returns.  Data is
    read from the file named by the first positional argument, or from
    standard input when that argument is missing or '-', and the result
    is written to standard output (both in binary mode).

    On an invalid option a usage message is printed to standard error and
    the program exits with status 2.
    """
    import sys
    import getopt
    try:
        opts, args = getopt.getopt(sys.argv[1:], 'deut')
    except getopt.error as msg:
        # Write to stderr directly instead of rebinding sys.stdout, which
        # would leave the redirection in place for any caller that catches
        # the SystemExit raised below.
        print(msg, file=sys.stderr)
        print("""usage: %s [-d|-e|-u|-t] [file|-]
        -d, -u: decode
        -e: encode (default)
        -t: encode and decode string 'Aladdin:open sesame'""" % sys.argv[0],
              file=sys.stderr)
        sys.exit(2)
    actions = {'-e': encode, '-d': decode, '-u': decode}
    func = encode
    for opt, _ in opts:
        if opt == '-t':
            test()
            return
        # When several options are given the last one wins.
        func = actions.get(opt, func)
    if args and args[0] != '-':
        with open(args[0], 'rb') as f:
            func(f, sys.stdout.buffer)
    else:
        func(sys.stdin.buffer, sys.stdout.buffer)
Guido van Rossumf1945461995-06-14 23:43:44 +0000368
Barry Warsaw4c904d12004-01-04 01:12:26 +0000369
def test():
    """Round-trip a sample string through encodebytes()/decodebytes().

    Prints the repr of the original, encoded and decoded values and
    asserts that decoding restores the original.
    """
    original = b"Aladdin:open sesame"
    print(repr(original))
    encoded = encodebytes(original)
    print(repr(encoded))
    decoded = decodebytes(encoded)
    print(repr(decoded))
    assert original == decoded
Guido van Rossumf1945461995-06-14 23:43:44 +0000378
Barry Warsaw4c904d12004-01-04 01:12:26 +0000379
# Run the command-line interface only when executed as a script, not when
# the module is imported.
if __name__ == '__main__':
    main()