blob: 9b9cd7f011153cc4b02d199ffa69a65675208ca9 [file] [log] [blame]
/*
** Routines to represent binary data in ASCII and vice-versa
**
** This module currently supports the following encodings:
** uuencode:
**      each line encodes 45 bytes (except possibly the last)
**      First char encodes (binary) length, rest data
**      each char encodes 6 bits, as follows:
**      binary: 01234567 abcdefgh ijklmnop
**      ascii:  012345 67abcd efghij klmnop
**      ASCII encoding method is "excess-space": 000000 is encoded as ' ', etc.
**      short binary data is zero-extended (so the bits are always in the
**      right place), this does *not* reflect in the length.
** base64:
**      Line breaks are insignificant, but lines are at most 76 chars
**      each char encodes 6 bits, in similar order as uucode/hqx. Encoding
**      is done via a table.
**      Short binary data is filled (in ASCII) with '='.
** hqx:
**      File starts with introductory text, real data starts and ends
**      with colons.
**      Data consists of three similar parts: info, datafork, resourcefork.
**      Each part is protected (at the end) with a 16-bit crc
**      The binary data is run-length encoded, and then ascii-fied:
**      binary: 01234567 abcdefgh ijklmnop
**      ascii:  012345 67abcd efghij klmnop
**      ASCII encoding is table-driven, see the code.
**      Short binary data results in the runt ascii-byte being output with
**      the bits in the right place.
**
** While I was reading dozens of programs that encode or decode the formats
** here (documentation? hihi:-) I have formulated Jansen's Observation:
**
**      Programs that encode binary data in ASCII are written in
**      such a style that they are as unreadable as possible. Devices used
**      include unnecessary global variables, burying important tables
**      in unrelated sourcefiles, putting functions in include files,
**      using seemingly-descriptive variable names for different purposes,
**      calls to empty subroutines and a host of others.
**
** I have attempted to break with this tradition, but I guess that that
** does make the performance sub-optimal. Oh well, too bad...
**
** Jack Jansen, CWI, July 1995.
**
** Added support for quoted-printable encoding, based on rfc 1521 et al
** quoted-printable encoding specifies that non printable characters (anything
** below 32 and above 126) be encoded as =XX where XX is the hexadecimal value
** of the character.  It also specifies some other behavior to enable 8bit data
** in a mail message with little difficulty (maximum line sizes, protecting
** some cases of whitespace, etc).
**
** Brandon Long, September 2001.
*/
55
Thomas Wouters9c544482006-03-01 21:59:44 +000056#define PY_SSIZE_T_CLEAN
Jack Jansen72781191995-08-07 14:34:15 +000057
58#include "Python.h"
Gregory P. Smith9c6b9162015-04-26 00:42:13 +000059#include "pystrhex.h"
Christian Heimes1dc54002008-03-24 02:19:29 +000060#ifdef USE_ZLIB_CRC32
61#include "zlib.h"
62#endif
Jack Jansen72781191995-08-07 14:34:15 +000063
64static PyObject *Error;
65static PyObject *Incomplete;
66
/*
** hqx lookup table, ascii->binary.
**
** Indexed by the raw input byte.  Each entry is either the 6-bit value
** (0x00-0x3F) that the character stands for, or one of the markers below.
*/

/* Run-length marker byte of the binhex RLE scheme (not used by the table). */
#define RUNCHAR 0x90

/* Marker values stored in table_a2b_hqx; all lie above the 6-bit range. */
#define DONE 0x7F   /* ':' -- terminates the data */
#define SKIP 0x7E   /* '\n' and '\r' -- silently ignored */
#define FAIL 0x7D   /* any other byte that is not part of the alphabet */

static const unsigned char table_a2b_hqx[256] = {
/*       ^@    ^A    ^B    ^C    ^D    ^E    ^F    ^G   */
/* 0*/  FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
/*       \b    \t    \n    ^K    ^L    \r    ^N    ^O   */
/* 1*/  FAIL, FAIL, SKIP, FAIL, FAIL, SKIP, FAIL, FAIL,
/*       ^P    ^Q    ^R    ^S    ^T    ^U    ^V    ^W   */
/* 2*/  FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
/*       ^X    ^Y    ^Z    ^[    ^\    ^]    ^^    ^_   */
/* 3*/  FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
/*              !     "     #     $     %     &     '   */
/* 4*/  FAIL, 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06,
/*        (     )     *     +     ,     -     .     /   */
/* 5*/  0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, FAIL, FAIL,
/*        0     1     2     3     4     5     6     7   */
/* 6*/  0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12, 0x13, FAIL,
/*        8     9     :     ;     <     =     >     ?   */
/* 7*/  0x14, 0x15, DONE, FAIL, FAIL, FAIL, FAIL, FAIL,
/*        @     A     B     C     D     E     F     G   */
/* 8*/  0x16, 0x17, 0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D,
/*        H     I     J     K     L     M     N     O   */
/* 9*/  0x1E, 0x1F, 0x20, 0x21, 0x22, 0x23, 0x24, FAIL,
/*        P     Q     R     S     T     U     V     W   */
/*10*/  0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x2B, FAIL,
/*        X     Y     Z     [     \     ]     ^     _   */
/*11*/  0x2C, 0x2D, 0x2E, 0x2F, FAIL, FAIL, FAIL, FAIL,
/*        `     a     b     c     d     e     f     g   */
/*12*/  0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, FAIL,
/*        h     i     j     k     l     m     n     o   */
/*13*/  0x37, 0x38, 0x39, 0x3A, 0x3B, 0x3C, FAIL, FAIL,
/*        p     q     r     s     t     u     v     w   */
/*14*/  0x3D, 0x3E, 0x3F, FAIL, FAIL, FAIL, FAIL, FAIL,
/*        x     y     z     {     |     }     ~    ^?   */
/*15*/  FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
/* Bytes 0x80-0xFF are never part of the alphabet. */
/*16*/  FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
        FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
};
127
/* hqx alphabet, binary->ascii: entry i is the character that encodes the
   6-bit value i.  64 characters plus the string literal's terminating NUL. */
static const unsigned char table_b2a_hqx[] =
"!\"#$%&'()*+,-012345689@ABCDEFGHIJKLMNPQRSTUVXYZ[`abcdefhijklmpqr";
Jack Jansen72781191995-08-07 14:34:15 +0000130
/* base64 lookup table, ascii->binary, for the 7-bit ASCII range only.
   Entry c is the 6-bit value encoded by character c, or -1 when c is not
   part of the base64 alphabet.  Users store the entry in an unsigned char
   and compare against (unsigned char)-1, so the test does not depend on
   whether plain char is signed.  The bound is explicit because callers
   index with values in 0..0x7f. */
static const char table_a2b_base64[128] = {
    -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
    -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
    -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,62, -1,-1,-1,63,
    52,53,54,55, 56,57,58,59, 60,61,-1,-1, -1, 0,-1,-1, /* Note PAD->0 */
    -1, 0, 1, 2,  3, 4, 5, 6,  7, 8, 9,10, 11,12,13,14,
    15,16,17,18, 19,20,21,22, 23,24,25,-1, -1,-1,-1,-1,
    -1,26,27,28, 29,30,31,32, 33,34,35,36, 37,38,39,40,
    41,42,43,44, 45,46,47,48, 49,50,51,-1, -1,-1,-1,-1
};
141
/* Character used to pad the final base64 quad. */
#define BASE64_PAD '='

/* Max binary chunk size; limited only by available memory.
   The encoder sizes its output as 2*len + 2 (+1 for the newline), so this
   bound keeps that computation within PY_SSIZE_T_MAX. */
#define BASE64_MAXBIN ((PY_SSIZE_T_MAX - 3) / 2)

/* base64 alphabet, binary->ascii: entry i is the character that encodes the
   6-bit value i.  64 characters plus the string literal's terminating NUL. */
static const unsigned char table_b2a_base64[] =
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000149
150
151
/* Byte-at-a-time lookup table for the 16-bit hqx CRC.
   Entry i is the result of pushing the value (i << 8) through eight
   MSB-first shift/XOR steps with polynomial 0x1021. */
static const unsigned short crctab_hqx[256] = {
    0x0000, 0x1021, 0x2042, 0x3063, 0x4084, 0x50a5, 0x60c6, 0x70e7,
    0x8108, 0x9129, 0xa14a, 0xb16b, 0xc18c, 0xd1ad, 0xe1ce, 0xf1ef,
    0x1231, 0x0210, 0x3273, 0x2252, 0x52b5, 0x4294, 0x72f7, 0x62d6,
    0x9339, 0x8318, 0xb37b, 0xa35a, 0xd3bd, 0xc39c, 0xf3ff, 0xe3de,
    0x2462, 0x3443, 0x0420, 0x1401, 0x64e6, 0x74c7, 0x44a4, 0x5485,
    0xa56a, 0xb54b, 0x8528, 0x9509, 0xe5ee, 0xf5cf, 0xc5ac, 0xd58d,
    0x3653, 0x2672, 0x1611, 0x0630, 0x76d7, 0x66f6, 0x5695, 0x46b4,
    0xb75b, 0xa77a, 0x9719, 0x8738, 0xf7df, 0xe7fe, 0xd79d, 0xc7bc,
    0x48c4, 0x58e5, 0x6886, 0x78a7, 0x0840, 0x1861, 0x2802, 0x3823,
    0xc9cc, 0xd9ed, 0xe98e, 0xf9af, 0x8948, 0x9969, 0xa90a, 0xb92b,
    0x5af5, 0x4ad4, 0x7ab7, 0x6a96, 0x1a71, 0x0a50, 0x3a33, 0x2a12,
    0xdbfd, 0xcbdc, 0xfbbf, 0xeb9e, 0x9b79, 0x8b58, 0xbb3b, 0xab1a,
    0x6ca6, 0x7c87, 0x4ce4, 0x5cc5, 0x2c22, 0x3c03, 0x0c60, 0x1c41,
    0xedae, 0xfd8f, 0xcdec, 0xddcd, 0xad2a, 0xbd0b, 0x8d68, 0x9d49,
    0x7e97, 0x6eb6, 0x5ed5, 0x4ef4, 0x3e13, 0x2e32, 0x1e51, 0x0e70,
    0xff9f, 0xefbe, 0xdfdd, 0xcffc, 0xbf1b, 0xaf3a, 0x9f59, 0x8f78,
    0x9188, 0x81a9, 0xb1ca, 0xa1eb, 0xd10c, 0xc12d, 0xf14e, 0xe16f,
    0x1080, 0x00a1, 0x30c2, 0x20e3, 0x5004, 0x4025, 0x7046, 0x6067,
    0x83b9, 0x9398, 0xa3fb, 0xb3da, 0xc33d, 0xd31c, 0xe37f, 0xf35e,
    0x02b1, 0x1290, 0x22f3, 0x32d2, 0x4235, 0x5214, 0x6277, 0x7256,
    0xb5ea, 0xa5cb, 0x95a8, 0x8589, 0xf56e, 0xe54f, 0xd52c, 0xc50d,
    0x34e2, 0x24c3, 0x14a0, 0x0481, 0x7466, 0x6447, 0x5424, 0x4405,
    0xa7db, 0xb7fa, 0x8799, 0x97b8, 0xe75f, 0xf77e, 0xc71d, 0xd73c,
    0x26d3, 0x36f2, 0x0691, 0x16b0, 0x6657, 0x7676, 0x4615, 0x5634,
    0xd94c, 0xc96d, 0xf90e, 0xe92f, 0x99c8, 0x89e9, 0xb98a, 0xa9ab,
    0x5844, 0x4865, 0x7806, 0x6827, 0x18c0, 0x08e1, 0x3882, 0x28a3,
    0xcb7d, 0xdb5c, 0xeb3f, 0xfb1e, 0x8bf9, 0x9bd8, 0xabbb, 0xbb9a,
    0x4a75, 0x5a54, 0x6a37, 0x7a16, 0x0af1, 0x1ad0, 0x2ab3, 0x3a92,
    0xfd2e, 0xed0f, 0xdd6c, 0xcd4d, 0xbdaa, 0xad8b, 0x9de8, 0x8dc9,
    0x7c26, 0x6c07, 0x5c64, 0x4c45, 0x3ca2, 0x2c83, 0x1ce0, 0x0cc1,
    0xef1f, 0xff3e, 0xcf5d, 0xdf7c, 0xaf9b, 0xbfba, 0x8fd9, 0x9ff8,
    0x6e17, 0x7e36, 0x4e55, 0x5e74, 0x2e93, 0x3eb2, 0x0ed1, 0x1ef0,
};
186
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200187/*[clinic input]
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200188module binascii
189[clinic start generated code]*/
Serhiy Storchaka1009bf12015-04-03 23:53:51 +0300190/*[clinic end generated code: output=da39a3ee5e6b4b0d input=de89fb46bcaf3fec]*/
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200191
192/*[python input]
193
194class ascii_buffer_converter(CConverter):
195 type = 'Py_buffer'
196 converter = 'ascii_buffer_converter'
197 impl_by_reference = True
Benjamin Petersonb62deac2014-01-26 10:41:58 -0500198 c_default = "{NULL, NULL}"
199
200 def cleanup(self):
201 name = self.name
202 return "".join(["if (", name, ".obj)\n PyBuffer_Release(&", name, ");\n"])
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200203
204[python start generated code]*/
Larry Hastings581ee362014-01-28 05:00:08 -0800205/*[python end generated code: output=da39a3ee5e6b4b0d input=3eb7b63610da92cd]*/
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200206
Antoine Pitrou08316762011-12-20 13:58:41 +0100207static int
208ascii_buffer_converter(PyObject *arg, Py_buffer *buf)
209{
210 if (arg == NULL) {
211 PyBuffer_Release(buf);
212 return 1;
213 }
214 if (PyUnicode_Check(arg)) {
215 if (PyUnicode_READY(arg) < 0)
216 return 0;
217 if (!PyUnicode_IS_ASCII(arg)) {
218 PyErr_SetString(PyExc_ValueError,
219 "string argument should contain only ASCII characters");
220 return 0;
221 }
222 assert(PyUnicode_KIND(arg) == PyUnicode_1BYTE_KIND);
223 buf->buf = (void *) PyUnicode_1BYTE_DATA(arg);
224 buf->len = PyUnicode_GET_LENGTH(arg);
225 buf->obj = NULL;
226 return 1;
227 }
228 if (PyObject_GetBuffer(arg, buf, PyBUF_SIMPLE) != 0) {
229 PyErr_Format(PyExc_TypeError,
230 "argument should be bytes, buffer or ASCII string, "
Berker Peksag3cd30c22015-02-15 00:31:00 +0200231 "not '%.100s'", Py_TYPE(arg)->tp_name);
Antoine Pitrou08316762011-12-20 13:58:41 +0100232 return 0;
233 }
234 if (!PyBuffer_IsContiguous(buf, 'C')) {
235 PyErr_Format(PyExc_TypeError,
236 "argument should be a contiguous buffer, "
Berker Peksag3cd30c22015-02-15 00:31:00 +0200237 "not '%.100s'", Py_TYPE(arg)->tp_name);
Antoine Pitrou08316762011-12-20 13:58:41 +0100238 PyBuffer_Release(buf);
239 return 0;
240 }
241 return Py_CLEANUP_SUPPORTED;
242}
243
Larry Hastingsf256c222014-01-25 21:30:37 -0800244#include "clinic/binascii.c.h"
Antoine Pitrou08316762011-12-20 13:58:41 +0100245
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200246/*[clinic input]
247binascii.a2b_uu
248
Serhiy Storchaka12785612014-01-25 11:49:49 +0200249 data: ascii_buffer
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200250 /
251
252Decode a line of uuencoded data.
253[clinic start generated code]*/
Jack Jansen72781191995-08-07 14:34:15 +0000254
255static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300256binascii_a2b_uu_impl(PyObject *module, Py_buffer *data)
257/*[clinic end generated code: output=e027f8e0b0598742 input=7cafeaf73df63d1c]*/
Jack Jansen72781191995-08-07 14:34:15 +0000258{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200259 const unsigned char *ascii_data;
260 unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000261 int leftbits = 0;
262 unsigned char this_ch;
263 unsigned int leftchar = 0;
264 PyObject *rv;
265 Py_ssize_t ascii_len, bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000266
Serhiy Storchaka12785612014-01-25 11:49:49 +0200267 ascii_data = data->buf;
268 ascii_len = data->len;
Jack Jansen72781191995-08-07 14:34:15 +0000269
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000270 assert(ascii_len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000271
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000272 /* First byte: binary data length (in bytes) */
273 bin_len = (*ascii_data++ - ' ') & 077;
274 ascii_len--;
Jack Jansen72781191995-08-07 14:34:15 +0000275
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000276 /* Allocate the buffer */
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200277 if ( (rv=PyBytes_FromStringAndSize(NULL, bin_len)) == NULL )
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000278 return NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000279 bin_data = (unsigned char *)PyBytes_AS_STRING(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000280
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000281 for( ; bin_len > 0 ; ascii_len--, ascii_data++ ) {
282 /* XXX is it really best to add NULs if there's no more data */
283 this_ch = (ascii_len > 0) ? *ascii_data : 0;
284 if ( this_ch == '\n' || this_ch == '\r' || ascii_len <= 0) {
285 /*
286 ** Whitespace. Assume some spaces got eaten at
287 ** end-of-line. (We check this later)
288 */
289 this_ch = 0;
290 } else {
291 /* Check the character for legality
292 ** The 64 in stead of the expected 63 is because
293 ** there are a few uuencodes out there that use
294 ** '`' as zero instead of space.
295 */
296 if ( this_ch < ' ' || this_ch > (' ' + 64)) {
297 PyErr_SetString(Error, "Illegal char");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000298 Py_DECREF(rv);
299 return NULL;
300 }
301 this_ch = (this_ch - ' ') & 077;
302 }
303 /*
304 ** Shift it in on the low end, and see if there's
305 ** a byte ready for output.
306 */
307 leftchar = (leftchar << 6) | (this_ch);
308 leftbits += 6;
309 if ( leftbits >= 8 ) {
310 leftbits -= 8;
311 *bin_data++ = (leftchar >> leftbits) & 0xff;
312 leftchar &= ((1 << leftbits) - 1);
313 bin_len--;
314 }
315 }
316 /*
317 ** Finally, check that if there's anything left on the line
318 ** that it's whitespace only.
319 */
320 while( ascii_len-- > 0 ) {
321 this_ch = *ascii_data++;
322 /* Extra '`' may be written as padding in some cases */
323 if ( this_ch != ' ' && this_ch != ' '+64 &&
324 this_ch != '\n' && this_ch != '\r' ) {
325 PyErr_SetString(Error, "Trailing garbage");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000326 Py_DECREF(rv);
327 return NULL;
328 }
329 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000330 return rv;
Jack Jansen72781191995-08-07 14:34:15 +0000331}
332
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200333/*[clinic input]
334binascii.b2a_uu
335
336 data: Py_buffer
337 /
338
339Uuencode line of data.
340[clinic start generated code]*/
Tim Peters934c1a12002-07-02 22:24:50 +0000341
Jack Jansen72781191995-08-07 14:34:15 +0000342static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300343binascii_b2a_uu_impl(PyObject *module, Py_buffer *data)
344/*[clinic end generated code: output=0070670e52e4aa6b input=00fdf458ce8b465b]*/
Jack Jansen72781191995-08-07 14:34:15 +0000345{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200346 unsigned char *ascii_data;
347 const unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000348 int leftbits = 0;
349 unsigned char this_ch;
350 unsigned int leftchar = 0;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200351 Py_ssize_t bin_len, out_len;
352 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000353
Victor Stinnereaaaf132015-10-13 10:51:47 +0200354 _PyBytesWriter_Init(&writer);
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200355 bin_data = data->buf;
356 bin_len = data->len;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000357 if ( bin_len > 45 ) {
358 /* The 45 is a limit that appears in all uuencode's */
359 PyErr_SetString(Error, "At most 45 bytes at once");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000360 return NULL;
361 }
Jack Jansen72781191995-08-07 14:34:15 +0000362
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000363 /* We're lazy and allocate to much (fixed up later) */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200364 out_len = 2 + (bin_len + 2) / 3 * 4;
365 ascii_data = _PyBytesWriter_Alloc(&writer, out_len);
366 if (ascii_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000367 return NULL;
Jack Jansen72781191995-08-07 14:34:15 +0000368
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000369 /* Store the length */
370 *ascii_data++ = ' ' + (bin_len & 077);
Tim Peters934c1a12002-07-02 22:24:50 +0000371
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000372 for( ; bin_len > 0 || leftbits != 0 ; bin_len--, bin_data++ ) {
373 /* Shift the data (or padding) into our buffer */
374 if ( bin_len > 0 ) /* Data */
375 leftchar = (leftchar << 8) | *bin_data;
376 else /* Padding */
377 leftchar <<= 8;
378 leftbits += 8;
Jack Jansen72781191995-08-07 14:34:15 +0000379
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000380 /* See if there are 6-bit groups ready */
381 while ( leftbits >= 6 ) {
382 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
383 leftbits -= 6;
384 *ascii_data++ = this_ch + ' ';
385 }
386 }
387 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000388
Victor Stinnereaaaf132015-10-13 10:51:47 +0200389 return _PyBytesWriter_Finish(&writer, ascii_data);
Jack Jansen72781191995-08-07 14:34:15 +0000390}
391
Guido van Rossum2db4f471999-10-19 19:05:14 +0000392
393static int
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200394binascii_find_valid(const unsigned char *s, Py_ssize_t slen, int num)
Guido van Rossum2db4f471999-10-19 19:05:14 +0000395{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000396 /* Finds & returns the (num+1)th
397 ** valid character for base64, or -1 if none.
398 */
Guido van Rossum2db4f471999-10-19 19:05:14 +0000399
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000400 int ret = -1;
401 unsigned char c, b64val;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000402
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000403 while ((slen > 0) && (ret == -1)) {
404 c = *s;
405 b64val = table_a2b_base64[c & 0x7f];
406 if ( ((c <= 0x7f) && (b64val != (unsigned char)-1)) ) {
407 if (num == 0)
408 ret = *s;
409 num--;
410 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000411
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000412 s++;
413 slen--;
414 }
415 return ret;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000416}
417
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200418/*[clinic input]
419binascii.a2b_base64
420
Serhiy Storchaka12785612014-01-25 11:49:49 +0200421 data: ascii_buffer
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200422 /
423
424Decode a line of base64 data.
425[clinic start generated code]*/
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000426
427static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300428binascii_a2b_base64_impl(PyObject *module, Py_buffer *data)
429/*[clinic end generated code: output=0628223f19fd3f9b input=5872acf6e1cac243]*/
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000430{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200431 const unsigned char *ascii_data;
432 unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000433 int leftbits = 0;
434 unsigned char this_ch;
435 unsigned int leftchar = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000436 Py_ssize_t ascii_len, bin_len;
437 int quad_pos = 0;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200438 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000439
Serhiy Storchaka12785612014-01-25 11:49:49 +0200440 ascii_data = data->buf;
441 ascii_len = data->len;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000442
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000443 assert(ascii_len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000444
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200445 if (ascii_len > PY_SSIZE_T_MAX - 3)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000446 return PyErr_NoMemory();
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000447
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000448 bin_len = ((ascii_len+3)/4)*3; /* Upper bound, corrected later */
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000449
Victor Stinnereaaaf132015-10-13 10:51:47 +0200450 _PyBytesWriter_Init(&writer);
451
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000452 /* Allocate the buffer */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200453 bin_data = _PyBytesWriter_Alloc(&writer, bin_len);
454 if (bin_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000455 return NULL;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000456
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000457 for( ; ascii_len > 0; ascii_len--, ascii_data++) {
458 this_ch = *ascii_data;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000459
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000460 if (this_ch > 0x7f ||
461 this_ch == '\r' || this_ch == '\n' || this_ch == ' ')
462 continue;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000463
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000464 /* Check for pad sequences and ignore
465 ** the invalid ones.
466 */
467 if (this_ch == BASE64_PAD) {
468 if ( (quad_pos < 2) ||
469 ((quad_pos == 2) &&
470 (binascii_find_valid(ascii_data, ascii_len, 1)
471 != BASE64_PAD)) )
472 {
473 continue;
474 }
475 else {
476 /* A pad sequence means no more input.
477 ** We've already interpreted the data
478 ** from the quad at this point.
479 */
480 leftbits = 0;
481 break;
482 }
483 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000484
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000485 this_ch = table_a2b_base64[*ascii_data];
486 if ( this_ch == (unsigned char) -1 )
487 continue;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000488
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000489 /*
490 ** Shift it in on the low end, and see if there's
491 ** a byte ready for output.
492 */
493 quad_pos = (quad_pos + 1) & 0x03;
494 leftchar = (leftchar << 6) | (this_ch);
495 leftbits += 6;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000496
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000497 if ( leftbits >= 8 ) {
498 leftbits -= 8;
499 *bin_data++ = (leftchar >> leftbits) & 0xff;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000500 leftchar &= ((1 << leftbits) - 1);
501 }
502 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000503
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000504 if (leftbits != 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000505 PyErr_SetString(Error, "Incorrect padding");
Victor Stinnereaaaf132015-10-13 10:51:47 +0200506 _PyBytesWriter_Dealloc(&writer);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000507 return NULL;
508 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000509
Victor Stinnereaaaf132015-10-13 10:51:47 +0200510 return _PyBytesWriter_Finish(&writer, bin_data);
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000511}
512
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200513
514/*[clinic input]
515binascii.b2a_base64
516
517 data: Py_buffer
Victor Stinnere84c9762015-10-11 11:01:02 +0200518 *
519 newline: int(c_default="1") = True
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200520
521Base64-code line of data.
522[clinic start generated code]*/
Tim Peters934c1a12002-07-02 22:24:50 +0000523
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000524static PyObject *
Serhiy Storchaka2954f832016-07-07 18:20:03 +0300525binascii_b2a_base64_impl(PyObject *module, Py_buffer *data, int newline)
526/*[clinic end generated code: output=4ad62c8e8485d3b3 input=7b2ea6fa38d8924c]*/
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000527{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200528 unsigned char *ascii_data;
529 const unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000530 int leftbits = 0;
531 unsigned char this_ch;
532 unsigned int leftchar = 0;
Victor Stinnere84c9762015-10-11 11:01:02 +0200533 Py_ssize_t bin_len, out_len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200534 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000535
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200536 bin_data = data->buf;
537 bin_len = data->len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200538 _PyBytesWriter_Init(&writer);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000539
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000540 assert(bin_len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000541
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000542 if ( bin_len > BASE64_MAXBIN ) {
543 PyErr_SetString(Error, "Too much data for base64 line");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000544 return NULL;
545 }
Tim Peters934c1a12002-07-02 22:24:50 +0000546
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000547 /* We're lazy and allocate too much (fixed up later).
Victor Stinnere84c9762015-10-11 11:01:02 +0200548 "+2" leaves room for up to two pad characters.
549 Note that 'b' gets encoded as 'Yg==\n' (1 in, 5 out). */
550 out_len = bin_len*2 + 2;
551 if (newline)
552 out_len++;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200553 ascii_data = _PyBytesWriter_Alloc(&writer, out_len);
554 if (ascii_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000555 return NULL;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000556
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000557 for( ; bin_len > 0 ; bin_len--, bin_data++ ) {
558 /* Shift the data into our buffer */
559 leftchar = (leftchar << 8) | *bin_data;
560 leftbits += 8;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000561
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000562 /* See if there are 6-bit groups ready */
563 while ( leftbits >= 6 ) {
564 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
565 leftbits -= 6;
566 *ascii_data++ = table_b2a_base64[this_ch];
567 }
568 }
569 if ( leftbits == 2 ) {
570 *ascii_data++ = table_b2a_base64[(leftchar&3) << 4];
571 *ascii_data++ = BASE64_PAD;
572 *ascii_data++ = BASE64_PAD;
573 } else if ( leftbits == 4 ) {
574 *ascii_data++ = table_b2a_base64[(leftchar&0xf) << 2];
575 *ascii_data++ = BASE64_PAD;
576 }
Victor Stinnere84c9762015-10-11 11:01:02 +0200577 if (newline)
578 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000579
Victor Stinnereaaaf132015-10-13 10:51:47 +0200580 return _PyBytesWriter_Finish(&writer, ascii_data);
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000581}
582
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200583/*[clinic input]
584binascii.a2b_hqx
585
Serhiy Storchaka12785612014-01-25 11:49:49 +0200586 data: ascii_buffer
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200587 /
588
589Decode .hqx coding.
590[clinic start generated code]*/
Jack Jansen72781191995-08-07 14:34:15 +0000591
592static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300593binascii_a2b_hqx_impl(PyObject *module, Py_buffer *data)
594/*[clinic end generated code: output=4d6d8c54d54ea1c1 input=0d914c680e0eed55]*/
Jack Jansen72781191995-08-07 14:34:15 +0000595{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200596 const unsigned char *ascii_data;
597 unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000598 int leftbits = 0;
599 unsigned char this_ch;
600 unsigned int leftchar = 0;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200601 PyObject *res;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000602 Py_ssize_t len;
603 int done = 0;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200604 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000605
Serhiy Storchaka12785612014-01-25 11:49:49 +0200606 ascii_data = data->buf;
607 len = data->len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200608 _PyBytesWriter_Init(&writer);
Jack Jansen72781191995-08-07 14:34:15 +0000609
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000610 assert(len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000611
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200612 if (len > PY_SSIZE_T_MAX - 2)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000613 return PyErr_NoMemory();
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000614
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000615 /* Allocate a string that is too big (fixed later)
616 Add two to the initial length to prevent interning which
617 would preclude subsequent resizing. */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200618 bin_data = _PyBytesWriter_Alloc(&writer, len + 2);
619 if (bin_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000620 return NULL;
Jack Jansen72781191995-08-07 14:34:15 +0000621
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000622 for( ; len > 0 ; len--, ascii_data++ ) {
623 /* Get the byte and look it up */
624 this_ch = table_a2b_hqx[*ascii_data];
625 if ( this_ch == SKIP )
626 continue;
627 if ( this_ch == FAIL ) {
628 PyErr_SetString(Error, "Illegal char");
Victor Stinnereaaaf132015-10-13 10:51:47 +0200629 _PyBytesWriter_Dealloc(&writer);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000630 return NULL;
631 }
632 if ( this_ch == DONE ) {
633 /* The terminating colon */
634 done = 1;
635 break;
636 }
Jack Jansen72781191995-08-07 14:34:15 +0000637
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000638 /* Shift it into the buffer and see if any bytes are ready */
639 leftchar = (leftchar << 6) | (this_ch);
640 leftbits += 6;
641 if ( leftbits >= 8 ) {
642 leftbits -= 8;
643 *bin_data++ = (leftchar >> leftbits) & 0xff;
644 leftchar &= ((1 << leftbits) - 1);
645 }
646 }
Tim Peters934c1a12002-07-02 22:24:50 +0000647
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000648 if ( leftbits && !done ) {
649 PyErr_SetString(Incomplete,
650 "String has incomplete number of bytes");
Victor Stinnereaaaf132015-10-13 10:51:47 +0200651 _PyBytesWriter_Dealloc(&writer);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000652 return NULL;
653 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000654
Victor Stinnereaaaf132015-10-13 10:51:47 +0200655 res = _PyBytesWriter_Finish(&writer, bin_data);
656 if (res == NULL)
657 return NULL;
658 return Py_BuildValue("Ni", res, done);
Jack Jansen72781191995-08-07 14:34:15 +0000659}
660
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200661
662/*[clinic input]
663binascii.rlecode_hqx
664
665 data: Py_buffer
666 /
667
668Binhex RLE-code binary data.
669[clinic start generated code]*/
Jack Jansen72781191995-08-07 14:34:15 +0000670
671static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300672binascii_rlecode_hqx_impl(PyObject *module, Py_buffer *data)
673/*[clinic end generated code: output=393d79338f5f5629 input=e1f1712447a82b09]*/
Jack Jansen72781191995-08-07 14:34:15 +0000674{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200675 const unsigned char *in_data;
676 unsigned char *out_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000677 unsigned char ch;
678 Py_ssize_t in, inend, len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200679 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000680
Victor Stinnereaaaf132015-10-13 10:51:47 +0200681 _PyBytesWriter_Init(&writer);
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200682 in_data = data->buf;
683 len = data->len;
Jack Jansen72781191995-08-07 14:34:15 +0000684
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000685 assert(len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000686
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200687 if (len > PY_SSIZE_T_MAX / 2 - 2)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000688 return PyErr_NoMemory();
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000689
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000690 /* Worst case: output is twice as big as input (fixed later) */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200691 out_data = _PyBytesWriter_Alloc(&writer, len * 2 + 2);
692 if (out_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000693 return NULL;
Tim Peters934c1a12002-07-02 22:24:50 +0000694
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000695 for( in=0; in<len; in++) {
696 ch = in_data[in];
697 if ( ch == RUNCHAR ) {
698 /* RUNCHAR. Escape it. */
699 *out_data++ = RUNCHAR;
700 *out_data++ = 0;
701 } else {
702 /* Check how many following are the same */
703 for(inend=in+1;
704 inend<len && in_data[inend] == ch &&
705 inend < in+255;
706 inend++) ;
707 if ( inend - in > 3 ) {
708 /* More than 3 in a row. Output RLE. */
709 *out_data++ = ch;
710 *out_data++ = RUNCHAR;
Antoine Pitrou40455752010-08-15 18:51:10 +0000711 *out_data++ = (unsigned char) (inend-in);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000712 in = inend-1;
713 } else {
714 /* Less than 3. Output the byte itself */
715 *out_data++ = ch;
716 }
717 }
718 }
Victor Stinnereaaaf132015-10-13 10:51:47 +0200719
720 return _PyBytesWriter_Finish(&writer, out_data);
Jack Jansen72781191995-08-07 14:34:15 +0000721}
722
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200723
724/*[clinic input]
725binascii.b2a_hqx
726
727 data: Py_buffer
728 /
729
730Encode .hqx data.
731[clinic start generated code]*/
Tim Peters934c1a12002-07-02 22:24:50 +0000732
Jack Jansen72781191995-08-07 14:34:15 +0000733static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300734binascii_b2a_hqx_impl(PyObject *module, Py_buffer *data)
735/*[clinic end generated code: output=d0aa5a704bc9f7de input=9596ebe019fe12ba]*/
Jack Jansen72781191995-08-07 14:34:15 +0000736{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200737 unsigned char *ascii_data;
738 const unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000739 int leftbits = 0;
740 unsigned char this_ch;
741 unsigned int leftchar = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000742 Py_ssize_t len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200743 _PyBytesWriter writer;
Tim Peters934c1a12002-07-02 22:24:50 +0000744
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200745 bin_data = data->buf;
746 len = data->len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200747 _PyBytesWriter_Init(&writer);
Jack Jansen72781191995-08-07 14:34:15 +0000748
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000749 assert(len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000750
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200751 if (len > PY_SSIZE_T_MAX / 2 - 2)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000752 return PyErr_NoMemory();
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000753
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000754 /* Allocate a buffer that is at least large enough */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200755 ascii_data = _PyBytesWriter_Alloc(&writer, len * 2 + 2);
756 if (ascii_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000757 return NULL;
Tim Peters934c1a12002-07-02 22:24:50 +0000758
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000759 for( ; len > 0 ; len--, bin_data++ ) {
760 /* Shift into our buffer, and output any 6bits ready */
761 leftchar = (leftchar << 8) | *bin_data;
762 leftbits += 8;
763 while ( leftbits >= 6 ) {
764 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
765 leftbits -= 6;
766 *ascii_data++ = table_b2a_hqx[this_ch];
767 }
768 }
769 /* Output a possible runt byte */
770 if ( leftbits ) {
771 leftchar <<= (6-leftbits);
772 *ascii_data++ = table_b2a_hqx[leftchar & 0x3f];
773 }
Victor Stinnereaaaf132015-10-13 10:51:47 +0200774
775 return _PyBytesWriter_Finish(&writer, ascii_data);
Jack Jansen72781191995-08-07 14:34:15 +0000776}
777
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200778
779/*[clinic input]
780binascii.rledecode_hqx
781
782 data: Py_buffer
783 /
784
785Decode hexbin RLE-coded string.
786[clinic start generated code]*/
Tim Peters934c1a12002-07-02 22:24:50 +0000787
Jack Jansen72781191995-08-07 14:34:15 +0000788static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300789binascii_rledecode_hqx_impl(PyObject *module, Py_buffer *data)
790/*[clinic end generated code: output=9826619565de1c6c input=54cdd49fc014402c]*/
Jack Jansen72781191995-08-07 14:34:15 +0000791{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200792 const unsigned char *in_data;
793 unsigned char *out_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000794 unsigned char in_byte, in_repeat;
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200795 Py_ssize_t in_len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200796 _PyBytesWriter writer;
Jack Jansen72781191995-08-07 14:34:15 +0000797
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200798 in_data = data->buf;
799 in_len = data->len;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200800 _PyBytesWriter_Init(&writer);
Jack Jansen72781191995-08-07 14:34:15 +0000801
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000802 assert(in_len >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +0000803
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000804 /* Empty string is a special case */
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200805 if ( in_len == 0 )
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000806 return PyBytes_FromStringAndSize("", 0);
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200807 else if (in_len > PY_SSIZE_T_MAX / 2)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000808 return PyErr_NoMemory();
Jack Jansen72781191995-08-07 14:34:15 +0000809
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000810 /* Allocate a buffer of reasonable size. Resized when needed */
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200811 out_data = _PyBytesWriter_Alloc(&writer, in_len);
Victor Stinnereaaaf132015-10-13 10:51:47 +0200812 if (out_data == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000813 return NULL;
Victor Stinnereaaaf132015-10-13 10:51:47 +0200814
815 /* Use overallocation */
816 writer.overallocate = 1;
Jack Jansen72781191995-08-07 14:34:15 +0000817
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000818 /*
819 ** We need two macros here to get/put bytes and handle
820 ** end-of-buffer for input and output strings.
821 */
Victor Stinnereaaaf132015-10-13 10:51:47 +0200822#define INBYTE(b) \
823 do { \
824 if ( --in_len < 0 ) { \
825 PyErr_SetString(Incomplete, ""); \
826 goto error; \
827 } \
828 b = *in_data++; \
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000829 } while(0)
Tim Peters934c1a12002-07-02 22:24:50 +0000830
Victor Stinnereaaaf132015-10-13 10:51:47 +0200831 /*
832 ** Handle first byte separately (since we have to get angry
833 ** in case of an orphaned RLE code).
834 */
835 INBYTE(in_byte);
Jack Jansen72781191995-08-07 14:34:15 +0000836
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000837 if (in_byte == RUNCHAR) {
838 INBYTE(in_repeat);
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200839 /* only 1 byte will be written, but 2 bytes were preallocated:
Raymond Hettinger15f44ab2016-08-30 10:47:49 -0700840 subtract 1 byte to prevent overallocation */
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200841 writer.min_size--;
842
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000843 if (in_repeat != 0) {
844 /* Note Error, not Incomplete (which is at the end
845 ** of the string only). This is a programmer error.
846 */
847 PyErr_SetString(Error, "Orphaned RLE code at start");
Victor Stinnereaaaf132015-10-13 10:51:47 +0200848 goto error;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000849 }
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200850 *out_data++ = RUNCHAR;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000851 } else {
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200852 *out_data++ = in_byte;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000853 }
Tim Peters934c1a12002-07-02 22:24:50 +0000854
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000855 while( in_len > 0 ) {
856 INBYTE(in_byte);
Jack Jansen72781191995-08-07 14:34:15 +0000857
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000858 if (in_byte == RUNCHAR) {
859 INBYTE(in_repeat);
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200860 /* only 1 byte will be written, but 2 bytes were preallocated:
Raymond Hettinger15f44ab2016-08-30 10:47:49 -0700861 subtract 1 byte to prevent overallocation */
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200862 writer.min_size--;
863
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000864 if ( in_repeat == 0 ) {
865 /* Just an escaped RUNCHAR value */
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200866 *out_data++ = RUNCHAR;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000867 } else {
868 /* Pick up value and output a sequence of it */
869 in_byte = out_data[-1];
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200870
871 /* enlarge the buffer if needed */
872 if (in_repeat > 1) {
873 /* -1 because we already preallocated 1 byte */
874 out_data = _PyBytesWriter_Prepare(&writer, out_data,
875 in_repeat - 1);
876 if (out_data == NULL)
877 goto error;
878 }
879
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000880 while ( --in_repeat > 0 )
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200881 *out_data++ = in_byte;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000882 }
883 } else {
884 /* Normal byte */
Victor Stinnerf9c9a3f2015-10-14 15:20:07 +0200885 *out_data++ = in_byte;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000886 }
887 }
Victor Stinnereaaaf132015-10-13 10:51:47 +0200888 return _PyBytesWriter_Finish(&writer, out_data);
889
890error:
891 _PyBytesWriter_Dealloc(&writer);
892 return NULL;
Jack Jansen72781191995-08-07 14:34:15 +0000893}
894
Jack Jansen72781191995-08-07 14:34:15 +0000895
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200896/*[clinic input]
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300897binascii.crc_hqx -> unsigned_int
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200898
899 data: Py_buffer
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300900 crc: unsigned_int(bitwise=True)
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200901 /
902
903Compute hqx CRC incrementally.
904[clinic start generated code]*/
905
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300906static unsigned int
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +0300907binascii_crc_hqx_impl(PyObject *module, Py_buffer *data, unsigned int crc)
908/*[clinic end generated code: output=8ec2a78590d19170 input=add8c53712ccceda]*/
Jack Jansen72781191995-08-07 14:34:15 +0000909{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200910 const unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000911 Py_ssize_t len;
Tim Peters934c1a12002-07-02 22:24:50 +0000912
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300913 crc &= 0xffff;
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200914 bin_data = data->buf;
915 len = data->len;
Jack Jansen72781191995-08-07 14:34:15 +0000916
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000917 while(len-- > 0) {
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300918 crc = ((crc<<8)&0xff00) ^ crctab_hqx[(crc>>8)^*bin_data++];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000919 }
Jack Jansen72781191995-08-07 14:34:15 +0000920
Serhiy Storchaka2ef7c472015-04-20 09:26:49 +0300921 return crc;
Jack Jansen72781191995-08-07 14:34:15 +0000922}
923
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +0200924#ifndef USE_ZLIB_CRC32
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000925/* Crc - 32 BIT ANSI X3.66 CRC checksum files
926 Also known as: ISO 3307
927**********************************************************************|
928* *|
929* Demonstration program to compute the 32-bit CRC used as the frame *|
930* check sequence in ADCCP (ANSI X3.66, also known as FIPS PUB 71 *|
931* and FED-STD-1003, the U.S. versions of CCITT's X.25 link-level *|
932* protocol). The 32-bit FCS was added via the Federal Register, *|
933* 1 June 1982, p.23798. I presume but don't know for certain that *|
934* this polynomial is or will be included in CCITT V.41, which *|
935* defines the 16-bit CRC (often called CRC-CCITT) polynomial. FIPS *|
936* PUB 78 says that the 32-bit FCS reduces otherwise undetected *|
937* errors by a factor of 10^-5 over 16-bit FCS. *|
938* *|
939**********************************************************************|
940
941 Copyright (C) 1986 Gary S. Brown. You may use this program, or
942 code or tables extracted from it, as desired without restriction.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000943
Tim Peters934c1a12002-07-02 22:24:50 +0000944 First, the polynomial itself and its table of feedback terms. The
945 polynomial is
946 X^32+X^26+X^23+X^22+X^16+X^12+X^11+X^10+X^8+X^7+X^5+X^4+X^2+X^1+X^0
947 Note that we take it "backwards" and put the highest-order term in
948 the lowest-order bit. The X^32 term is "implied"; the LSB is the
949 X^31 term, etc. The X^0 term (usually shown as "+1") results in
950 the MSB being 1.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000951
Tim Peters934c1a12002-07-02 22:24:50 +0000952 Note that the usual hardware shift register implementation, which
953 is what we're using (we're merely optimizing it by doing eight-bit
954 chunks at a time) shifts bits into the lowest-order term. In our
955 implementation, that means shifting towards the right. Why do we
956 do it this way? Because the calculated CRC must be transmitted in
957 order from highest-order term to lowest-order term. UARTs transmit
958 characters in order from LSB to MSB. By storing the CRC this way,
959 we hand it to the UART in the order low-byte to high-byte; the UART
    sends each low-bit to high-bit; and the result is transmission bit
961 by bit from highest- to lowest-order term without requiring any bit
962 shuffling on our part. Reception works similarly.
963
964 The feedback terms table consists of 256, 32-bit entries. Notes:
965
966 1. The table can be generated at runtime if desired; code to do so
967 is shown later. It might not be obvious, but the feedback
968 terms simply represent the results of eight shift/xor opera-
969 tions for all combinations of data and CRC register values.
970
971 2. The CRC accumulation logic is the same for all CRC polynomials,
972 be they sixteen or thirty-two bits wide. You simply choose the
973 appropriate table. Alternatively, because the table can be
974 generated at runtime, you can start by generating the table for
975 the polynomial in question and use exactly the same "updcrc",
976 if your application needn't simultaneously handle two CRC
977 polynomials. (Note, however, that XMODEM is strange.)
978
979 3. For 16-bit CRCs, the table entries need be only 16 bits wide;
980 of course, 32-bit entries work OK if the high 16 bits are zero.
981
982 4. The values must be right-shifted by eight bits by the "updcrc"
983 logic; the shift must be unsigned (bring in zeroes). On some
984 hardware you could probably optimize the shift in assembler by
985 using byte-swap instructions.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000986********************************************************************/
987
/* CRC-32 feedback terms for the reflected polynomial 0xedb88320,
 * indexed by (crc ^ byte) & 0xff.  Five entries per row. */
static const unsigned int crc_32_tab[256] = {
    0x00000000U, 0x77073096U, 0xee0e612cU, 0x990951baU, 0x076dc419U,
    0x706af48fU, 0xe963a535U, 0x9e6495a3U, 0x0edb8832U, 0x79dcb8a4U,
    0xe0d5e91eU, 0x97d2d988U, 0x09b64c2bU, 0x7eb17cbdU, 0xe7b82d07U,
    0x90bf1d91U, 0x1db71064U, 0x6ab020f2U, 0xf3b97148U, 0x84be41deU,
    0x1adad47dU, 0x6ddde4ebU, 0xf4d4b551U, 0x83d385c7U, 0x136c9856U,
    0x646ba8c0U, 0xfd62f97aU, 0x8a65c9ecU, 0x14015c4fU, 0x63066cd9U,
    0xfa0f3d63U, 0x8d080df5U, 0x3b6e20c8U, 0x4c69105eU, 0xd56041e4U,
    0xa2677172U, 0x3c03e4d1U, 0x4b04d447U, 0xd20d85fdU, 0xa50ab56bU,
    0x35b5a8faU, 0x42b2986cU, 0xdbbbc9d6U, 0xacbcf940U, 0x32d86ce3U,
    0x45df5c75U, 0xdcd60dcfU, 0xabd13d59U, 0x26d930acU, 0x51de003aU,
    0xc8d75180U, 0xbfd06116U, 0x21b4f4b5U, 0x56b3c423U, 0xcfba9599U,
    0xb8bda50fU, 0x2802b89eU, 0x5f058808U, 0xc60cd9b2U, 0xb10be924U,
    0x2f6f7c87U, 0x58684c11U, 0xc1611dabU, 0xb6662d3dU, 0x76dc4190U,
    0x01db7106U, 0x98d220bcU, 0xefd5102aU, 0x71b18589U, 0x06b6b51fU,
    0x9fbfe4a5U, 0xe8b8d433U, 0x7807c9a2U, 0x0f00f934U, 0x9609a88eU,
    0xe10e9818U, 0x7f6a0dbbU, 0x086d3d2dU, 0x91646c97U, 0xe6635c01U,
    0x6b6b51f4U, 0x1c6c6162U, 0x856530d8U, 0xf262004eU, 0x6c0695edU,
    0x1b01a57bU, 0x8208f4c1U, 0xf50fc457U, 0x65b0d9c6U, 0x12b7e950U,
    0x8bbeb8eaU, 0xfcb9887cU, 0x62dd1ddfU, 0x15da2d49U, 0x8cd37cf3U,
    0xfbd44c65U, 0x4db26158U, 0x3ab551ceU, 0xa3bc0074U, 0xd4bb30e2U,
    0x4adfa541U, 0x3dd895d7U, 0xa4d1c46dU, 0xd3d6f4fbU, 0x4369e96aU,
    0x346ed9fcU, 0xad678846U, 0xda60b8d0U, 0x44042d73U, 0x33031de5U,
    0xaa0a4c5fU, 0xdd0d7cc9U, 0x5005713cU, 0x270241aaU, 0xbe0b1010U,
    0xc90c2086U, 0x5768b525U, 0x206f85b3U, 0xb966d409U, 0xce61e49fU,
    0x5edef90eU, 0x29d9c998U, 0xb0d09822U, 0xc7d7a8b4U, 0x59b33d17U,
    0x2eb40d81U, 0xb7bd5c3bU, 0xc0ba6cadU, 0xedb88320U, 0x9abfb3b6U,
    0x03b6e20cU, 0x74b1d29aU, 0xead54739U, 0x9dd277afU, 0x04db2615U,
    0x73dc1683U, 0xe3630b12U, 0x94643b84U, 0x0d6d6a3eU, 0x7a6a5aa8U,
    0xe40ecf0bU, 0x9309ff9dU, 0x0a00ae27U, 0x7d079eb1U, 0xf00f9344U,
    0x8708a3d2U, 0x1e01f268U, 0x6906c2feU, 0xf762575dU, 0x806567cbU,
    0x196c3671U, 0x6e6b06e7U, 0xfed41b76U, 0x89d32be0U, 0x10da7a5aU,
    0x67dd4accU, 0xf9b9df6fU, 0x8ebeeff9U, 0x17b7be43U, 0x60b08ed5U,
    0xd6d6a3e8U, 0xa1d1937eU, 0x38d8c2c4U, 0x4fdff252U, 0xd1bb67f1U,
    0xa6bc5767U, 0x3fb506ddU, 0x48b2364bU, 0xd80d2bdaU, 0xaf0a1b4cU,
    0x36034af6U, 0x41047a60U, 0xdf60efc3U, 0xa867df55U, 0x316e8eefU,
    0x4669be79U, 0xcb61b38cU, 0xbc66831aU, 0x256fd2a0U, 0x5268e236U,
    0xcc0c7795U, 0xbb0b4703U, 0x220216b9U, 0x5505262fU, 0xc5ba3bbeU,
    0xb2bd0b28U, 0x2bb45a92U, 0x5cb36a04U, 0xc2d7ffa7U, 0xb5d0cf31U,
    0x2cd99e8bU, 0x5bdeae1dU, 0x9b64c2b0U, 0xec63f226U, 0x756aa39cU,
    0x026d930aU, 0x9c0906a9U, 0xeb0e363fU, 0x72076785U, 0x05005713U,
    0x95bf4a82U, 0xe2b87a14U, 0x7bb12baeU, 0x0cb61b38U, 0x92d28e9bU,
    0xe5d5be0dU, 0x7cdcefb7U, 0x0bdbdf21U, 0x86d3d2d4U, 0xf1d4e242U,
    0x68ddb3f8U, 0x1fda836eU, 0x81be16cdU, 0xf6b9265bU, 0x6fb077e1U,
    0x18b74777U, 0x88085ae6U, 0xff0f6a70U, 0x66063bcaU, 0x11010b5cU,
    0x8f659effU, 0xf862ae69U, 0x616bffd3U, 0x166ccf45U, 0xa00ae278U,
    0xd70dd2eeU, 0x4e048354U, 0x3903b3c2U, 0xa7672661U, 0xd06016f7U,
    0x4969474dU, 0x3e6e77dbU, 0xaed16a4aU, 0xd9d65adcU, 0x40df0b66U,
    0x37d83bf0U, 0xa9bcae53U, 0xdebb9ec5U, 0x47b2cf7fU, 0x30b5ffe9U,
    0xbdbdf21cU, 0xcabac28aU, 0x53b39330U, 0x24b4a3a6U, 0xbad03605U,
    0xcdd70693U, 0x54de5729U, 0x23d967bfU, 0xb3667a2eU, 0xc4614ab8U,
    0x5d681b02U, 0x2a6f2b94U, 0xb40bbe37U, 0xc30c8ea1U, 0x5a05df1bU,
    0x2d02ef8dU
};
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001042#endif /* USE_ZLIB_CRC32 */
Guido van Rossum7d47c9e2000-02-16 21:11:52 +00001043
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001044/*[clinic input]
1045binascii.crc32 -> unsigned_int
1046
1047 data: Py_buffer
1048 crc: unsigned_int(bitwise=True) = 0
1049 /
1050
1051Compute CRC-32 incrementally.
1052[clinic start generated code]*/
1053
1054static unsigned int
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001055binascii_crc32_impl(PyObject *module, Py_buffer *data, unsigned int crc)
1056/*[clinic end generated code: output=52cf59056a78593b input=bbe340bc99d25aa8]*/
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001057
1058#ifdef USE_ZLIB_CRC32
1059/* This was taken from zlibmodule.c PyZlib_crc32 (but is PY_SSIZE_T_CLEAN) */
1060{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001061 const Byte *buf;
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001062 Py_ssize_t len;
1063 int signed_val;
1064
1065 buf = (Byte*)data->buf;
1066 len = data->len;
1067 signed_val = crc32(crc, buf, len);
1068 return (unsigned int)signed_val & 0xffffffffU;
1069}
1070#else /* USE_ZLIB_CRC32 */
Guido van Rossum7d47c9e2000-02-16 21:11:52 +00001071{ /* By Jim Ahlstrom; All rights transferred to CNRI */
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001072 const unsigned char *bin_data;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001073 Py_ssize_t len;
1074 unsigned int result;
Tim Peters934c1a12002-07-02 22:24:50 +00001075
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001076 bin_data = data->buf;
1077 len = data->len;
Guido van Rossum7d47c9e2000-02-16 21:11:52 +00001078
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001079 crc = ~ crc;
1080 while (len-- > 0) {
1081 crc = crc_32_tab[(crc ^ *bin_data++) & 0xff] ^ (crc >> 8);
1082 /* Note: (crc >> 8) MUST zero fill on left */
1083 }
Tim Petersa98011c2002-07-02 20:20:08 +00001084
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001085 result = (crc ^ 0xFFFFFFFF);
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001086 return result & 0xffffffff;
Guido van Rossum7d47c9e2000-02-16 21:11:52 +00001087}
Christian Heimes1dc54002008-03-24 02:19:29 +00001088#endif /* USE_ZLIB_CRC32 */
Guido van Rossum7d47c9e2000-02-16 21:11:52 +00001089
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001090/*[clinic input]
1091binascii.b2a_hex
1092
1093 data: Py_buffer
1094 /
1095
1096Hexadecimal representation of binary data.
1097
1098The return value is a bytes object. This function is also
1099available as "hexlify()".
1100[clinic start generated code]*/
Barry Warsawe977c212000-08-15 06:07:13 +00001101
1102static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001103binascii_b2a_hex_impl(PyObject *module, Py_buffer *data)
1104/*[clinic end generated code: output=92fec1a95c9897a0 input=96423cfa299ff3b1]*/
Barry Warsawe977c212000-08-15 06:07:13 +00001105{
Gregory P. Smith9c6b9162015-04-26 00:42:13 +00001106 return _Py_strhex_bytes((const char *)data->buf, data->len);
Barry Warsawe977c212000-08-15 06:07:13 +00001107}
1108
Zachary Wareb176d402015-01-20 13:59:46 -06001109/*[clinic input]
1110binascii.hexlify = binascii.b2a_hex
1111
1112Hexadecimal representation of binary data.
1113
1114The return value is a bytes object.
1115[clinic start generated code]*/
1116
1117static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001118binascii_hexlify_impl(PyObject *module, Py_buffer *data)
1119/*[clinic end generated code: output=749e95e53c14880c input=2e3afae7f083f061]*/
Zachary Wareb176d402015-01-20 13:59:46 -06001120{
Gregory P. Smith9c6b9162015-04-26 00:42:13 +00001121 return _Py_strhex_bytes((const char *)data->buf, data->len);
Zachary Wareb176d402015-01-20 13:59:46 -06001122}
Barry Warsawe977c212000-08-15 06:07:13 +00001123
/* Return the value (0-15) of the hexadecimal digit c, accepting both
 * upper- and lower-case letters, or -1 if c is not a hex digit. */
static int
to_int(int c)
{
    int lowered;

    if (Py_ISDIGIT(c)) {
        return c - '0';
    }

    lowered = Py_ISUPPER(c) ? Py_TOLOWER(c) : c;
    if ('a' <= lowered && lowered <= 'f') {
        return lowered - 'a' + 10;
    }
    return -1;
}
1137
1138
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001139/*[clinic input]
1140binascii.a2b_hex
1141
1142 hexstr: ascii_buffer
1143 /
1144
1145Binary data of hexadecimal representation.
1146
1147hexstr must contain an even number of hex digits (upper or lower case).
1148This function is also available as "unhexlify()".
1149[clinic start generated code]*/
1150
Barry Warsawe977c212000-08-15 06:07:13 +00001151static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001152binascii_a2b_hex_impl(PyObject *module, Py_buffer *hexstr)
1153/*[clinic end generated code: output=0cc1a139af0eeecb input=9e1e7f2f94db24fd]*/
Barry Warsawe977c212000-08-15 06:07:13 +00001154{
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001155 const char* argbuf;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001156 Py_ssize_t arglen;
1157 PyObject *retval;
1158 char* retbuf;
1159 Py_ssize_t i, j;
Barry Warsawe977c212000-08-15 06:07:13 +00001160
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001161 argbuf = hexstr->buf;
1162 arglen = hexstr->len;
Barry Warsawe977c212000-08-15 06:07:13 +00001163
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001164 assert(arglen >= 0);
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +00001165
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001166 /* XXX What should we do about strings with an odd length? Should
1167 * we add an implicit leading zero, or a trailing zero? For now,
1168 * raise an exception.
1169 */
1170 if (arglen % 2) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001171 PyErr_SetString(Error, "Odd-length string");
1172 return NULL;
1173 }
Barry Warsawe977c212000-08-15 06:07:13 +00001174
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001175 retval = PyBytes_FromStringAndSize(NULL, (arglen/2));
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001176 if (!retval)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001177 return NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001178 retbuf = PyBytes_AS_STRING(retval);
Barry Warsawe977c212000-08-15 06:07:13 +00001179
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001180 for (i=j=0; i < arglen; i += 2) {
1181 int top = to_int(Py_CHARMASK(argbuf[i]));
1182 int bot = to_int(Py_CHARMASK(argbuf[i+1]));
1183 if (top == -1 || bot == -1) {
1184 PyErr_SetString(Error,
1185 "Non-hexadecimal digit found");
1186 goto finally;
1187 }
1188 retbuf[j++] = (top << 4) + bot;
1189 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001190 return retval;
Barry Warsawe977c212000-08-15 06:07:13 +00001191
1192 finally:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001193 Py_DECREF(retval);
1194 return NULL;
Barry Warsawe977c212000-08-15 06:07:13 +00001195}
1196
Zachary Wareb176d402015-01-20 13:59:46 -06001197/*[clinic input]
1198binascii.unhexlify = binascii.a2b_hex
1199
1200Binary data of hexadecimal representation.
1201
1202hexstr must contain an even number of hex digits (upper or lower case).
1203[clinic start generated code]*/
1204
1205static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001206binascii_unhexlify_impl(PyObject *module, Py_buffer *hexstr)
1207/*[clinic end generated code: output=51a64c06c79629e3 input=dd8c012725f462da]*/
Zachary Wareb176d402015-01-20 13:59:46 -06001208{
1209 return binascii_a2b_hex_impl(module, hexstr);
1210}
1211
/* Value of each 7-bit ASCII character as a hexadecimal digit, or -1 when
 * the character is not one.  One row per 16 code points. */
static const int table_hex[128] = {
    /* 0x00-0x0f */ -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* 0x10-0x1f */ -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* 0x20-0x2f */ -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* '0'-'9'.. */  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, -1, -1, -1, -1, -1, -1,
    /* '@','A'.. */ -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* 0x50-0x5f */ -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* '`','a'.. */ -1, 10, 11, 12, 13, 14, 15, -1, -1, -1, -1, -1, -1, -1, -1, -1,
    /* 0x70-0x7f */ -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1
};

/* Look up a character in table_hex.  The table has only 128 entries, so
 * c must be below 128. */
#define hexval(c) table_hex[(unsigned int)(c)]

#define MAXLINESIZE 76
1226
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001227
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001228/*[clinic input]
1229binascii.a2b_qp
1230
Serhiy Storchaka12785612014-01-25 11:49:49 +02001231 data: ascii_buffer
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001232 header: int(c_default="0") = False
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001233
1234Decode a string of qp-encoded data.
1235[clinic start generated code]*/
1236
1237static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001238binascii_a2b_qp_impl(PyObject *module, Py_buffer *data, int header)
1239/*[clinic end generated code: output=e99f7846cfb9bc53 input=5187a0d3d8e54f3b]*/
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001240{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001241 Py_ssize_t in, out;
1242 char ch;
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001243 const unsigned char *ascii_data;
1244 unsigned char *odata;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001245 Py_ssize_t datalen = 0;
1246 PyObject *rv;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001247
Serhiy Storchaka12785612014-01-25 11:49:49 +02001248 ascii_data = data->buf;
1249 datalen = data->len;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001250
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001251 /* We allocate the output same size as input, this is overkill.
1252 * The previous implementation used calloc() so we'll zero out the
1253 * memory here too, since PyMem_Malloc() does not guarantee that.
1254 */
1255 odata = (unsigned char *) PyMem_Malloc(datalen);
1256 if (odata == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001257 PyErr_NoMemory();
1258 return NULL;
1259 }
1260 memset(odata, 0, datalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001261
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001262 in = out = 0;
1263 while (in < datalen) {
Serhiy Storchaka12785612014-01-25 11:49:49 +02001264 if (ascii_data[in] == '=') {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001265 in++;
1266 if (in >= datalen) break;
1267 /* Soft line breaks */
Serhiy Storchaka12785612014-01-25 11:49:49 +02001268 if ((ascii_data[in] == '\n') || (ascii_data[in] == '\r')) {
1269 if (ascii_data[in] != '\n') {
1270 while (in < datalen && ascii_data[in] != '\n') in++;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001271 }
1272 if (in < datalen) in++;
1273 }
Serhiy Storchaka12785612014-01-25 11:49:49 +02001274 else if (ascii_data[in] == '=') {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001275 /* broken case from broken python qp */
1276 odata[out++] = '=';
1277 in++;
1278 }
Serhiy Storchakae6265e92016-09-14 16:34:37 +03001279 else if ((in + 1 < datalen) &&
1280 ((ascii_data[in] >= 'A' && ascii_data[in] <= 'F') ||
Serhiy Storchaka12785612014-01-25 11:49:49 +02001281 (ascii_data[in] >= 'a' && ascii_data[in] <= 'f') ||
1282 (ascii_data[in] >= '0' && ascii_data[in] <= '9')) &&
1283 ((ascii_data[in+1] >= 'A' && ascii_data[in+1] <= 'F') ||
1284 (ascii_data[in+1] >= 'a' && ascii_data[in+1] <= 'f') ||
1285 (ascii_data[in+1] >= '0' && ascii_data[in+1] <= '9'))) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001286 /* hexval */
Serhiy Storchaka12785612014-01-25 11:49:49 +02001287 ch = hexval(ascii_data[in]) << 4;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001288 in++;
Serhiy Storchaka12785612014-01-25 11:49:49 +02001289 ch |= hexval(ascii_data[in]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001290 in++;
1291 odata[out++] = ch;
1292 }
1293 else {
1294 odata[out++] = '=';
1295 }
1296 }
Serhiy Storchaka12785612014-01-25 11:49:49 +02001297 else if (header && ascii_data[in] == '_') {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001298 odata[out++] = ' ';
1299 in++;
1300 }
1301 else {
Serhiy Storchaka12785612014-01-25 11:49:49 +02001302 odata[out] = ascii_data[in];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001303 in++;
1304 out++;
1305 }
1306 }
1307 if ((rv = PyBytes_FromStringAndSize((char *)odata, out)) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001308 PyMem_Free(odata);
1309 return NULL;
1310 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001311 PyMem_Free(odata);
1312 return rv;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001313}
1314
/*
 * Write the two-character uppercase hexadecimal representation of `ch`
 * into s[0] (high nibble) and s[1] (low nibble).  No terminating NUL is
 * written; the caller must provide room for exactly two bytes.
 * Always returns 0.
 */
static int
to_hex (unsigned char ch, unsigned char *s)
{
    static const char hexdigits[] = "0123456789ABCDEF";

    s[0] = hexdigits[(ch >> 4) & 0x0F];
    s[1] = hexdigits[ch & 0x0F];
    return 0;
}
1325
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001326/* XXX: This is ridiculously complicated to be backward compatible
1327 * (mostly) with the quopri module. It doesn't re-create the quopri
1328 * module bug where text ending in CRLF has the CR encoded */
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001329
1330/*[clinic input]
1331binascii.b2a_qp
1332
1333 data: Py_buffer
1334 quotetabs: int(c_default="0") = False
1335 istext: int(c_default="1") = True
1336 header: int(c_default="0") = False
1337
1338Encode a string using quoted-printable encoding.
1339
1340On encoding, when istext is set, newlines are not encoded, and white
1341space at end of lines is. When istext is not set, \r and \n (CR/LF)
1342are both encoded. When quotetabs is set, space and tabs are encoded.
1343[clinic start generated code]*/
1344
1345static PyObject *
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001346binascii_b2a_qp_impl(PyObject *module, Py_buffer *data, int quotetabs,
Larry Hastings89964c42015-04-14 18:07:59 -04001347 int istext, int header)
Serhiy Storchaka1a2b24f2016-07-07 17:35:15 +03001348/*[clinic end generated code: output=e9884472ebb1a94c input=7f2a9aaa008e92b2]*/
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001349{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001350 Py_ssize_t in, out;
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001351 const unsigned char *databuf;
1352 unsigned char *odata;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001353 Py_ssize_t datalen = 0, odatalen = 0;
1354 PyObject *rv;
1355 unsigned int linelen = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001356 unsigned char ch;
1357 int crlf = 0;
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001358 const unsigned char *p;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001359
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001360 databuf = data->buf;
1361 datalen = data->len;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001362
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001363 /* See if this string is using CRLF line ends */
1364 /* XXX: this function has the side effect of converting all of
1365 * the end of lines to be the same depending on this detection
1366 * here */
Serhiy Storchakaef1585e2015-12-25 20:01:53 +02001367 p = (const unsigned char *) memchr(databuf, '\n', datalen);
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001368 if ((p != NULL) && (p > databuf) && (*(p-1) == '\r'))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001369 crlf = 1;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001370
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001371 /* First, scan to see how many characters need to be encoded */
1372 in = 0;
1373 while (in < datalen) {
Benjamin Peterson4f976512016-08-13 18:33:33 -07001374 Py_ssize_t delta = 0;
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001375 if ((databuf[in] > 126) ||
1376 (databuf[in] == '=') ||
1377 (header && databuf[in] == '_') ||
1378 ((databuf[in] == '.') && (linelen == 0) &&
Serhiy Storchakae6265e92016-09-14 16:34:37 +03001379 (in + 1 == datalen || databuf[in+1] == '\n' ||
1380 databuf[in+1] == '\r' || databuf[in+1] == 0)) ||
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001381 (!istext && ((databuf[in] == '\r') || (databuf[in] == '\n'))) ||
1382 ((databuf[in] == '\t' || databuf[in] == ' ') && (in + 1 == datalen)) ||
1383 ((databuf[in] < 33) &&
1384 (databuf[in] != '\r') && (databuf[in] != '\n') &&
1385 (quotetabs || ((databuf[in] != '\t') && (databuf[in] != ' ')))))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001386 {
1387 if ((linelen + 3) >= MAXLINESIZE) {
1388 linelen = 0;
1389 if (crlf)
Benjamin Peterson4f976512016-08-13 18:33:33 -07001390 delta += 3;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001391 else
Benjamin Peterson4f976512016-08-13 18:33:33 -07001392 delta += 2;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001393 }
1394 linelen += 3;
Benjamin Peterson4f976512016-08-13 18:33:33 -07001395 delta += 3;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001396 in++;
1397 }
1398 else {
1399 if (istext &&
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001400 ((databuf[in] == '\n') ||
1401 ((in+1 < datalen) && (databuf[in] == '\r') &&
1402 (databuf[in+1] == '\n'))))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001403 {
1404 linelen = 0;
1405 /* Protect against whitespace on end of line */
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001406 if (in && ((databuf[in-1] == ' ') || (databuf[in-1] == '\t')))
Benjamin Peterson4f976512016-08-13 18:33:33 -07001407 delta += 2;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001408 if (crlf)
Benjamin Peterson4f976512016-08-13 18:33:33 -07001409 delta += 2;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001410 else
Benjamin Peterson4f976512016-08-13 18:33:33 -07001411 delta += 1;
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001412 if (databuf[in] == '\r')
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001413 in += 2;
1414 else
1415 in++;
1416 }
1417 else {
1418 if ((in + 1 != datalen) &&
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001419 (databuf[in+1] != '\n') &&
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001420 (linelen + 1) >= MAXLINESIZE) {
1421 linelen = 0;
1422 if (crlf)
Benjamin Peterson4f976512016-08-13 18:33:33 -07001423 delta += 3;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001424 else
Benjamin Peterson4f976512016-08-13 18:33:33 -07001425 delta += 2;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001426 }
1427 linelen++;
Benjamin Peterson4f976512016-08-13 18:33:33 -07001428 delta++;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001429 in++;
1430 }
1431 }
Benjamin Peterson4f976512016-08-13 18:33:33 -07001432 if (PY_SSIZE_T_MAX - delta < odatalen) {
Benjamin Peterson4f976512016-08-13 18:33:33 -07001433 PyErr_NoMemory();
1434 return NULL;
1435 }
1436 odatalen += delta;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001437 }
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001438
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001439 /* We allocate the output same size as input, this is overkill.
1440 * The previous implementation used calloc() so we'll zero out the
1441 * memory here too, since PyMem_Malloc() does not guarantee that.
1442 */
1443 odata = (unsigned char *) PyMem_Malloc(odatalen);
1444 if (odata == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001445 PyErr_NoMemory();
1446 return NULL;
1447 }
1448 memset(odata, 0, odatalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001449
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001450 in = out = linelen = 0;
1451 while (in < datalen) {
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001452 if ((databuf[in] > 126) ||
1453 (databuf[in] == '=') ||
1454 (header && databuf[in] == '_') ||
1455 ((databuf[in] == '.') && (linelen == 0) &&
Serhiy Storchakae6265e92016-09-14 16:34:37 +03001456 (in + 1 == datalen || databuf[in+1] == '\n' ||
1457 databuf[in+1] == '\r' || databuf[in+1] == 0)) ||
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001458 (!istext && ((databuf[in] == '\r') || (databuf[in] == '\n'))) ||
1459 ((databuf[in] == '\t' || databuf[in] == ' ') && (in + 1 == datalen)) ||
1460 ((databuf[in] < 33) &&
1461 (databuf[in] != '\r') && (databuf[in] != '\n') &&
Serhiy Storchakae6265e92016-09-14 16:34:37 +03001462 (quotetabs || ((databuf[in] != '\t') && (databuf[in] != ' ')))))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001463 {
1464 if ((linelen + 3 )>= MAXLINESIZE) {
1465 odata[out++] = '=';
1466 if (crlf) odata[out++] = '\r';
1467 odata[out++] = '\n';
1468 linelen = 0;
1469 }
1470 odata[out++] = '=';
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001471 to_hex(databuf[in], &odata[out]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 out += 2;
1473 in++;
1474 linelen += 3;
1475 }
1476 else {
1477 if (istext &&
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001478 ((databuf[in] == '\n') ||
1479 ((in+1 < datalen) && (databuf[in] == '\r') &&
1480 (databuf[in+1] == '\n'))))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001481 {
1482 linelen = 0;
1483 /* Protect against whitespace on end of line */
1484 if (out && ((odata[out-1] == ' ') || (odata[out-1] == '\t'))) {
1485 ch = odata[out-1];
1486 odata[out-1] = '=';
1487 to_hex(ch, &odata[out]);
1488 out += 2;
1489 }
Tim Peters934c1a12002-07-02 22:24:50 +00001490
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001491 if (crlf) odata[out++] = '\r';
1492 odata[out++] = '\n';
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001493 if (databuf[in] == '\r')
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001494 in += 2;
1495 else
1496 in++;
1497 }
1498 else {
1499 if ((in + 1 != datalen) &&
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001500 (databuf[in+1] != '\n') &&
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001501 (linelen + 1) >= MAXLINESIZE) {
1502 odata[out++] = '=';
1503 if (crlf) odata[out++] = '\r';
1504 odata[out++] = '\n';
1505 linelen = 0;
1506 }
1507 linelen++;
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001508 if (header && databuf[in] == ' ') {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001509 odata[out++] = '_';
1510 in++;
1511 }
1512 else {
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001513 odata[out++] = databuf[in++];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001514 }
1515 }
1516 }
1517 }
1518 if ((rv = PyBytes_FromStringAndSize((char *)odata, out)) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001519 PyMem_Free(odata);
1520 return NULL;
1521 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001522 PyMem_Free(odata);
1523 return rv;
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001524}
Barry Warsawe977c212000-08-15 06:07:13 +00001525
Jack Jansen72781191995-08-07 14:34:15 +00001526/* List of functions defined in the module */
1527
1528static struct PyMethodDef binascii_module_methods[] = {
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001529 BINASCII_A2B_UU_METHODDEF
1530 BINASCII_B2A_UU_METHODDEF
1531 BINASCII_A2B_BASE64_METHODDEF
1532 BINASCII_B2A_BASE64_METHODDEF
1533 BINASCII_A2B_HQX_METHODDEF
1534 BINASCII_B2A_HQX_METHODDEF
1535 BINASCII_A2B_HEX_METHODDEF
1536 BINASCII_B2A_HEX_METHODDEF
Zachary Wareb176d402015-01-20 13:59:46 -06001537 BINASCII_HEXLIFY_METHODDEF
1538 BINASCII_UNHEXLIFY_METHODDEF
Serhiy Storchaka3ffd9132014-01-25 11:21:23 +02001539 BINASCII_RLECODE_HQX_METHODDEF
1540 BINASCII_RLEDECODE_HQX_METHODDEF
1541 BINASCII_CRC_HQX_METHODDEF
1542 BINASCII_CRC32_METHODDEF
1543 BINASCII_A2B_QP_METHODDEF
1544 BINASCII_B2A_QP_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001545 {NULL, NULL} /* sentinel */
Jack Jansen72781191995-08-07 14:34:15 +00001546};
1547
1548
Martin v. Löwis1a214512008-06-11 05:26:20 +00001549/* Initialization function for the module (*must* be called PyInit_binascii) */
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001550PyDoc_STRVAR(doc_binascii, "Conversion between binary data and ASCII");
Jack Jansen72781191995-08-07 14:34:15 +00001551
Martin v. Löwis1a214512008-06-11 05:26:20 +00001552
1553static struct PyModuleDef binasciimodule = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001554 PyModuleDef_HEAD_INIT,
1555 "binascii",
1556 doc_binascii,
1557 -1,
1558 binascii_module_methods,
1559 NULL,
1560 NULL,
1561 NULL,
1562 NULL
Martin v. Löwis1a214512008-06-11 05:26:20 +00001563};
1564
Mark Hammondfe51c6d2002-08-02 02:27:13 +00001565PyMODINIT_FUNC
Martin v. Löwis1a214512008-06-11 05:26:20 +00001566PyInit_binascii(void)
Jack Jansen72781191995-08-07 14:34:15 +00001567{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001568 PyObject *m, *d;
Jack Jansen72781191995-08-07 14:34:15 +00001569
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001570 /* Create the module and add the functions */
1571 m = PyModule_Create(&binasciimodule);
1572 if (m == NULL)
1573 return NULL;
Jack Jansen72781191995-08-07 14:34:15 +00001574
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001575 d = PyModule_GetDict(m);
Jack Jansen72781191995-08-07 14:34:15 +00001576
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001577 Error = PyErr_NewException("binascii.Error", PyExc_ValueError, NULL);
1578 PyDict_SetItemString(d, "Error", Error);
1579 Incomplete = PyErr_NewException("binascii.Incomplete", NULL, NULL);
1580 PyDict_SetItemString(d, "Incomplete", Incomplete);
1581 if (PyErr_Occurred()) {
1582 Py_DECREF(m);
1583 m = NULL;
1584 }
1585 return m;
Jack Jansen72781191995-08-07 14:34:15 +00001586}