blob: ec07a7170a86ad0d71c0fa2bb3b6919aa4de7d7a [file] [log] [blame]
Jack Jansen72781191995-08-07 14:34:15 +00001/*
2** Routines to represent binary data in ASCII and vice-versa
3**
4** This module currently supports the following encodings:
5** uuencode:
6** each line encodes 45 bytes (except possibly the last)
7** First char encodes (binary) length, rest data
8** each char encodes 6 bits, as follows:
9** binary: 01234567 abcdefgh ijklmnop
10** ascii: 012345 67abcd efghij klmnop
11** ASCII encoding method is "excess-space": 000000 is encoded as ' ', etc.
12** short binary data is zero-extended (so the bits are always in the
13** right place), this does *not* reflect in the length.
Jack Jansen84bbc2e1995-10-04 16:38:44 +000014** base64:
15** Line breaks are insignificant, but lines are at most 76 chars
16** each char encodes 6 bits, in similar order as uucode/hqx. Encoding
17** is done via a table.
18** Short binary data is filled (in ASCII) with '='.
Jack Jansen72781191995-08-07 14:34:15 +000019** hqx:
20** File starts with introductory text, real data starts and ends
21** with colons.
22** Data consists of three similar parts: info, datafork, resourcefork.
23** Each part is protected (at the end) with a 16-bit crc
24** The binary data is run-length encoded, and then ascii-fied:
25** binary: 01234567 abcdefgh ijklmnop
26** ascii: 012345 67abcd efghij klmnop
27** ASCII encoding is table-driven, see the code.
28** Short binary data results in the runt ascii-byte being output with
29** the bits in the right place.
30**
31** While I was reading dozens of programs that encode or decode the formats
32** here (documentation? hihi:-) I have formulated Jansen's Observation:
33**
34** Programs that encode binary data in ASCII are written in
35** such a style that they are as unreadable as possible. Devices used
36** include unnecessary global variables, burying important tables
37** in unrelated sourcefiles, putting functions in include files,
38** using seemingly-descriptive variable names for different purposes,
39** calls to empty subroutines and a host of others.
40**
41** I have attempted to break with this tradition, but I guess that that
42** does make the performance sub-optimal. Oh well, too bad...
43**
44** Jack Jansen, CWI, July 1995.
Tim Peters934c1a12002-07-02 22:24:50 +000045**
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000046** Added support for quoted-printable encoding, based on rfc 1521 et al
Tim Peters934c1a12002-07-02 22:24:50 +000047** quoted-printable encoding specifies that non printable characters (anything
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000048** below 32 and above 126) be encoded as =XX where XX is the hexadecimal value
49** of the character. It also specifies some other behavior to enable 8bit data
Tim Peters934c1a12002-07-02 22:24:50 +000050** in a mail message with little difficulty (maximum line sizes, protecting
51** some cases of whitespace, etc).
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000052**
53** Brandon Long, September 2001.
Jack Jansen72781191995-08-07 14:34:15 +000054*/
55
56
57#include "Python.h"
58
59static PyObject *Error;
60static PyObject *Incomplete;
61
62/*
63** hqx lookup table, ascii->binary.
64*/
65
66#define RUNCHAR 0x90
67
68#define DONE 0x7F
69#define SKIP 0x7E
70#define FAIL 0x7D
71
72static unsigned char table_a2b_hqx[256] = {
73/* ^@ ^A ^B ^C ^D ^E ^F ^G */
74/* 0*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
75/* \b \t \n ^K ^L \r ^N ^O */
76/* 1*/ FAIL, FAIL, SKIP, FAIL, FAIL, SKIP, FAIL, FAIL,
77/* ^P ^Q ^R ^S ^T ^U ^V ^W */
78/* 2*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
79/* ^X ^Y ^Z ^[ ^\ ^] ^^ ^_ */
80/* 3*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
81/* ! " # $ % & ' */
82/* 4*/ FAIL, 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06,
83/* ( ) * + , - . / */
84/* 5*/ 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, FAIL, FAIL,
85/* 0 1 2 3 4 5 6 7 */
86/* 6*/ 0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12, 0x13, FAIL,
87/* 8 9 : ; < = > ? */
88/* 7*/ 0x14, 0x15, DONE, FAIL, FAIL, FAIL, FAIL, FAIL,
89/* @ A B C D E F G */
90/* 8*/ 0x16, 0x17, 0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D,
91/* H I J K L M N O */
92/* 9*/ 0x1E, 0x1F, 0x20, 0x21, 0x22, 0x23, 0x24, FAIL,
93/* P Q R S T U V W */
94/*10*/ 0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x2B, FAIL,
95/* X Y Z [ \ ] ^ _ */
96/*11*/ 0x2C, 0x2D, 0x2E, 0x2F, FAIL, FAIL, FAIL, FAIL,
97/* ` a b c d e f g */
98/*12*/ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, FAIL,
99/* h i j k l m n o */
100/*13*/ 0x37, 0x38, 0x39, 0x3A, 0x3B, 0x3C, FAIL, FAIL,
101/* p q r s t u v w */
102/*14*/ 0x3D, 0x3E, 0x3F, FAIL, FAIL, FAIL, FAIL, FAIL,
103/* x y z { | } ~ ^? */
104/*15*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
105/*16*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
106 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
107 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
108 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
109 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
110 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
111 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
112 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
113 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
114 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
115 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
116 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
117 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
118 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
119 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
120 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
121};
122
123static unsigned char table_b2a_hqx[] =
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000124"!\"#$%&'()*+,-012345689@ABCDEFGHIJKLMNPQRSTUVXYZ[`abcdefhijklmpqr";
Jack Jansen72781191995-08-07 14:34:15 +0000125
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000126static char table_a2b_base64[] = {
127 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
128 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
129 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,62, -1,-1,-1,63,
130 52,53,54,55, 56,57,58,59, 60,61,-1,-1, -1, 0,-1,-1, /* Note PAD->0 */
131 -1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9,10, 11,12,13,14,
132 15,16,17,18, 19,20,21,22, 23,24,25,-1, -1,-1,-1,-1,
133 -1,26,27,28, 29,30,31,32, 33,34,35,36, 37,38,39,40,
134 41,42,43,44, 45,46,47,48, 49,50,51,-1, -1,-1,-1,-1
135};
136
137#define BASE64_PAD '='
Guido van Rossum355bc0c2001-10-30 03:00:52 +0000138
139/* Max binary chunk size; limited only by available memory */
Tim Peters1fbb5772001-12-19 04:41:35 +0000140#define BASE64_MAXBIN (INT_MAX/2 - sizeof(PyStringObject) - 3)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000141
142static unsigned char table_b2a_base64[] =
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000143"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000144
145
146
Jack Jansen72781191995-08-07 14:34:15 +0000147static unsigned short crctab_hqx[256] = {
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000148 0x0000, 0x1021, 0x2042, 0x3063, 0x4084, 0x50a5, 0x60c6, 0x70e7,
149 0x8108, 0x9129, 0xa14a, 0xb16b, 0xc18c, 0xd1ad, 0xe1ce, 0xf1ef,
150 0x1231, 0x0210, 0x3273, 0x2252, 0x52b5, 0x4294, 0x72f7, 0x62d6,
151 0x9339, 0x8318, 0xb37b, 0xa35a, 0xd3bd, 0xc39c, 0xf3ff, 0xe3de,
152 0x2462, 0x3443, 0x0420, 0x1401, 0x64e6, 0x74c7, 0x44a4, 0x5485,
153 0xa56a, 0xb54b, 0x8528, 0x9509, 0xe5ee, 0xf5cf, 0xc5ac, 0xd58d,
154 0x3653, 0x2672, 0x1611, 0x0630, 0x76d7, 0x66f6, 0x5695, 0x46b4,
155 0xb75b, 0xa77a, 0x9719, 0x8738, 0xf7df, 0xe7fe, 0xd79d, 0xc7bc,
156 0x48c4, 0x58e5, 0x6886, 0x78a7, 0x0840, 0x1861, 0x2802, 0x3823,
157 0xc9cc, 0xd9ed, 0xe98e, 0xf9af, 0x8948, 0x9969, 0xa90a, 0xb92b,
158 0x5af5, 0x4ad4, 0x7ab7, 0x6a96, 0x1a71, 0x0a50, 0x3a33, 0x2a12,
159 0xdbfd, 0xcbdc, 0xfbbf, 0xeb9e, 0x9b79, 0x8b58, 0xbb3b, 0xab1a,
160 0x6ca6, 0x7c87, 0x4ce4, 0x5cc5, 0x2c22, 0x3c03, 0x0c60, 0x1c41,
161 0xedae, 0xfd8f, 0xcdec, 0xddcd, 0xad2a, 0xbd0b, 0x8d68, 0x9d49,
162 0x7e97, 0x6eb6, 0x5ed5, 0x4ef4, 0x3e13, 0x2e32, 0x1e51, 0x0e70,
163 0xff9f, 0xefbe, 0xdfdd, 0xcffc, 0xbf1b, 0xaf3a, 0x9f59, 0x8f78,
164 0x9188, 0x81a9, 0xb1ca, 0xa1eb, 0xd10c, 0xc12d, 0xf14e, 0xe16f,
165 0x1080, 0x00a1, 0x30c2, 0x20e3, 0x5004, 0x4025, 0x7046, 0x6067,
166 0x83b9, 0x9398, 0xa3fb, 0xb3da, 0xc33d, 0xd31c, 0xe37f, 0xf35e,
167 0x02b1, 0x1290, 0x22f3, 0x32d2, 0x4235, 0x5214, 0x6277, 0x7256,
168 0xb5ea, 0xa5cb, 0x95a8, 0x8589, 0xf56e, 0xe54f, 0xd52c, 0xc50d,
169 0x34e2, 0x24c3, 0x14a0, 0x0481, 0x7466, 0x6447, 0x5424, 0x4405,
170 0xa7db, 0xb7fa, 0x8799, 0x97b8, 0xe75f, 0xf77e, 0xc71d, 0xd73c,
171 0x26d3, 0x36f2, 0x0691, 0x16b0, 0x6657, 0x7676, 0x4615, 0x5634,
172 0xd94c, 0xc96d, 0xf90e, 0xe92f, 0x99c8, 0x89e9, 0xb98a, 0xa9ab,
173 0x5844, 0x4865, 0x7806, 0x6827, 0x18c0, 0x08e1, 0x3882, 0x28a3,
174 0xcb7d, 0xdb5c, 0xeb3f, 0xfb1e, 0x8bf9, 0x9bd8, 0xabbb, 0xbb9a,
175 0x4a75, 0x5a54, 0x6a37, 0x7a16, 0x0af1, 0x1ad0, 0x2ab3, 0x3a92,
176 0xfd2e, 0xed0f, 0xdd6c, 0xcd4d, 0xbdaa, 0xad8b, 0x9de8, 0x8dc9,
177 0x7c26, 0x6c07, 0x5c64, 0x4c45, 0x3ca2, 0x2c83, 0x1ce0, 0x0cc1,
178 0xef1f, 0xff3e, 0xcf5d, 0xdf7c, 0xaf9b, 0xbfba, 0x8fd9, 0x9ff8,
179 0x6e17, 0x7e36, 0x4e55, 0x5e74, 0x2e93, 0x3eb2, 0x0ed1, 0x1ef0,
Jack Jansen72781191995-08-07 14:34:15 +0000180};
181
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000182PyDoc_STRVAR(doc_a2b_uu, "(ascii) -> bin. Decode a line of uuencoded data");
Jack Jansen72781191995-08-07 14:34:15 +0000183
184static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000185binascii_a2b_uu(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000186{
187 unsigned char *ascii_data, *bin_data;
188 int leftbits = 0;
189 unsigned char this_ch;
190 unsigned int leftchar = 0;
191 PyObject *rv;
192 int ascii_len, bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000193
Guido van Rossum43713e52000-02-29 13:59:29 +0000194 if ( !PyArg_ParseTuple(args, "t#:a2b_uu", &ascii_data, &ascii_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000195 return NULL;
196
197 /* First byte: binary data length (in bytes) */
198 bin_len = (*ascii_data++ - ' ') & 077;
199 ascii_len--;
200
201 /* Allocate the buffer */
202 if ( (rv=PyString_FromStringAndSize(NULL, bin_len)) == NULL )
203 return NULL;
204 bin_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000205
Jack Jansen72781191995-08-07 14:34:15 +0000206 for( ; bin_len > 0 ; ascii_len--, ascii_data++ ) {
207 this_ch = *ascii_data;
208 if ( this_ch == '\n' || this_ch == '\r' || ascii_len <= 0) {
209 /*
210 ** Whitespace. Assume some spaces got eaten at
211 ** end-of-line. (We check this later)
212 */
213 this_ch = 0;
214 } else {
Jack Jansen5d957971995-11-14 10:35:19 +0000215 /* Check the character for legality
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000216 ** The 64 in stead of the expected 63 is because
217 ** there are a few uuencodes out there that use
Guido van Rossum92d89172001-01-09 02:11:57 +0000218 ** '`' as zero instead of space.
Jack Jansen5d957971995-11-14 10:35:19 +0000219 */
220 if ( this_ch < ' ' || this_ch > (' ' + 64)) {
Jack Jansen72781191995-08-07 14:34:15 +0000221 PyErr_SetString(Error, "Illegal char");
222 Py_DECREF(rv);
223 return NULL;
224 }
225 this_ch = (this_ch - ' ') & 077;
226 }
227 /*
228 ** Shift it in on the low end, and see if there's
229 ** a byte ready for output.
230 */
231 leftchar = (leftchar << 6) | (this_ch);
232 leftbits += 6;
233 if ( leftbits >= 8 ) {
234 leftbits -= 8;
235 *bin_data++ = (leftchar >> leftbits) & 0xff;
236 leftchar &= ((1 << leftbits) - 1);
237 bin_len--;
238 }
239 }
240 /*
241 ** Finally, check that if there's anything left on the line
242 ** that it's whitespace only.
243 */
244 while( ascii_len-- > 0 ) {
245 this_ch = *ascii_data++;
Guido van Rossum92d89172001-01-09 02:11:57 +0000246 /* Extra '`' may be written as padding in some cases */
247 if ( this_ch != ' ' && this_ch != ' '+64 &&
Guido van Rossum1243ae71997-07-11 18:36:28 +0000248 this_ch != '\n' && this_ch != '\r' ) {
Jack Jansen72781191995-08-07 14:34:15 +0000249 PyErr_SetString(Error, "Trailing garbage");
250 Py_DECREF(rv);
251 return NULL;
252 }
253 }
254 return rv;
255}
256
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000257PyDoc_STRVAR(doc_b2a_uu, "(bin) -> ascii. Uuencode line of data");
Tim Peters934c1a12002-07-02 22:24:50 +0000258
Jack Jansen72781191995-08-07 14:34:15 +0000259static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000260binascii_b2a_uu(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000261{
262 unsigned char *ascii_data, *bin_data;
263 int leftbits = 0;
264 unsigned char this_ch;
265 unsigned int leftchar = 0;
266 PyObject *rv;
267 int bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000268
Guido van Rossum43713e52000-02-29 13:59:29 +0000269 if ( !PyArg_ParseTuple(args, "s#:b2a_uu", &bin_data, &bin_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000270 return NULL;
271 if ( bin_len > 45 ) {
272 /* The 45 is a limit that appears in all uuencode's */
273 PyErr_SetString(Error, "At most 45 bytes at once");
274 return NULL;
275 }
276
277 /* We're lazy and allocate to much (fixed up later) */
278 if ( (rv=PyString_FromStringAndSize(NULL, bin_len*2)) == NULL )
279 return NULL;
280 ascii_data = (unsigned char *)PyString_AsString(rv);
281
282 /* Store the length */
283 *ascii_data++ = ' ' + (bin_len & 077);
Tim Peters934c1a12002-07-02 22:24:50 +0000284
Jack Jansen72781191995-08-07 14:34:15 +0000285 for( ; bin_len > 0 || leftbits != 0 ; bin_len--, bin_data++ ) {
286 /* Shift the data (or padding) into our buffer */
287 if ( bin_len > 0 ) /* Data */
288 leftchar = (leftchar << 8) | *bin_data;
289 else /* Padding */
290 leftchar <<= 8;
291 leftbits += 8;
292
293 /* See if there are 6-bit groups ready */
294 while ( leftbits >= 6 ) {
295 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
296 leftbits -= 6;
297 *ascii_data++ = this_ch + ' ';
298 }
299 }
300 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000301
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000302 _PyString_Resize(&rv, (ascii_data -
303 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000304 return rv;
305}
306
Guido van Rossum2db4f471999-10-19 19:05:14 +0000307
308static int
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000309binascii_find_valid(unsigned char *s, int slen, int num)
Guido van Rossum2db4f471999-10-19 19:05:14 +0000310{
Tim Peters934c1a12002-07-02 22:24:50 +0000311 /* Finds & returns the (num+1)th
Guido van Rossum2db4f471999-10-19 19:05:14 +0000312 ** valid character for base64, or -1 if none.
313 */
314
315 int ret = -1;
316 unsigned char c, b64val;
317
318 while ((slen > 0) && (ret == -1)) {
319 c = *s;
320 b64val = table_a2b_base64[c & 0x7f];
321 if ( ((c <= 0x7f) && (b64val != (unsigned char)-1)) ) {
322 if (num == 0)
323 ret = *s;
324 num--;
325 }
326
327 s++;
328 slen--;
329 }
330 return ret;
331}
332
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000333PyDoc_STRVAR(doc_a2b_base64, "(ascii) -> bin. Decode a line of base64 data");
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000334
335static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000336binascii_a2b_base64(PyObject *self, PyObject *args)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000337{
338 unsigned char *ascii_data, *bin_data;
339 int leftbits = 0;
340 unsigned char this_ch;
341 unsigned int leftchar = 0;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000342 PyObject *rv;
343 int ascii_len, bin_len;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000344 int quad_pos = 0;
Tim Peters934c1a12002-07-02 22:24:50 +0000345
Guido van Rossum43713e52000-02-29 13:59:29 +0000346 if ( !PyArg_ParseTuple(args, "t#:a2b_base64", &ascii_data, &ascii_len) )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000347 return NULL;
348
Peter Schneider-Kampd895b202001-06-07 05:51:36 +0000349 if ( ascii_len == 0) {
350 PyErr_SetString(Error, "Cannot decode empty input");
351 return NULL;
352 }
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000353 bin_len = ((ascii_len+3)/4)*3; /* Upper bound, corrected later */
354
355 /* Allocate the buffer */
356 if ( (rv=PyString_FromStringAndSize(NULL, bin_len)) == NULL )
357 return NULL;
358 bin_data = (unsigned char *)PyString_AsString(rv);
359 bin_len = 0;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000360
361 for( ; ascii_len > 0; ascii_len--, ascii_data++) {
362 this_ch = *ascii_data;
363
364 if (this_ch > 0x7f ||
365 this_ch == '\r' || this_ch == '\n' || this_ch == ' ')
Jack Jansenba1de3b1996-01-22 10:47:15 +0000366 continue;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000367
368 /* Check for pad sequences and ignore
369 ** the invalid ones.
370 */
371 if (this_ch == BASE64_PAD) {
372 if ( (quad_pos < 2) ||
373 ((quad_pos == 2) &&
374 (binascii_find_valid(ascii_data, ascii_len, 1)
375 != BASE64_PAD)) )
376 {
377 continue;
378 }
379 else {
380 /* A pad sequence means no more input.
381 ** We've already interpreted the data
382 ** from the quad at this point.
383 */
384 leftbits = 0;
385 break;
386 }
387 }
388
389 this_ch = table_a2b_base64[*ascii_data];
390 if ( this_ch == (unsigned char) -1 )
391 continue;
392
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000393 /*
394 ** Shift it in on the low end, and see if there's
395 ** a byte ready for output.
396 */
Guido van Rossum2db4f471999-10-19 19:05:14 +0000397 quad_pos = (quad_pos + 1) & 0x03;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000398 leftchar = (leftchar << 6) | (this_ch);
399 leftbits += 6;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000400
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000401 if ( leftbits >= 8 ) {
402 leftbits -= 8;
403 *bin_data++ = (leftchar >> leftbits) & 0xff;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000404 bin_len++;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000405 leftchar &= ((1 << leftbits) - 1);
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000406 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000407 }
408
409 if (leftbits != 0) {
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000410 PyErr_SetString(Error, "Incorrect padding");
411 Py_DECREF(rv);
412 return NULL;
413 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000414
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000415 /* and set string size correctly */
416 _PyString_Resize(&rv, bin_len);
417 return rv;
418}
419
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000420PyDoc_STRVAR(doc_b2a_base64, "(bin) -> ascii. Base64-code line of data");
Tim Peters934c1a12002-07-02 22:24:50 +0000421
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000422static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000423binascii_b2a_base64(PyObject *self, PyObject *args)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000424{
425 unsigned char *ascii_data, *bin_data;
426 int leftbits = 0;
427 unsigned char this_ch;
428 unsigned int leftchar = 0;
429 PyObject *rv;
430 int bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000431
Guido van Rossum43713e52000-02-29 13:59:29 +0000432 if ( !PyArg_ParseTuple(args, "s#:b2a_base64", &bin_data, &bin_len) )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000433 return NULL;
434 if ( bin_len > BASE64_MAXBIN ) {
435 PyErr_SetString(Error, "Too much data for base64 line");
436 return NULL;
437 }
Tim Peters934c1a12002-07-02 22:24:50 +0000438
Tim Peters1fbb5772001-12-19 04:41:35 +0000439 /* We're lazy and allocate too much (fixed up later).
440 "+3" leaves room for up to two pad characters and a trailing
441 newline. Note that 'b' gets encoded as 'Yg==\n' (1 in, 5 out). */
442 if ( (rv=PyString_FromStringAndSize(NULL, bin_len*2 + 3)) == NULL )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000443 return NULL;
444 ascii_data = (unsigned char *)PyString_AsString(rv);
445
446 for( ; bin_len > 0 ; bin_len--, bin_data++ ) {
447 /* Shift the data into our buffer */
448 leftchar = (leftchar << 8) | *bin_data;
449 leftbits += 8;
450
451 /* See if there are 6-bit groups ready */
452 while ( leftbits >= 6 ) {
453 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
454 leftbits -= 6;
455 *ascii_data++ = table_b2a_base64[this_ch];
456 }
457 }
458 if ( leftbits == 2 ) {
459 *ascii_data++ = table_b2a_base64[(leftchar&3) << 4];
460 *ascii_data++ = BASE64_PAD;
461 *ascii_data++ = BASE64_PAD;
462 } else if ( leftbits == 4 ) {
463 *ascii_data++ = table_b2a_base64[(leftchar&0xf) << 2];
464 *ascii_data++ = BASE64_PAD;
Tim Peters934c1a12002-07-02 22:24:50 +0000465 }
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000466 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000467
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000468 _PyString_Resize(&rv, (ascii_data -
469 (unsigned char *)PyString_AsString(rv)));
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000470 return rv;
471}
472
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000473PyDoc_STRVAR(doc_a2b_hqx, "ascii -> bin, done. Decode .hqx coding");
Jack Jansen72781191995-08-07 14:34:15 +0000474
475static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000476binascii_a2b_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000477{
478 unsigned char *ascii_data, *bin_data;
479 int leftbits = 0;
480 unsigned char this_ch;
Jack Janseneaeb1c81995-08-14 12:17:57 +0000481 unsigned int leftchar = 0;
Jack Jansen72781191995-08-07 14:34:15 +0000482 PyObject *rv;
483 int len;
484 int done = 0;
Tim Peters934c1a12002-07-02 22:24:50 +0000485
Guido van Rossum43713e52000-02-29 13:59:29 +0000486 if ( !PyArg_ParseTuple(args, "t#:a2b_hqx", &ascii_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000487 return NULL;
488
489 /* Allocate a string that is too big (fixed later) */
490 if ( (rv=PyString_FromStringAndSize(NULL, len)) == NULL )
491 return NULL;
492 bin_data = (unsigned char *)PyString_AsString(rv);
493
494 for( ; len > 0 ; len--, ascii_data++ ) {
495 /* Get the byte and look it up */
496 this_ch = table_a2b_hqx[*ascii_data];
497 if ( this_ch == SKIP )
498 continue;
499 if ( this_ch == FAIL ) {
500 PyErr_SetString(Error, "Illegal char");
501 Py_DECREF(rv);
502 return NULL;
503 }
504 if ( this_ch == DONE ) {
505 /* The terminating colon */
506 done = 1;
507 break;
508 }
509
510 /* Shift it into the buffer and see if any bytes are ready */
511 leftchar = (leftchar << 6) | (this_ch);
512 leftbits += 6;
513 if ( leftbits >= 8 ) {
514 leftbits -= 8;
515 *bin_data++ = (leftchar >> leftbits) & 0xff;
516 leftchar &= ((1 << leftbits) - 1);
517 }
518 }
Tim Peters934c1a12002-07-02 22:24:50 +0000519
Jack Jansen72781191995-08-07 14:34:15 +0000520 if ( leftbits && !done ) {
521 PyErr_SetString(Incomplete,
522 "String has incomplete number of bytes");
523 Py_DECREF(rv);
524 return NULL;
525 }
Guido van Rossum9c6ba5e1997-01-12 20:02:04 +0000526 _PyString_Resize(
527 &rv, (bin_data - (unsigned char *)PyString_AsString(rv)));
528 if (rv) {
529 PyObject *rrv = Py_BuildValue("Oi", rv, done);
530 Py_DECREF(rv);
531 return rrv;
532 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000533
Jack Jansen72781191995-08-07 14:34:15 +0000534 return NULL;
535}
536
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000537PyDoc_STRVAR(doc_rlecode_hqx, "Binhex RLE-code binary data");
Jack Jansen72781191995-08-07 14:34:15 +0000538
539static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000540binascii_rlecode_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000541{
542 unsigned char *in_data, *out_data;
543 PyObject *rv;
544 unsigned char ch;
545 int in, inend, len;
Tim Peters934c1a12002-07-02 22:24:50 +0000546
Guido van Rossum43713e52000-02-29 13:59:29 +0000547 if ( !PyArg_ParseTuple(args, "s#:rlecode_hqx", &in_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000548 return NULL;
549
550 /* Worst case: output is twice as big as input (fixed later) */
551 if ( (rv=PyString_FromStringAndSize(NULL, len*2)) == NULL )
552 return NULL;
553 out_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000554
Jack Jansen72781191995-08-07 14:34:15 +0000555 for( in=0; in<len; in++) {
556 ch = in_data[in];
557 if ( ch == RUNCHAR ) {
558 /* RUNCHAR. Escape it. */
559 *out_data++ = RUNCHAR;
560 *out_data++ = 0;
561 } else {
562 /* Check how many following are the same */
563 for(inend=in+1;
564 inend<len && in_data[inend] == ch &&
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000565 inend < in+255;
Jack Jansen72781191995-08-07 14:34:15 +0000566 inend++) ;
Jack Jansen0223aa11995-08-31 13:44:23 +0000567 if ( inend - in > 3 ) {
568 /* More than 3 in a row. Output RLE. */
Jack Jansen72781191995-08-07 14:34:15 +0000569 *out_data++ = ch;
570 *out_data++ = RUNCHAR;
571 *out_data++ = inend-in;
572 in = inend-1;
573 } else {
574 /* Less than 3. Output the byte itself */
575 *out_data++ = ch;
576 }
577 }
578 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000579 _PyString_Resize(&rv, (out_data -
580 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000581 return rv;
582}
583
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000584PyDoc_STRVAR(doc_b2a_hqx, "Encode .hqx data");
Tim Peters934c1a12002-07-02 22:24:50 +0000585
Jack Jansen72781191995-08-07 14:34:15 +0000586static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000587binascii_b2a_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000588{
589 unsigned char *ascii_data, *bin_data;
590 int leftbits = 0;
591 unsigned char this_ch;
Jack Janseneaeb1c81995-08-14 12:17:57 +0000592 unsigned int leftchar = 0;
Jack Jansen72781191995-08-07 14:34:15 +0000593 PyObject *rv;
594 int len;
Tim Peters934c1a12002-07-02 22:24:50 +0000595
Guido van Rossum43713e52000-02-29 13:59:29 +0000596 if ( !PyArg_ParseTuple(args, "s#:b2a_hqx", &bin_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000597 return NULL;
598
599 /* Allocate a buffer that is at least large enough */
600 if ( (rv=PyString_FromStringAndSize(NULL, len*2)) == NULL )
601 return NULL;
602 ascii_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000603
Jack Jansen72781191995-08-07 14:34:15 +0000604 for( ; len > 0 ; len--, bin_data++ ) {
605 /* Shift into our buffer, and output any 6bits ready */
606 leftchar = (leftchar << 8) | *bin_data;
607 leftbits += 8;
608 while ( leftbits >= 6 ) {
609 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
610 leftbits -= 6;
611 *ascii_data++ = table_b2a_hqx[this_ch];
612 }
613 }
614 /* Output a possible runt byte */
615 if ( leftbits ) {
616 leftchar <<= (6-leftbits);
617 *ascii_data++ = table_b2a_hqx[leftchar & 0x3f];
618 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000619 _PyString_Resize(&rv, (ascii_data -
620 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000621 return rv;
622}
623
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000624PyDoc_STRVAR(doc_rledecode_hqx, "Decode hexbin RLE-coded string");
Tim Peters934c1a12002-07-02 22:24:50 +0000625
Jack Jansen72781191995-08-07 14:34:15 +0000626static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000627binascii_rledecode_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000628{
629 unsigned char *in_data, *out_data;
630 unsigned char in_byte, in_repeat;
631 PyObject *rv;
632 int in_len, out_len, out_len_left;
633
Guido van Rossum43713e52000-02-29 13:59:29 +0000634 if ( !PyArg_ParseTuple(args, "s#:rledecode_hqx", &in_data, &in_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000635 return NULL;
636
637 /* Empty string is a special case */
638 if ( in_len == 0 )
639 return Py_BuildValue("s", "");
640
641 /* Allocate a buffer of reasonable size. Resized when needed */
642 out_len = in_len*2;
643 if ( (rv=PyString_FromStringAndSize(NULL, out_len)) == NULL )
644 return NULL;
645 out_len_left = out_len;
646 out_data = (unsigned char *)PyString_AsString(rv);
647
648 /*
649 ** We need two macros here to get/put bytes and handle
650 ** end-of-buffer for input and output strings.
651 */
652#define INBYTE(b) \
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000653 do { \
654 if ( --in_len < 0 ) { \
655 PyErr_SetString(Incomplete, ""); \
656 Py_DECREF(rv); \
657 return NULL; \
658 } \
659 b = *in_data++; \
660 } while(0)
Tim Peters934c1a12002-07-02 22:24:50 +0000661
Jack Jansen72781191995-08-07 14:34:15 +0000662#define OUTBYTE(b) \
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000663 do { \
664 if ( --out_len_left < 0 ) { \
665 _PyString_Resize(&rv, 2*out_len); \
666 if ( rv == NULL ) return NULL; \
667 out_data = (unsigned char *)PyString_AsString(rv) \
668 + out_len; \
669 out_len_left = out_len-1; \
670 out_len = out_len * 2; \
671 } \
672 *out_data++ = b; \
673 } while(0)
Jack Jansen72781191995-08-07 14:34:15 +0000674
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000675 /*
676 ** Handle first byte separately (since we have to get angry
677 ** in case of an orphaned RLE code).
678 */
679 INBYTE(in_byte);
Jack Jansen72781191995-08-07 14:34:15 +0000680
681 if (in_byte == RUNCHAR) {
682 INBYTE(in_repeat);
683 if (in_repeat != 0) {
684 /* Note Error, not Incomplete (which is at the end
685 ** of the string only). This is a programmer error.
686 */
687 PyErr_SetString(Error, "Orphaned RLE code at start");
688 Py_DECREF(rv);
689 return NULL;
690 }
691 OUTBYTE(RUNCHAR);
692 } else {
693 OUTBYTE(in_byte);
694 }
Tim Peters934c1a12002-07-02 22:24:50 +0000695
Jack Jansen72781191995-08-07 14:34:15 +0000696 while( in_len > 0 ) {
697 INBYTE(in_byte);
698
699 if (in_byte == RUNCHAR) {
700 INBYTE(in_repeat);
701 if ( in_repeat == 0 ) {
702 /* Just an escaped RUNCHAR value */
703 OUTBYTE(RUNCHAR);
704 } else {
705 /* Pick up value and output a sequence of it */
706 in_byte = out_data[-1];
707 while ( --in_repeat > 0 )
708 OUTBYTE(in_byte);
709 }
710 } else {
711 /* Normal byte */
712 OUTBYTE(in_byte);
713 }
714 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000715 _PyString_Resize(&rv, (out_data -
716 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000717 return rv;
718}
719
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000720PyDoc_STRVAR(doc_crc_hqx,
721"(data, oldcrc) -> newcrc. Compute hqx CRC incrementally");
Jack Jansen72781191995-08-07 14:34:15 +0000722
723static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000724binascii_crc_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000725{
726 unsigned char *bin_data;
727 unsigned int crc;
728 int len;
Tim Peters934c1a12002-07-02 22:24:50 +0000729
Guido van Rossum43713e52000-02-29 13:59:29 +0000730 if ( !PyArg_ParseTuple(args, "s#i:crc_hqx", &bin_data, &len, &crc) )
Jack Jansen72781191995-08-07 14:34:15 +0000731 return NULL;
732
733 while(len--) {
734 crc=((crc<<8)&0xff00)^crctab_hqx[((crc>>8)&0xff)^*bin_data++];
735 }
736
737 return Py_BuildValue("i", crc);
738}
739
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000740PyDoc_STRVAR(doc_crc32,
741"(data, oldcrc = 0) -> newcrc. Compute CRC-32 incrementally");
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000742
743/* Crc - 32 BIT ANSI X3.66 CRC checksum files
744 Also known as: ISO 3307
745**********************************************************************|
746* *|
747* Demonstration program to compute the 32-bit CRC used as the frame *|
748* check sequence in ADCCP (ANSI X3.66, also known as FIPS PUB 71 *|
749* and FED-STD-1003, the U.S. versions of CCITT's X.25 link-level *|
750* protocol). The 32-bit FCS was added via the Federal Register, *|
751* 1 June 1982, p.23798. I presume but don't know for certain that *|
752* this polynomial is or will be included in CCITT V.41, which *|
753* defines the 16-bit CRC (often called CRC-CCITT) polynomial. FIPS *|
754* PUB 78 says that the 32-bit FCS reduces otherwise undetected *|
755* errors by a factor of 10^-5 over 16-bit FCS. *|
756* *|
757**********************************************************************|
758
759 Copyright (C) 1986 Gary S. Brown. You may use this program, or
760 code or tables extracted from it, as desired without restriction.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000761
Tim Peters934c1a12002-07-02 22:24:50 +0000762 First, the polynomial itself and its table of feedback terms. The
763 polynomial is
764 X^32+X^26+X^23+X^22+X^16+X^12+X^11+X^10+X^8+X^7+X^5+X^4+X^2+X^1+X^0
765 Note that we take it "backwards" and put the highest-order term in
766 the lowest-order bit. The X^32 term is "implied"; the LSB is the
767 X^31 term, etc. The X^0 term (usually shown as "+1") results in
768 the MSB being 1.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000769
Tim Peters934c1a12002-07-02 22:24:50 +0000770 Note that the usual hardware shift register implementation, which
771 is what we're using (we're merely optimizing it by doing eight-bit
772 chunks at a time) shifts bits into the lowest-order term. In our
773 implementation, that means shifting towards the right. Why do we
774 do it this way? Because the calculated CRC must be transmitted in
775 order from highest-order term to lowest-order term. UARTs transmit
776 characters in order from LSB to MSB. By storing the CRC this way,
777 we hand it to the UART in the order low-byte to high-byte; the UART
778 sends each low-bit to hight-bit; and the result is transmission bit
779 by bit from highest- to lowest-order term without requiring any bit
780 shuffling on our part. Reception works similarly.
781
782 The feedback terms table consists of 256, 32-bit entries. Notes:
783
784 1. The table can be generated at runtime if desired; code to do so
785 is shown later. It might not be obvious, but the feedback
786 terms simply represent the results of eight shift/xor opera-
787 tions for all combinations of data and CRC register values.
788
789 2. The CRC accumulation logic is the same for all CRC polynomials,
790 be they sixteen or thirty-two bits wide. You simply choose the
791 appropriate table. Alternatively, because the table can be
792 generated at runtime, you can start by generating the table for
793 the polynomial in question and use exactly the same "updcrc",
794 if your application needn't simultaneously handle two CRC
795 polynomials. (Note, however, that XMODEM is strange.)
796
797 3. For 16-bit CRCs, the table entries need be only 16 bits wide;
798 of course, 32-bit entries work OK if the high 16 bits are zero.
799
800 4. The values must be right-shifted by eight bits by the "updcrc"
801 logic; the shift must be unsigned (bring in zeroes). On some
802 hardware you could probably optimize the shift in assembler by
803 using byte-swap instructions.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000804********************************************************************/
805
806static unsigned long crc_32_tab[256] = {
8070x00000000UL, 0x77073096UL, 0xee0e612cUL, 0x990951baUL, 0x076dc419UL,
8080x706af48fUL, 0xe963a535UL, 0x9e6495a3UL, 0x0edb8832UL, 0x79dcb8a4UL,
8090xe0d5e91eUL, 0x97d2d988UL, 0x09b64c2bUL, 0x7eb17cbdUL, 0xe7b82d07UL,
8100x90bf1d91UL, 0x1db71064UL, 0x6ab020f2UL, 0xf3b97148UL, 0x84be41deUL,
8110x1adad47dUL, 0x6ddde4ebUL, 0xf4d4b551UL, 0x83d385c7UL, 0x136c9856UL,
8120x646ba8c0UL, 0xfd62f97aUL, 0x8a65c9ecUL, 0x14015c4fUL, 0x63066cd9UL,
8130xfa0f3d63UL, 0x8d080df5UL, 0x3b6e20c8UL, 0x4c69105eUL, 0xd56041e4UL,
8140xa2677172UL, 0x3c03e4d1UL, 0x4b04d447UL, 0xd20d85fdUL, 0xa50ab56bUL,
8150x35b5a8faUL, 0x42b2986cUL, 0xdbbbc9d6UL, 0xacbcf940UL, 0x32d86ce3UL,
8160x45df5c75UL, 0xdcd60dcfUL, 0xabd13d59UL, 0x26d930acUL, 0x51de003aUL,
8170xc8d75180UL, 0xbfd06116UL, 0x21b4f4b5UL, 0x56b3c423UL, 0xcfba9599UL,
8180xb8bda50fUL, 0x2802b89eUL, 0x5f058808UL, 0xc60cd9b2UL, 0xb10be924UL,
8190x2f6f7c87UL, 0x58684c11UL, 0xc1611dabUL, 0xb6662d3dUL, 0x76dc4190UL,
8200x01db7106UL, 0x98d220bcUL, 0xefd5102aUL, 0x71b18589UL, 0x06b6b51fUL,
8210x9fbfe4a5UL, 0xe8b8d433UL, 0x7807c9a2UL, 0x0f00f934UL, 0x9609a88eUL,
8220xe10e9818UL, 0x7f6a0dbbUL, 0x086d3d2dUL, 0x91646c97UL, 0xe6635c01UL,
8230x6b6b51f4UL, 0x1c6c6162UL, 0x856530d8UL, 0xf262004eUL, 0x6c0695edUL,
8240x1b01a57bUL, 0x8208f4c1UL, 0xf50fc457UL, 0x65b0d9c6UL, 0x12b7e950UL,
8250x8bbeb8eaUL, 0xfcb9887cUL, 0x62dd1ddfUL, 0x15da2d49UL, 0x8cd37cf3UL,
8260xfbd44c65UL, 0x4db26158UL, 0x3ab551ceUL, 0xa3bc0074UL, 0xd4bb30e2UL,
8270x4adfa541UL, 0x3dd895d7UL, 0xa4d1c46dUL, 0xd3d6f4fbUL, 0x4369e96aUL,
8280x346ed9fcUL, 0xad678846UL, 0xda60b8d0UL, 0x44042d73UL, 0x33031de5UL,
8290xaa0a4c5fUL, 0xdd0d7cc9UL, 0x5005713cUL, 0x270241aaUL, 0xbe0b1010UL,
8300xc90c2086UL, 0x5768b525UL, 0x206f85b3UL, 0xb966d409UL, 0xce61e49fUL,
8310x5edef90eUL, 0x29d9c998UL, 0xb0d09822UL, 0xc7d7a8b4UL, 0x59b33d17UL,
8320x2eb40d81UL, 0xb7bd5c3bUL, 0xc0ba6cadUL, 0xedb88320UL, 0x9abfb3b6UL,
8330x03b6e20cUL, 0x74b1d29aUL, 0xead54739UL, 0x9dd277afUL, 0x04db2615UL,
8340x73dc1683UL, 0xe3630b12UL, 0x94643b84UL, 0x0d6d6a3eUL, 0x7a6a5aa8UL,
8350xe40ecf0bUL, 0x9309ff9dUL, 0x0a00ae27UL, 0x7d079eb1UL, 0xf00f9344UL,
8360x8708a3d2UL, 0x1e01f268UL, 0x6906c2feUL, 0xf762575dUL, 0x806567cbUL,
8370x196c3671UL, 0x6e6b06e7UL, 0xfed41b76UL, 0x89d32be0UL, 0x10da7a5aUL,
8380x67dd4accUL, 0xf9b9df6fUL, 0x8ebeeff9UL, 0x17b7be43UL, 0x60b08ed5UL,
8390xd6d6a3e8UL, 0xa1d1937eUL, 0x38d8c2c4UL, 0x4fdff252UL, 0xd1bb67f1UL,
8400xa6bc5767UL, 0x3fb506ddUL, 0x48b2364bUL, 0xd80d2bdaUL, 0xaf0a1b4cUL,
8410x36034af6UL, 0x41047a60UL, 0xdf60efc3UL, 0xa867df55UL, 0x316e8eefUL,
8420x4669be79UL, 0xcb61b38cUL, 0xbc66831aUL, 0x256fd2a0UL, 0x5268e236UL,
8430xcc0c7795UL, 0xbb0b4703UL, 0x220216b9UL, 0x5505262fUL, 0xc5ba3bbeUL,
8440xb2bd0b28UL, 0x2bb45a92UL, 0x5cb36a04UL, 0xc2d7ffa7UL, 0xb5d0cf31UL,
8450x2cd99e8bUL, 0x5bdeae1dUL, 0x9b64c2b0UL, 0xec63f226UL, 0x756aa39cUL,
8460x026d930aUL, 0x9c0906a9UL, 0xeb0e363fUL, 0x72076785UL, 0x05005713UL,
8470x95bf4a82UL, 0xe2b87a14UL, 0x7bb12baeUL, 0x0cb61b38UL, 0x92d28e9bUL,
8480xe5d5be0dUL, 0x7cdcefb7UL, 0x0bdbdf21UL, 0x86d3d2d4UL, 0xf1d4e242UL,
8490x68ddb3f8UL, 0x1fda836eUL, 0x81be16cdUL, 0xf6b9265bUL, 0x6fb077e1UL,
8500x18b74777UL, 0x88085ae6UL, 0xff0f6a70UL, 0x66063bcaUL, 0x11010b5cUL,
8510x8f659effUL, 0xf862ae69UL, 0x616bffd3UL, 0x166ccf45UL, 0xa00ae278UL,
8520xd70dd2eeUL, 0x4e048354UL, 0x3903b3c2UL, 0xa7672661UL, 0xd06016f7UL,
8530x4969474dUL, 0x3e6e77dbUL, 0xaed16a4aUL, 0xd9d65adcUL, 0x40df0b66UL,
8540x37d83bf0UL, 0xa9bcae53UL, 0xdebb9ec5UL, 0x47b2cf7fUL, 0x30b5ffe9UL,
8550xbdbdf21cUL, 0xcabac28aUL, 0x53b39330UL, 0x24b4a3a6UL, 0xbad03605UL,
8560xcdd70693UL, 0x54de5729UL, 0x23d967bfUL, 0xb3667a2eUL, 0xc4614ab8UL,
8570x5d681b02UL, 0x2a6f2b94UL, 0xb40bbe37UL, 0xc30c8ea1UL, 0x5a05df1bUL,
8580x2d02ef8dUL
859};
860
861static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000862binascii_crc32(PyObject *self, PyObject *args)
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000863{ /* By Jim Ahlstrom; All rights transferred to CNRI */
864 unsigned char *bin_data;
865 unsigned long crc = 0UL; /* initial value of CRC */
866 int len;
Tim Petersa98011c2002-07-02 20:20:08 +0000867 long result;
Tim Peters934c1a12002-07-02 22:24:50 +0000868
Guido van Rossum43713e52000-02-29 13:59:29 +0000869 if ( !PyArg_ParseTuple(args, "s#|l:crc32", &bin_data, &len, &crc) )
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000870 return NULL;
871
Tim Peters934c1a12002-07-02 22:24:50 +0000872 crc = ~ crc;
873#if SIZEOF_LONG > 4
874 /* only want the trailing 32 bits */
875 crc &= 0xFFFFFFFFUL;
876#endif
877 while (len--)
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000878 crc = crc_32_tab[(crc ^ *bin_data++) & 0xffUL] ^ (crc >> 8);
879 /* Note: (crc >> 8) MUST zero fill on left */
Tim Petersa98011c2002-07-02 20:20:08 +0000880
881 result = (long)(crc ^ 0xFFFFFFFFUL);
Tim Peters934c1a12002-07-02 22:24:50 +0000882#if SIZEOF_LONG > 4
883 /* Extend the sign bit. This is one way to ensure the result is the
884 * same across platforms. The other way would be to return an
885 * unbounded unsigned long, but the evidence suggests that lots of
886 * code outside this treats the result as if it were a signed 4-byte
887 * integer.
Tim Petersa98011c2002-07-02 20:20:08 +0000888 */
889 result |= -(result & (1L << 31));
Tim Peters934c1a12002-07-02 22:24:50 +0000890#endif
Tim Petersa98011c2002-07-02 20:20:08 +0000891 return PyInt_FromLong(result);
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000892}
893
Barry Warsawe977c212000-08-15 06:07:13 +0000894
895static PyObject *
896binascii_hexlify(PyObject *self, PyObject *args)
897{
898 char* argbuf;
899 int arglen;
900 PyObject *retval;
901 char* retbuf;
902 int i, j;
903
904 if (!PyArg_ParseTuple(args, "t#:b2a_hex", &argbuf, &arglen))
905 return NULL;
906
907 retval = PyString_FromStringAndSize(NULL, arglen*2);
908 if (!retval)
909 return NULL;
910 retbuf = PyString_AsString(retval);
911 if (!retbuf)
912 goto finally;
913
914 /* make hex version of string, taken from shamodule.c */
915 for (i=j=0; i < arglen; i++) {
916 char c;
917 c = (argbuf[i] >> 4) & 0xf;
918 c = (c>9) ? c+'a'-10 : c + '0';
919 retbuf[j++] = c;
920 c = argbuf[i] & 0xf;
921 c = (c>9) ? c+'a'-10 : c + '0';
922 retbuf[j++] = c;
923 }
924 return retval;
925
926 finally:
927 Py_DECREF(retval);
928 return NULL;
929}
930
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000931PyDoc_STRVAR(doc_hexlify,
Barry Warsawe977c212000-08-15 06:07:13 +0000932"b2a_hex(data) -> s; Hexadecimal representation of binary data.\n\
933\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000934This function is also available as \"hexlify()\".");
Barry Warsawe977c212000-08-15 06:07:13 +0000935
936
937static int
Tim Peters934c1a12002-07-02 22:24:50 +0000938to_int(int c)
Barry Warsawe977c212000-08-15 06:07:13 +0000939{
940 if (isdigit(c))
941 return c - '0';
942 else {
943 if (isupper(c))
944 c = tolower(c);
945 if (c >= 'a' && c <= 'f')
946 return c - 'a' + 10;
947 }
948 return -1;
949}
950
951
952static PyObject *
953binascii_unhexlify(PyObject *self, PyObject *args)
954{
955 char* argbuf;
956 int arglen;
957 PyObject *retval;
958 char* retbuf;
959 int i, j;
960
961 if (!PyArg_ParseTuple(args, "s#:a2b_hex", &argbuf, &arglen))
962 return NULL;
963
Barry Warsaw16168472000-08-15 06:59:58 +0000964 /* XXX What should we do about strings with an odd length? Should
965 * we add an implicit leading zero, or a trailing zero? For now,
966 * raise an exception.
Barry Warsawe977c212000-08-15 06:07:13 +0000967 */
968 if (arglen % 2) {
Barry Warsaw16168472000-08-15 06:59:58 +0000969 PyErr_SetString(PyExc_TypeError, "Odd-length string");
Barry Warsawe977c212000-08-15 06:07:13 +0000970 return NULL;
971 }
972
973 retval = PyString_FromStringAndSize(NULL, (arglen/2));
974 if (!retval)
975 return NULL;
976 retbuf = PyString_AsString(retval);
977 if (!retbuf)
978 goto finally;
979
980 for (i=j=0; i < arglen; i += 2) {
981 int top = to_int(Py_CHARMASK(argbuf[i]));
982 int bot = to_int(Py_CHARMASK(argbuf[i+1]));
983 if (top == -1 || bot == -1) {
984 PyErr_SetString(PyExc_TypeError,
Barry Warsaw16168472000-08-15 06:59:58 +0000985 "Non-hexadecimal digit found");
Barry Warsawe977c212000-08-15 06:07:13 +0000986 goto finally;
987 }
988 retbuf[j++] = (top << 4) + bot;
989 }
990 return retval;
991
992 finally:
993 Py_DECREF(retval);
994 return NULL;
995}
996
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000997PyDoc_STRVAR(doc_unhexlify,
Barry Warsawe977c212000-08-15 06:07:13 +0000998"a2b_hex(hexstr) -> s; Binary data of hexadecimal representation.\n\
999\n\
1000hexstr must contain an even number of hex digits (upper or lower case).\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001001This function is also available as \"unhexlify()\"");
Barry Warsawe977c212000-08-15 06:07:13 +00001002
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001003static int table_hex[128] = {
1004 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1005 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1006 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1007 0, 1, 2, 3, 4, 5, 6, 7, 8, 9,-1,-1, -1,-1,-1,-1,
1008 -1,10,11,12, 13,14,15,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1009 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1010 -1,10,11,12, 13,14,15,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1011 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1
1012};
1013
1014#define hexval(c) table_hex[(unsigned int)(c)]
1015
1016#define MAXLINESIZE 76
1017
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001018PyDoc_STRVAR(doc_a2b_qp, "Decode a string of qp-encoded data");
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001019
Tim Peters934c1a12002-07-02 22:24:50 +00001020static PyObject*
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001021binascii_a2b_qp(PyObject *self, PyObject *args, PyObject *kwargs)
1022{
1023 unsigned int in, out;
1024 char ch;
1025 unsigned char *data, *odata;
1026 unsigned int datalen = 0;
1027 PyObject *rv;
1028 static char *kwlist[] = {"data", "header", NULL};
1029 int header = 0;
1030
Tim Peters934c1a12002-07-02 22:24:50 +00001031 if (!PyArg_ParseTupleAndKeywords(args, kwargs, "s#|i", kwlist, &data,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001032 &datalen, &header))
1033 return NULL;
1034
1035 /* We allocate the output same size as input, this is overkill */
Greg Warda645b302001-10-04 14:54:53 +00001036 odata = (unsigned char *) calloc(1, datalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001037
1038 if (odata == NULL) {
1039 PyErr_NoMemory();
1040 return NULL;
1041 }
1042
1043 in = out = 0;
1044 while (in < datalen) {
1045 if (data[in] == '=') {
1046 in++;
1047 if (in >= datalen) break;
1048 /* Soft line breaks */
Tim Peters934c1a12002-07-02 22:24:50 +00001049 if ((data[in] == '\n') || (data[in] == '\r') ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001050 (data[in] == ' ') || (data[in] == '\t')) {
1051 if (data[in] != '\n') {
1052 while (in < datalen && data[in] != '\n') in++;
1053 }
1054 if (in < datalen) in++;
1055 }
1056 else if (data[in] == '=') {
1057 /* broken case from broken python qp */
1058 odata[out++] = '=';
1059 in++;
1060 }
Tim Peters934c1a12002-07-02 22:24:50 +00001061 else if (((data[in] >= 'A' && data[in] <= 'F') ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001062 (data[in] >= 'a' && data[in] <= 'f') ||
1063 (data[in] >= '0' && data[in] <= '9')) &&
1064 ((data[in+1] >= 'A' && data[in+1] <= 'F') ||
1065 (data[in+1] >= 'a' && data[in+1] <= 'f') ||
1066 (data[in+1] >= '0' && data[in+1] <= '9'))) {
1067 /* hexval */
1068 ch = hexval(data[in]) << 4;
1069 in++;
1070 ch |= hexval(data[in]);
1071 in++;
1072 odata[out++] = ch;
1073 }
1074 else {
1075 odata[out++] = '=';
1076 }
1077 }
1078 else if (header && data[in] == '_') {
1079 odata[out++] = ' ';
1080 in++;
1081 }
1082 else {
1083 odata[out] = data[in];
1084 in++;
1085 out++;
1086 }
1087 }
Greg Warda645b302001-10-04 14:54:53 +00001088 if ((rv = PyString_FromStringAndSize((char *)odata, out)) == NULL) {
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001089 free (odata);
1090 return NULL;
1091 }
1092 free (odata);
1093 return rv;
1094}
1095
Tim Peters934c1a12002-07-02 22:24:50 +00001096static int
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001097to_hex (unsigned char ch, unsigned char *s)
1098{
1099 unsigned int uvalue = ch;
1100
1101 s[1] = "0123456789ABCDEF"[uvalue % 16];
1102 uvalue = (uvalue / 16);
1103 s[0] = "0123456789ABCDEF"[uvalue % 16];
1104 return 0;
1105}
1106
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001107PyDoc_STRVAR(doc_b2a_qp,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001108"b2a_qp(data, quotetabs=0, istext=1, header=0) -> s; \n\
1109 Encode a string using quoted-printable encoding. \n\
1110\n\
1111On encoding, when istext is set, newlines are not encoded, and white \n\
1112space at end of lines is. When istext is not set, \\r and \\n (CR/LF) are \n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001113both encoded. When quotetabs is set, space and tabs are encoded.");
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001114
1115/* XXX: This is ridiculously complicated to be backward compatible
1116 * (mostly) with the quopri module. It doesn't re-create the quopri
1117 * module bug where text ending in CRLF has the CR encoded */
Tim Peters934c1a12002-07-02 22:24:50 +00001118static PyObject*
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001119binascii_b2a_qp (PyObject *self, PyObject *args, PyObject *kwargs)
1120{
1121 unsigned int in, out;
1122 unsigned char *data, *odata;
1123 unsigned int datalen = 0, odatalen = 0;
1124 PyObject *rv;
1125 unsigned int linelen = 0;
1126 static char *kwlist[] = {"data", "quotetabs", "istext", "header", NULL};
1127 int istext = 1;
1128 int quotetabs = 0;
1129 int header = 0;
1130 unsigned char ch;
1131 int crlf = 0;
1132 unsigned char *p;
1133
Tim Peters934c1a12002-07-02 22:24:50 +00001134 if (!PyArg_ParseTupleAndKeywords(args, kwargs, "s#|iii", kwlist, &data,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001135 &datalen, &quotetabs, &istext, &header))
1136 return NULL;
1137
1138 /* See if this string is using CRLF line ends */
1139 /* XXX: this function has the side effect of converting all of
1140 * the end of lines to be the same depending on this detection
1141 * here */
Greg Warda645b302001-10-04 14:54:53 +00001142 p = (unsigned char *) strchr((char *)data, '\n');
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001143 if ((p != NULL) && (p > data) && (*(p-1) == '\r'))
1144 crlf = 1;
1145
1146 /* First, scan to see how many characters need to be encoded */
1147 in = 0;
1148 while (in < datalen) {
Tim Peters934c1a12002-07-02 22:24:50 +00001149 if ((data[in] > 126) ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001150 (data[in] == '=') ||
1151 (header && data[in] == '_') ||
1152 ((data[in] == '.') && (linelen == 1)) ||
1153 (!istext && ((data[in] == '\r') || (data[in] == '\n'))) ||
1154 ((data[in] == '\t' || data[in] == ' ') && (in + 1 == datalen)) ||
Tim Peters934c1a12002-07-02 22:24:50 +00001155 ((data[in] < 33) &&
1156 (data[in] != '\r') && (data[in] != '\n') &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001157 (quotetabs && ((data[in] != '\t') || (data[in] != ' ')))))
1158 {
1159 if ((linelen + 3) >= MAXLINESIZE) {
1160 linelen = 0;
1161 if (crlf)
1162 odatalen += 3;
1163 else
1164 odatalen += 2;
1165 }
1166 linelen += 3;
1167 odatalen += 3;
1168 in++;
1169 }
1170 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001171 if (istext &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001172 ((data[in] == '\n') ||
1173 ((in+1 < datalen) && (data[in] == '\r') &&
1174 (data[in+1] == '\n'))))
1175 {
1176 linelen = 0;
1177 /* Protect against whitespace on end of line */
1178 if (in && ((data[in-1] == ' ') || (data[in-1] == '\t')))
1179 odatalen += 2;
1180 if (crlf)
1181 odatalen += 2;
1182 else
1183 odatalen += 1;
1184 if (data[in] == '\r')
1185 in += 2;
1186 else
1187 in++;
1188 }
1189 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001190 if ((in + 1 != datalen) &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001191 (data[in+1] != '\n') &&
1192 (linelen + 1) >= MAXLINESIZE) {
1193 linelen = 0;
1194 if (crlf)
1195 odatalen += 3;
1196 else
1197 odatalen += 2;
1198 }
1199 linelen++;
1200 odatalen++;
1201 in++;
1202 }
1203 }
1204 }
1205
Greg Warda645b302001-10-04 14:54:53 +00001206 odata = (unsigned char *) calloc(1, odatalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001207
1208 if (odata == NULL) {
1209 PyErr_NoMemory();
1210 return NULL;
1211 }
1212
1213 in = out = linelen = 0;
1214 while (in < datalen) {
Tim Peters934c1a12002-07-02 22:24:50 +00001215 if ((data[in] > 126) ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001216 (data[in] == '=') ||
1217 (header && data[in] == '_') ||
1218 ((data[in] == '.') && (linelen == 1)) ||
1219 (!istext && ((data[in] == '\r') || (data[in] == '\n'))) ||
1220 ((data[in] == '\t' || data[in] == ' ') && (in + 1 == datalen)) ||
Tim Peters934c1a12002-07-02 22:24:50 +00001221 ((data[in] < 33) &&
1222 (data[in] != '\r') && (data[in] != '\n') &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001223 (quotetabs && ((data[in] != '\t') || (data[in] != ' ')))))
1224 {
1225 if ((linelen + 3 )>= MAXLINESIZE) {
1226 odata[out++] = '=';
1227 if (crlf) odata[out++] = '\r';
1228 odata[out++] = '\n';
1229 linelen = 0;
1230 }
1231 odata[out++] = '=';
1232 to_hex(data[in], &odata[out]);
1233 out += 2;
1234 in++;
1235 linelen += 3;
1236 }
1237 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001238 if (istext &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001239 ((data[in] == '\n') ||
1240 ((in+1 < datalen) && (data[in] == '\r') &&
1241 (data[in+1] == '\n'))))
1242 {
1243 linelen = 0;
1244 /* Protect against whitespace on end of line */
1245 if (out && ((odata[out-1] == ' ') || (odata[out-1] == '\t'))) {
1246 ch = odata[out-1];
1247 odata[out-1] = '=';
1248 to_hex(ch, &odata[out]);
1249 out += 2;
1250 }
Tim Peters934c1a12002-07-02 22:24:50 +00001251
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001252 if (crlf) odata[out++] = '\r';
1253 odata[out++] = '\n';
1254 if (data[in] == '\r')
1255 in += 2;
1256 else
1257 in++;
1258 }
1259 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001260 if ((in + 1 != datalen) &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001261 (data[in+1] != '\n') &&
1262 (linelen + 1) >= MAXLINESIZE) {
1263 odata[out++] = '=';
1264 if (crlf) odata[out++] = '\r';
1265 odata[out++] = '\n';
1266 linelen = 0;
1267 }
1268 linelen++;
1269 if (header && data[in] == ' ') {
1270 odata[out++] = '_';
1271 in++;
1272 }
1273 else {
1274 odata[out++] = data[in++];
1275 }
1276 }
1277 }
1278 }
Greg Warda645b302001-10-04 14:54:53 +00001279 if ((rv = PyString_FromStringAndSize((char *)odata, out)) == NULL) {
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001280 free (odata);
1281 return NULL;
1282 }
1283 free (odata);
1284 return rv;
1285}
Barry Warsawe977c212000-08-15 06:07:13 +00001286
Jack Jansen72781191995-08-07 14:34:15 +00001287/* List of functions defined in the module */
1288
1289static struct PyMethodDef binascii_module_methods[] = {
Barry Warsawe977c212000-08-15 06:07:13 +00001290 {"a2b_uu", binascii_a2b_uu, METH_VARARGS, doc_a2b_uu},
1291 {"b2a_uu", binascii_b2a_uu, METH_VARARGS, doc_b2a_uu},
1292 {"a2b_base64", binascii_a2b_base64, METH_VARARGS, doc_a2b_base64},
1293 {"b2a_base64", binascii_b2a_base64, METH_VARARGS, doc_b2a_base64},
1294 {"a2b_hqx", binascii_a2b_hqx, METH_VARARGS, doc_a2b_hqx},
1295 {"b2a_hqx", binascii_b2a_hqx, METH_VARARGS, doc_b2a_hqx},
1296 {"b2a_hex", binascii_hexlify, METH_VARARGS, doc_hexlify},
1297 {"a2b_hex", binascii_unhexlify, METH_VARARGS, doc_unhexlify},
1298 {"hexlify", binascii_hexlify, METH_VARARGS, doc_hexlify},
1299 {"unhexlify", binascii_unhexlify, METH_VARARGS, doc_unhexlify},
1300 {"rlecode_hqx", binascii_rlecode_hqx, METH_VARARGS, doc_rlecode_hqx},
1301 {"rledecode_hqx", binascii_rledecode_hqx, METH_VARARGS,
1302 doc_rledecode_hqx},
1303 {"crc_hqx", binascii_crc_hqx, METH_VARARGS, doc_crc_hqx},
1304 {"crc32", binascii_crc32, METH_VARARGS, doc_crc32},
Tim Peters934c1a12002-07-02 22:24:50 +00001305 {"a2b_qp", (PyCFunction)binascii_a2b_qp, METH_VARARGS | METH_KEYWORDS,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001306 doc_a2b_qp},
Tim Peters934c1a12002-07-02 22:24:50 +00001307 {"b2a_qp", (PyCFunction)binascii_b2a_qp, METH_VARARGS | METH_KEYWORDS,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001308 doc_b2a_qp},
Barry Warsawe977c212000-08-15 06:07:13 +00001309 {NULL, NULL} /* sentinel */
Jack Jansen72781191995-08-07 14:34:15 +00001310};
1311
1312
1313/* Initialization function for the module (*must* be called initbinascii) */
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001314PyDoc_STRVAR(doc_binascii, "Conversion between binary data and ASCII");
Jack Jansen72781191995-08-07 14:34:15 +00001315
Guido van Rossum3886bb61998-12-04 18:50:17 +00001316DL_EXPORT(void)
Thomas Woutersf3f33dc2000-07-21 06:00:07 +00001317initbinascii(void)
Jack Jansen72781191995-08-07 14:34:15 +00001318{
1319 PyObject *m, *d, *x;
1320
1321 /* Create the module and add the functions */
1322 m = Py_InitModule("binascii", binascii_module_methods);
1323
1324 d = PyModule_GetDict(m);
1325 x = PyString_FromString(doc_binascii);
1326 PyDict_SetItemString(d, "__doc__", x);
Guido van Rossum5c159bd1997-08-04 23:55:25 +00001327 Py_XDECREF(x);
Jack Jansen72781191995-08-07 14:34:15 +00001328
Guido van Rossum7dbb48a1997-10-08 15:26:07 +00001329 Error = PyErr_NewException("binascii.Error", NULL, NULL);
Jack Jansen72781191995-08-07 14:34:15 +00001330 PyDict_SetItemString(d, "Error", Error);
Guido van Rossum7dbb48a1997-10-08 15:26:07 +00001331 Incomplete = PyErr_NewException("binascii.Incomplete", NULL, NULL);
Jack Jansen72781191995-08-07 14:34:15 +00001332 PyDict_SetItemString(d, "Incomplete", Incomplete);
Jack Jansen72781191995-08-07 14:34:15 +00001333}