blob: 05964c9351cc059e699558055b8574882cc17f8c [file] [log] [blame]
Jack Jansen72781191995-08-07 14:34:15 +00001/*
2** Routines to represent binary data in ASCII and vice-versa
3**
4** This module currently supports the following encodings:
5** uuencode:
6** each line encodes 45 bytes (except possibly the last)
7** First char encodes (binary) length, rest data
8** each char encodes 6 bits, as follows:
9** binary: 01234567 abcdefgh ijklmnop
10** ascii: 012345 67abcd efghij klmnop
11** ASCII encoding method is "excess-space": 000000 is encoded as ' ', etc.
12** short binary data is zero-extended (so the bits are always in the
13** right place), this does *not* reflect in the length.
Jack Jansen84bbc2e1995-10-04 16:38:44 +000014** base64:
15** Line breaks are insignificant, but lines are at most 76 chars
16** each char encodes 6 bits, in similar order as uucode/hqx. Encoding
17** is done via a table.
18** Short binary data is filled (in ASCII) with '='.
Jack Jansen72781191995-08-07 14:34:15 +000019** hqx:
20** File starts with introductory text, real data starts and ends
21** with colons.
22** Data consists of three similar parts: info, datafork, resourcefork.
23** Each part is protected (at the end) with a 16-bit crc
24** The binary data is run-length encoded, and then ascii-fied:
25** binary: 01234567 abcdefgh ijklmnop
26** ascii: 012345 67abcd efghij klmnop
27** ASCII encoding is table-driven, see the code.
28** Short binary data results in the runt ascii-byte being output with
29** the bits in the right place.
30**
31** While I was reading dozens of programs that encode or decode the formats
32** here (documentation? hihi:-) I have formulated Jansen's Observation:
33**
34** Programs that encode binary data in ASCII are written in
35** such a style that they are as unreadable as possible. Devices used
36** include unnecessary global variables, burying important tables
37** in unrelated sourcefiles, putting functions in include files,
38** using seemingly-descriptive variable names for different purposes,
39** calls to empty subroutines and a host of others.
40**
41** I have attempted to break with this tradition, but I guess that that
42** does make the performance sub-optimal. Oh well, too bad...
43**
44** Jack Jansen, CWI, July 1995.
Tim Peters934c1a12002-07-02 22:24:50 +000045**
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000046** Added support for quoted-printable encoding, based on rfc 1521 et al
Tim Peters934c1a12002-07-02 22:24:50 +000047** quoted-printable encoding specifies that non printable characters (anything
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000048** below 32 and above 126) be encoded as =XX where XX is the hexadecimal value
49** of the character. It also specifies some other behavior to enable 8bit data
Tim Peters934c1a12002-07-02 22:24:50 +000050** in a mail message with little difficulty (maximum line sizes, protecting
51** some cases of whitespace, etc).
Martin v. Löwis16dc7f42001-09-30 20:32:11 +000052**
53** Brandon Long, September 2001.
Jack Jansen72781191995-08-07 14:34:15 +000054*/
55
56
57#include "Python.h"
58
59static PyObject *Error;
60static PyObject *Incomplete;
61
62/*
63** hqx lookup table, ascii->binary.
64*/
65
66#define RUNCHAR 0x90
67
68#define DONE 0x7F
69#define SKIP 0x7E
70#define FAIL 0x7D
71
72static unsigned char table_a2b_hqx[256] = {
73/* ^@ ^A ^B ^C ^D ^E ^F ^G */
74/* 0*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
75/* \b \t \n ^K ^L \r ^N ^O */
76/* 1*/ FAIL, FAIL, SKIP, FAIL, FAIL, SKIP, FAIL, FAIL,
77/* ^P ^Q ^R ^S ^T ^U ^V ^W */
78/* 2*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
79/* ^X ^Y ^Z ^[ ^\ ^] ^^ ^_ */
80/* 3*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
81/* ! " # $ % & ' */
82/* 4*/ FAIL, 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06,
83/* ( ) * + , - . / */
84/* 5*/ 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x0C, FAIL, FAIL,
85/* 0 1 2 3 4 5 6 7 */
86/* 6*/ 0x0D, 0x0E, 0x0F, 0x10, 0x11, 0x12, 0x13, FAIL,
87/* 8 9 : ; < = > ? */
88/* 7*/ 0x14, 0x15, DONE, FAIL, FAIL, FAIL, FAIL, FAIL,
89/* @ A B C D E F G */
90/* 8*/ 0x16, 0x17, 0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D,
91/* H I J K L M N O */
92/* 9*/ 0x1E, 0x1F, 0x20, 0x21, 0x22, 0x23, 0x24, FAIL,
93/* P Q R S T U V W */
94/*10*/ 0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x2B, FAIL,
95/* X Y Z [ \ ] ^ _ */
96/*11*/ 0x2C, 0x2D, 0x2E, 0x2F, FAIL, FAIL, FAIL, FAIL,
97/* ` a b c d e f g */
98/*12*/ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, FAIL,
99/* h i j k l m n o */
100/*13*/ 0x37, 0x38, 0x39, 0x3A, 0x3B, 0x3C, FAIL, FAIL,
101/* p q r s t u v w */
102/*14*/ 0x3D, 0x3E, 0x3F, FAIL, FAIL, FAIL, FAIL, FAIL,
103/* x y z { | } ~ ^? */
104/*15*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
105/*16*/ FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
106 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
107 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
108 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
109 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
110 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
111 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
112 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
113 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
114 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
115 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
116 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
117 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
118 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
119 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
120 FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL, FAIL,
121};
122
123static unsigned char table_b2a_hqx[] =
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000124"!\"#$%&'()*+,-012345689@ABCDEFGHIJKLMNPQRSTUVXYZ[`abcdefhijklmpqr";
Jack Jansen72781191995-08-07 14:34:15 +0000125
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000126static char table_a2b_base64[] = {
127 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
128 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
129 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,62, -1,-1,-1,63,
130 52,53,54,55, 56,57,58,59, 60,61,-1,-1, -1, 0,-1,-1, /* Note PAD->0 */
131 -1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9,10, 11,12,13,14,
132 15,16,17,18, 19,20,21,22, 23,24,25,-1, -1,-1,-1,-1,
133 -1,26,27,28, 29,30,31,32, 33,34,35,36, 37,38,39,40,
134 41,42,43,44, 45,46,47,48, 49,50,51,-1, -1,-1,-1,-1
135};
136
137#define BASE64_PAD '='
Guido van Rossum355bc0c2001-10-30 03:00:52 +0000138
139/* Max binary chunk size; limited only by available memory */
Tim Peters1fbb5772001-12-19 04:41:35 +0000140#define BASE64_MAXBIN (INT_MAX/2 - sizeof(PyStringObject) - 3)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000141
142static unsigned char table_b2a_base64[] =
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000143"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000144
145
146
Jack Jansen72781191995-08-07 14:34:15 +0000147static unsigned short crctab_hqx[256] = {
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000148 0x0000, 0x1021, 0x2042, 0x3063, 0x4084, 0x50a5, 0x60c6, 0x70e7,
149 0x8108, 0x9129, 0xa14a, 0xb16b, 0xc18c, 0xd1ad, 0xe1ce, 0xf1ef,
150 0x1231, 0x0210, 0x3273, 0x2252, 0x52b5, 0x4294, 0x72f7, 0x62d6,
151 0x9339, 0x8318, 0xb37b, 0xa35a, 0xd3bd, 0xc39c, 0xf3ff, 0xe3de,
152 0x2462, 0x3443, 0x0420, 0x1401, 0x64e6, 0x74c7, 0x44a4, 0x5485,
153 0xa56a, 0xb54b, 0x8528, 0x9509, 0xe5ee, 0xf5cf, 0xc5ac, 0xd58d,
154 0x3653, 0x2672, 0x1611, 0x0630, 0x76d7, 0x66f6, 0x5695, 0x46b4,
155 0xb75b, 0xa77a, 0x9719, 0x8738, 0xf7df, 0xe7fe, 0xd79d, 0xc7bc,
156 0x48c4, 0x58e5, 0x6886, 0x78a7, 0x0840, 0x1861, 0x2802, 0x3823,
157 0xc9cc, 0xd9ed, 0xe98e, 0xf9af, 0x8948, 0x9969, 0xa90a, 0xb92b,
158 0x5af5, 0x4ad4, 0x7ab7, 0x6a96, 0x1a71, 0x0a50, 0x3a33, 0x2a12,
159 0xdbfd, 0xcbdc, 0xfbbf, 0xeb9e, 0x9b79, 0x8b58, 0xbb3b, 0xab1a,
160 0x6ca6, 0x7c87, 0x4ce4, 0x5cc5, 0x2c22, 0x3c03, 0x0c60, 0x1c41,
161 0xedae, 0xfd8f, 0xcdec, 0xddcd, 0xad2a, 0xbd0b, 0x8d68, 0x9d49,
162 0x7e97, 0x6eb6, 0x5ed5, 0x4ef4, 0x3e13, 0x2e32, 0x1e51, 0x0e70,
163 0xff9f, 0xefbe, 0xdfdd, 0xcffc, 0xbf1b, 0xaf3a, 0x9f59, 0x8f78,
164 0x9188, 0x81a9, 0xb1ca, 0xa1eb, 0xd10c, 0xc12d, 0xf14e, 0xe16f,
165 0x1080, 0x00a1, 0x30c2, 0x20e3, 0x5004, 0x4025, 0x7046, 0x6067,
166 0x83b9, 0x9398, 0xa3fb, 0xb3da, 0xc33d, 0xd31c, 0xe37f, 0xf35e,
167 0x02b1, 0x1290, 0x22f3, 0x32d2, 0x4235, 0x5214, 0x6277, 0x7256,
168 0xb5ea, 0xa5cb, 0x95a8, 0x8589, 0xf56e, 0xe54f, 0xd52c, 0xc50d,
169 0x34e2, 0x24c3, 0x14a0, 0x0481, 0x7466, 0x6447, 0x5424, 0x4405,
170 0xa7db, 0xb7fa, 0x8799, 0x97b8, 0xe75f, 0xf77e, 0xc71d, 0xd73c,
171 0x26d3, 0x36f2, 0x0691, 0x16b0, 0x6657, 0x7676, 0x4615, 0x5634,
172 0xd94c, 0xc96d, 0xf90e, 0xe92f, 0x99c8, 0x89e9, 0xb98a, 0xa9ab,
173 0x5844, 0x4865, 0x7806, 0x6827, 0x18c0, 0x08e1, 0x3882, 0x28a3,
174 0xcb7d, 0xdb5c, 0xeb3f, 0xfb1e, 0x8bf9, 0x9bd8, 0xabbb, 0xbb9a,
175 0x4a75, 0x5a54, 0x6a37, 0x7a16, 0x0af1, 0x1ad0, 0x2ab3, 0x3a92,
176 0xfd2e, 0xed0f, 0xdd6c, 0xcd4d, 0xbdaa, 0xad8b, 0x9de8, 0x8dc9,
177 0x7c26, 0x6c07, 0x5c64, 0x4c45, 0x3ca2, 0x2c83, 0x1ce0, 0x0cc1,
178 0xef1f, 0xff3e, 0xcf5d, 0xdf7c, 0xaf9b, 0xbfba, 0x8fd9, 0x9ff8,
179 0x6e17, 0x7e36, 0x4e55, 0x5e74, 0x2e93, 0x3eb2, 0x0ed1, 0x1ef0,
Jack Jansen72781191995-08-07 14:34:15 +0000180};
181
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000182PyDoc_STRVAR(doc_a2b_uu, "(ascii) -> bin. Decode a line of uuencoded data");
Jack Jansen72781191995-08-07 14:34:15 +0000183
184static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000185binascii_a2b_uu(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000186{
187 unsigned char *ascii_data, *bin_data;
188 int leftbits = 0;
189 unsigned char this_ch;
190 unsigned int leftchar = 0;
191 PyObject *rv;
192 int ascii_len, bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000193
Guido van Rossum43713e52000-02-29 13:59:29 +0000194 if ( !PyArg_ParseTuple(args, "t#:a2b_uu", &ascii_data, &ascii_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000195 return NULL;
196
197 /* First byte: binary data length (in bytes) */
198 bin_len = (*ascii_data++ - ' ') & 077;
199 ascii_len--;
200
201 /* Allocate the buffer */
202 if ( (rv=PyString_FromStringAndSize(NULL, bin_len)) == NULL )
203 return NULL;
204 bin_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000205
Jack Jansen72781191995-08-07 14:34:15 +0000206 for( ; bin_len > 0 ; ascii_len--, ascii_data++ ) {
207 this_ch = *ascii_data;
208 if ( this_ch == '\n' || this_ch == '\r' || ascii_len <= 0) {
209 /*
210 ** Whitespace. Assume some spaces got eaten at
211 ** end-of-line. (We check this later)
212 */
213 this_ch = 0;
214 } else {
Jack Jansen5d957971995-11-14 10:35:19 +0000215 /* Check the character for legality
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000216 ** The 64 in stead of the expected 63 is because
217 ** there are a few uuencodes out there that use
Guido van Rossum92d89172001-01-09 02:11:57 +0000218 ** '`' as zero instead of space.
Jack Jansen5d957971995-11-14 10:35:19 +0000219 */
220 if ( this_ch < ' ' || this_ch > (' ' + 64)) {
Jack Jansen72781191995-08-07 14:34:15 +0000221 PyErr_SetString(Error, "Illegal char");
222 Py_DECREF(rv);
223 return NULL;
224 }
225 this_ch = (this_ch - ' ') & 077;
226 }
227 /*
228 ** Shift it in on the low end, and see if there's
229 ** a byte ready for output.
230 */
231 leftchar = (leftchar << 6) | (this_ch);
232 leftbits += 6;
233 if ( leftbits >= 8 ) {
234 leftbits -= 8;
235 *bin_data++ = (leftchar >> leftbits) & 0xff;
236 leftchar &= ((1 << leftbits) - 1);
237 bin_len--;
238 }
239 }
240 /*
241 ** Finally, check that if there's anything left on the line
242 ** that it's whitespace only.
243 */
244 while( ascii_len-- > 0 ) {
245 this_ch = *ascii_data++;
Guido van Rossum92d89172001-01-09 02:11:57 +0000246 /* Extra '`' may be written as padding in some cases */
247 if ( this_ch != ' ' && this_ch != ' '+64 &&
Guido van Rossum1243ae71997-07-11 18:36:28 +0000248 this_ch != '\n' && this_ch != '\r' ) {
Jack Jansen72781191995-08-07 14:34:15 +0000249 PyErr_SetString(Error, "Trailing garbage");
250 Py_DECREF(rv);
251 return NULL;
252 }
253 }
254 return rv;
255}
256
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000257PyDoc_STRVAR(doc_b2a_uu, "(bin) -> ascii. Uuencode line of data");
Tim Peters934c1a12002-07-02 22:24:50 +0000258
Jack Jansen72781191995-08-07 14:34:15 +0000259static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000260binascii_b2a_uu(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000261{
262 unsigned char *ascii_data, *bin_data;
263 int leftbits = 0;
264 unsigned char this_ch;
265 unsigned int leftchar = 0;
266 PyObject *rv;
267 int bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000268
Guido van Rossum43713e52000-02-29 13:59:29 +0000269 if ( !PyArg_ParseTuple(args, "s#:b2a_uu", &bin_data, &bin_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000270 return NULL;
271 if ( bin_len > 45 ) {
272 /* The 45 is a limit that appears in all uuencode's */
273 PyErr_SetString(Error, "At most 45 bytes at once");
274 return NULL;
275 }
276
277 /* We're lazy and allocate to much (fixed up later) */
278 if ( (rv=PyString_FromStringAndSize(NULL, bin_len*2)) == NULL )
279 return NULL;
280 ascii_data = (unsigned char *)PyString_AsString(rv);
281
282 /* Store the length */
283 *ascii_data++ = ' ' + (bin_len & 077);
Tim Peters934c1a12002-07-02 22:24:50 +0000284
Jack Jansen72781191995-08-07 14:34:15 +0000285 for( ; bin_len > 0 || leftbits != 0 ; bin_len--, bin_data++ ) {
286 /* Shift the data (or padding) into our buffer */
287 if ( bin_len > 0 ) /* Data */
288 leftchar = (leftchar << 8) | *bin_data;
289 else /* Padding */
290 leftchar <<= 8;
291 leftbits += 8;
292
293 /* See if there are 6-bit groups ready */
294 while ( leftbits >= 6 ) {
295 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
296 leftbits -= 6;
297 *ascii_data++ = this_ch + ' ';
298 }
299 }
300 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000301
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000302 _PyString_Resize(&rv, (ascii_data -
303 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000304 return rv;
305}
306
Guido van Rossum2db4f471999-10-19 19:05:14 +0000307
308static int
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000309binascii_find_valid(unsigned char *s, int slen, int num)
Guido van Rossum2db4f471999-10-19 19:05:14 +0000310{
Tim Peters934c1a12002-07-02 22:24:50 +0000311 /* Finds & returns the (num+1)th
Guido van Rossum2db4f471999-10-19 19:05:14 +0000312 ** valid character for base64, or -1 if none.
313 */
314
315 int ret = -1;
316 unsigned char c, b64val;
317
318 while ((slen > 0) && (ret == -1)) {
319 c = *s;
320 b64val = table_a2b_base64[c & 0x7f];
321 if ( ((c <= 0x7f) && (b64val != (unsigned char)-1)) ) {
322 if (num == 0)
323 ret = *s;
324 num--;
325 }
326
327 s++;
328 slen--;
329 }
330 return ret;
331}
332
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000333PyDoc_STRVAR(doc_a2b_base64, "(ascii) -> bin. Decode a line of base64 data");
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000334
335static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000336binascii_a2b_base64(PyObject *self, PyObject *args)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000337{
338 unsigned char *ascii_data, *bin_data;
339 int leftbits = 0;
340 unsigned char this_ch;
341 unsigned int leftchar = 0;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000342 PyObject *rv;
343 int ascii_len, bin_len;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000344 int quad_pos = 0;
Tim Peters934c1a12002-07-02 22:24:50 +0000345
Guido van Rossum43713e52000-02-29 13:59:29 +0000346 if ( !PyArg_ParseTuple(args, "t#:a2b_base64", &ascii_data, &ascii_len) )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000347 return NULL;
348
349 bin_len = ((ascii_len+3)/4)*3; /* Upper bound, corrected later */
350
351 /* Allocate the buffer */
352 if ( (rv=PyString_FromStringAndSize(NULL, bin_len)) == NULL )
353 return NULL;
354 bin_data = (unsigned char *)PyString_AsString(rv);
355 bin_len = 0;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000356
357 for( ; ascii_len > 0; ascii_len--, ascii_data++) {
358 this_ch = *ascii_data;
359
360 if (this_ch > 0x7f ||
361 this_ch == '\r' || this_ch == '\n' || this_ch == ' ')
Jack Jansenba1de3b1996-01-22 10:47:15 +0000362 continue;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000363
364 /* Check for pad sequences and ignore
365 ** the invalid ones.
366 */
367 if (this_ch == BASE64_PAD) {
368 if ( (quad_pos < 2) ||
369 ((quad_pos == 2) &&
370 (binascii_find_valid(ascii_data, ascii_len, 1)
371 != BASE64_PAD)) )
372 {
373 continue;
374 }
375 else {
376 /* A pad sequence means no more input.
377 ** We've already interpreted the data
378 ** from the quad at this point.
379 */
380 leftbits = 0;
381 break;
382 }
383 }
384
385 this_ch = table_a2b_base64[*ascii_data];
386 if ( this_ch == (unsigned char) -1 )
387 continue;
388
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000389 /*
390 ** Shift it in on the low end, and see if there's
391 ** a byte ready for output.
392 */
Guido van Rossum2db4f471999-10-19 19:05:14 +0000393 quad_pos = (quad_pos + 1) & 0x03;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000394 leftchar = (leftchar << 6) | (this_ch);
395 leftbits += 6;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000396
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000397 if ( leftbits >= 8 ) {
398 leftbits -= 8;
399 *bin_data++ = (leftchar >> leftbits) & 0xff;
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000400 bin_len++;
Guido van Rossum2db4f471999-10-19 19:05:14 +0000401 leftchar &= ((1 << leftbits) - 1);
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000402 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000403 }
404
405 if (leftbits != 0) {
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000406 PyErr_SetString(Error, "Incorrect padding");
407 Py_DECREF(rv);
408 return NULL;
409 }
Guido van Rossum2db4f471999-10-19 19:05:14 +0000410
Thomas Wouters9e1c1922003-03-17 11:24:29 +0000411 /* And set string size correctly. If the result string is empty
412 ** (because the input was all invalid) return the shared empty
413 ** string instead; _PyString_Resize() won't do this for us.
414 */
Barry Warsaw0a51b582002-08-15 22:14:24 +0000415 if (bin_len > 0)
416 _PyString_Resize(&rv, bin_len);
Thomas Wouters9e1c1922003-03-17 11:24:29 +0000417 else {
418 Py_DECREF(rv);
419 rv = PyString_FromString("");
420 }
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000421 return rv;
422}
423
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000424PyDoc_STRVAR(doc_b2a_base64, "(bin) -> ascii. Base64-code line of data");
Tim Peters934c1a12002-07-02 22:24:50 +0000425
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000426static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000427binascii_b2a_base64(PyObject *self, PyObject *args)
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000428{
429 unsigned char *ascii_data, *bin_data;
430 int leftbits = 0;
431 unsigned char this_ch;
432 unsigned int leftchar = 0;
433 PyObject *rv;
434 int bin_len;
Tim Peters934c1a12002-07-02 22:24:50 +0000435
Guido van Rossum43713e52000-02-29 13:59:29 +0000436 if ( !PyArg_ParseTuple(args, "s#:b2a_base64", &bin_data, &bin_len) )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000437 return NULL;
438 if ( bin_len > BASE64_MAXBIN ) {
439 PyErr_SetString(Error, "Too much data for base64 line");
440 return NULL;
441 }
Tim Peters934c1a12002-07-02 22:24:50 +0000442
Tim Peters1fbb5772001-12-19 04:41:35 +0000443 /* We're lazy and allocate too much (fixed up later).
444 "+3" leaves room for up to two pad characters and a trailing
445 newline. Note that 'b' gets encoded as 'Yg==\n' (1 in, 5 out). */
446 if ( (rv=PyString_FromStringAndSize(NULL, bin_len*2 + 3)) == NULL )
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000447 return NULL;
448 ascii_data = (unsigned char *)PyString_AsString(rv);
449
450 for( ; bin_len > 0 ; bin_len--, bin_data++ ) {
451 /* Shift the data into our buffer */
452 leftchar = (leftchar << 8) | *bin_data;
453 leftbits += 8;
454
455 /* See if there are 6-bit groups ready */
456 while ( leftbits >= 6 ) {
457 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
458 leftbits -= 6;
459 *ascii_data++ = table_b2a_base64[this_ch];
460 }
461 }
462 if ( leftbits == 2 ) {
463 *ascii_data++ = table_b2a_base64[(leftchar&3) << 4];
464 *ascii_data++ = BASE64_PAD;
465 *ascii_data++ = BASE64_PAD;
466 } else if ( leftbits == 4 ) {
467 *ascii_data++ = table_b2a_base64[(leftchar&0xf) << 2];
468 *ascii_data++ = BASE64_PAD;
Tim Peters934c1a12002-07-02 22:24:50 +0000469 }
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000470 *ascii_data++ = '\n'; /* Append a courtesy newline */
Tim Peters934c1a12002-07-02 22:24:50 +0000471
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000472 _PyString_Resize(&rv, (ascii_data -
473 (unsigned char *)PyString_AsString(rv)));
Jack Jansen84bbc2e1995-10-04 16:38:44 +0000474 return rv;
475}
476
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000477PyDoc_STRVAR(doc_a2b_hqx, "ascii -> bin, done. Decode .hqx coding");
Jack Jansen72781191995-08-07 14:34:15 +0000478
479static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000480binascii_a2b_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000481{
482 unsigned char *ascii_data, *bin_data;
483 int leftbits = 0;
484 unsigned char this_ch;
Jack Janseneaeb1c81995-08-14 12:17:57 +0000485 unsigned int leftchar = 0;
Jack Jansen72781191995-08-07 14:34:15 +0000486 PyObject *rv;
487 int len;
488 int done = 0;
Tim Peters934c1a12002-07-02 22:24:50 +0000489
Guido van Rossum43713e52000-02-29 13:59:29 +0000490 if ( !PyArg_ParseTuple(args, "t#:a2b_hqx", &ascii_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000491 return NULL;
492
493 /* Allocate a string that is too big (fixed later) */
494 if ( (rv=PyString_FromStringAndSize(NULL, len)) == NULL )
495 return NULL;
496 bin_data = (unsigned char *)PyString_AsString(rv);
497
498 for( ; len > 0 ; len--, ascii_data++ ) {
499 /* Get the byte and look it up */
500 this_ch = table_a2b_hqx[*ascii_data];
501 if ( this_ch == SKIP )
502 continue;
503 if ( this_ch == FAIL ) {
504 PyErr_SetString(Error, "Illegal char");
505 Py_DECREF(rv);
506 return NULL;
507 }
508 if ( this_ch == DONE ) {
509 /* The terminating colon */
510 done = 1;
511 break;
512 }
513
514 /* Shift it into the buffer and see if any bytes are ready */
515 leftchar = (leftchar << 6) | (this_ch);
516 leftbits += 6;
517 if ( leftbits >= 8 ) {
518 leftbits -= 8;
519 *bin_data++ = (leftchar >> leftbits) & 0xff;
520 leftchar &= ((1 << leftbits) - 1);
521 }
522 }
Tim Peters934c1a12002-07-02 22:24:50 +0000523
Jack Jansen72781191995-08-07 14:34:15 +0000524 if ( leftbits && !done ) {
525 PyErr_SetString(Incomplete,
526 "String has incomplete number of bytes");
527 Py_DECREF(rv);
528 return NULL;
529 }
Guido van Rossum9c6ba5e1997-01-12 20:02:04 +0000530 _PyString_Resize(
531 &rv, (bin_data - (unsigned char *)PyString_AsString(rv)));
532 if (rv) {
533 PyObject *rrv = Py_BuildValue("Oi", rv, done);
534 Py_DECREF(rv);
535 return rrv;
536 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000537
Jack Jansen72781191995-08-07 14:34:15 +0000538 return NULL;
539}
540
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000541PyDoc_STRVAR(doc_rlecode_hqx, "Binhex RLE-code binary data");
Jack Jansen72781191995-08-07 14:34:15 +0000542
543static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000544binascii_rlecode_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000545{
546 unsigned char *in_data, *out_data;
547 PyObject *rv;
548 unsigned char ch;
549 int in, inend, len;
Tim Peters934c1a12002-07-02 22:24:50 +0000550
Guido van Rossum43713e52000-02-29 13:59:29 +0000551 if ( !PyArg_ParseTuple(args, "s#:rlecode_hqx", &in_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000552 return NULL;
553
554 /* Worst case: output is twice as big as input (fixed later) */
555 if ( (rv=PyString_FromStringAndSize(NULL, len*2)) == NULL )
556 return NULL;
557 out_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000558
Jack Jansen72781191995-08-07 14:34:15 +0000559 for( in=0; in<len; in++) {
560 ch = in_data[in];
561 if ( ch == RUNCHAR ) {
562 /* RUNCHAR. Escape it. */
563 *out_data++ = RUNCHAR;
564 *out_data++ = 0;
565 } else {
566 /* Check how many following are the same */
567 for(inend=in+1;
568 inend<len && in_data[inend] == ch &&
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000569 inend < in+255;
Jack Jansen72781191995-08-07 14:34:15 +0000570 inend++) ;
Jack Jansen0223aa11995-08-31 13:44:23 +0000571 if ( inend - in > 3 ) {
572 /* More than 3 in a row. Output RLE. */
Jack Jansen72781191995-08-07 14:34:15 +0000573 *out_data++ = ch;
574 *out_data++ = RUNCHAR;
575 *out_data++ = inend-in;
576 in = inend-1;
577 } else {
578 /* Less than 3. Output the byte itself */
579 *out_data++ = ch;
580 }
581 }
582 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000583 _PyString_Resize(&rv, (out_data -
584 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000585 return rv;
586}
587
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000588PyDoc_STRVAR(doc_b2a_hqx, "Encode .hqx data");
Tim Peters934c1a12002-07-02 22:24:50 +0000589
Jack Jansen72781191995-08-07 14:34:15 +0000590static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000591binascii_b2a_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000592{
593 unsigned char *ascii_data, *bin_data;
594 int leftbits = 0;
595 unsigned char this_ch;
Jack Janseneaeb1c81995-08-14 12:17:57 +0000596 unsigned int leftchar = 0;
Jack Jansen72781191995-08-07 14:34:15 +0000597 PyObject *rv;
598 int len;
Tim Peters934c1a12002-07-02 22:24:50 +0000599
Guido van Rossum43713e52000-02-29 13:59:29 +0000600 if ( !PyArg_ParseTuple(args, "s#:b2a_hqx", &bin_data, &len) )
Jack Jansen72781191995-08-07 14:34:15 +0000601 return NULL;
602
603 /* Allocate a buffer that is at least large enough */
604 if ( (rv=PyString_FromStringAndSize(NULL, len*2)) == NULL )
605 return NULL;
606 ascii_data = (unsigned char *)PyString_AsString(rv);
Tim Peters934c1a12002-07-02 22:24:50 +0000607
Jack Jansen72781191995-08-07 14:34:15 +0000608 for( ; len > 0 ; len--, bin_data++ ) {
609 /* Shift into our buffer, and output any 6bits ready */
610 leftchar = (leftchar << 8) | *bin_data;
611 leftbits += 8;
612 while ( leftbits >= 6 ) {
613 this_ch = (leftchar >> (leftbits-6)) & 0x3f;
614 leftbits -= 6;
615 *ascii_data++ = table_b2a_hqx[this_ch];
616 }
617 }
618 /* Output a possible runt byte */
619 if ( leftbits ) {
620 leftchar <<= (6-leftbits);
621 *ascii_data++ = table_b2a_hqx[leftchar & 0x3f];
622 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000623 _PyString_Resize(&rv, (ascii_data -
624 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000625 return rv;
626}
627
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000628PyDoc_STRVAR(doc_rledecode_hqx, "Decode hexbin RLE-coded string");
Tim Peters934c1a12002-07-02 22:24:50 +0000629
Jack Jansen72781191995-08-07 14:34:15 +0000630static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000631binascii_rledecode_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000632{
633 unsigned char *in_data, *out_data;
634 unsigned char in_byte, in_repeat;
635 PyObject *rv;
636 int in_len, out_len, out_len_left;
637
Guido van Rossum43713e52000-02-29 13:59:29 +0000638 if ( !PyArg_ParseTuple(args, "s#:rledecode_hqx", &in_data, &in_len) )
Jack Jansen72781191995-08-07 14:34:15 +0000639 return NULL;
640
641 /* Empty string is a special case */
642 if ( in_len == 0 )
643 return Py_BuildValue("s", "");
644
645 /* Allocate a buffer of reasonable size. Resized when needed */
646 out_len = in_len*2;
647 if ( (rv=PyString_FromStringAndSize(NULL, out_len)) == NULL )
648 return NULL;
649 out_len_left = out_len;
650 out_data = (unsigned char *)PyString_AsString(rv);
651
652 /*
653 ** We need two macros here to get/put bytes and handle
654 ** end-of-buffer for input and output strings.
655 */
656#define INBYTE(b) \
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000657 do { \
658 if ( --in_len < 0 ) { \
659 PyErr_SetString(Incomplete, ""); \
660 Py_DECREF(rv); \
661 return NULL; \
662 } \
663 b = *in_data++; \
664 } while(0)
Tim Peters934c1a12002-07-02 22:24:50 +0000665
Jack Jansen72781191995-08-07 14:34:15 +0000666#define OUTBYTE(b) \
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000667 do { \
668 if ( --out_len_left < 0 ) { \
669 _PyString_Resize(&rv, 2*out_len); \
670 if ( rv == NULL ) return NULL; \
671 out_data = (unsigned char *)PyString_AsString(rv) \
672 + out_len; \
673 out_len_left = out_len-1; \
674 out_len = out_len * 2; \
675 } \
676 *out_data++ = b; \
677 } while(0)
Jack Jansen72781191995-08-07 14:34:15 +0000678
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000679 /*
680 ** Handle first byte separately (since we have to get angry
681 ** in case of an orphaned RLE code).
682 */
683 INBYTE(in_byte);
Jack Jansen72781191995-08-07 14:34:15 +0000684
685 if (in_byte == RUNCHAR) {
686 INBYTE(in_repeat);
687 if (in_repeat != 0) {
688 /* Note Error, not Incomplete (which is at the end
689 ** of the string only). This is a programmer error.
690 */
691 PyErr_SetString(Error, "Orphaned RLE code at start");
692 Py_DECREF(rv);
693 return NULL;
694 }
695 OUTBYTE(RUNCHAR);
696 } else {
697 OUTBYTE(in_byte);
698 }
Tim Peters934c1a12002-07-02 22:24:50 +0000699
Jack Jansen72781191995-08-07 14:34:15 +0000700 while( in_len > 0 ) {
701 INBYTE(in_byte);
702
703 if (in_byte == RUNCHAR) {
704 INBYTE(in_repeat);
705 if ( in_repeat == 0 ) {
706 /* Just an escaped RUNCHAR value */
707 OUTBYTE(RUNCHAR);
708 } else {
709 /* Pick up value and output a sequence of it */
710 in_byte = out_data[-1];
711 while ( --in_repeat > 0 )
712 OUTBYTE(in_byte);
713 }
714 } else {
715 /* Normal byte */
716 OUTBYTE(in_byte);
717 }
718 }
Roger E. Masse5f4ce181997-01-16 17:10:22 +0000719 _PyString_Resize(&rv, (out_data -
720 (unsigned char *)PyString_AsString(rv)));
Jack Jansen72781191995-08-07 14:34:15 +0000721 return rv;
722}
723
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000724PyDoc_STRVAR(doc_crc_hqx,
725"(data, oldcrc) -> newcrc. Compute hqx CRC incrementally");
Jack Jansen72781191995-08-07 14:34:15 +0000726
727static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000728binascii_crc_hqx(PyObject *self, PyObject *args)
Jack Jansen72781191995-08-07 14:34:15 +0000729{
730 unsigned char *bin_data;
731 unsigned int crc;
732 int len;
Tim Peters934c1a12002-07-02 22:24:50 +0000733
Guido van Rossum43713e52000-02-29 13:59:29 +0000734 if ( !PyArg_ParseTuple(args, "s#i:crc_hqx", &bin_data, &len, &crc) )
Jack Jansen72781191995-08-07 14:34:15 +0000735 return NULL;
736
737 while(len--) {
738 crc=((crc<<8)&0xff00)^crctab_hqx[((crc>>8)&0xff)^*bin_data++];
739 }
740
741 return Py_BuildValue("i", crc);
742}
743
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000744PyDoc_STRVAR(doc_crc32,
745"(data, oldcrc = 0) -> newcrc. Compute CRC-32 incrementally");
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000746
747/* Crc - 32 BIT ANSI X3.66 CRC checksum files
748 Also known as: ISO 3307
749**********************************************************************|
750* *|
751* Demonstration program to compute the 32-bit CRC used as the frame *|
752* check sequence in ADCCP (ANSI X3.66, also known as FIPS PUB 71 *|
753* and FED-STD-1003, the U.S. versions of CCITT's X.25 link-level *|
754* protocol). The 32-bit FCS was added via the Federal Register, *|
755* 1 June 1982, p.23798. I presume but don't know for certain that *|
756* this polynomial is or will be included in CCITT V.41, which *|
757* defines the 16-bit CRC (often called CRC-CCITT) polynomial. FIPS *|
758* PUB 78 says that the 32-bit FCS reduces otherwise undetected *|
759* errors by a factor of 10^-5 over 16-bit FCS. *|
760* *|
761**********************************************************************|
762
763 Copyright (C) 1986 Gary S. Brown. You may use this program, or
764 code or tables extracted from it, as desired without restriction.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000765
Tim Peters934c1a12002-07-02 22:24:50 +0000766 First, the polynomial itself and its table of feedback terms. The
767 polynomial is
768 X^32+X^26+X^23+X^22+X^16+X^12+X^11+X^10+X^8+X^7+X^5+X^4+X^2+X^1+X^0
769 Note that we take it "backwards" and put the highest-order term in
770 the lowest-order bit. The X^32 term is "implied"; the LSB is the
771 X^31 term, etc. The X^0 term (usually shown as "+1") results in
772 the MSB being 1.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000773
Tim Peters934c1a12002-07-02 22:24:50 +0000774 Note that the usual hardware shift register implementation, which
775 is what we're using (we're merely optimizing it by doing eight-bit
776 chunks at a time) shifts bits into the lowest-order term. In our
777 implementation, that means shifting towards the right. Why do we
778 do it this way? Because the calculated CRC must be transmitted in
779 order from highest-order term to lowest-order term. UARTs transmit
780 characters in order from LSB to MSB. By storing the CRC this way,
781 we hand it to the UART in the order low-byte to high-byte; the UART
782 sends each low-bit to hight-bit; and the result is transmission bit
783 by bit from highest- to lowest-order term without requiring any bit
784 shuffling on our part. Reception works similarly.
785
786 The feedback terms table consists of 256, 32-bit entries. Notes:
787
788 1. The table can be generated at runtime if desired; code to do so
789 is shown later. It might not be obvious, but the feedback
790 terms simply represent the results of eight shift/xor opera-
791 tions for all combinations of data and CRC register values.
792
793 2. The CRC accumulation logic is the same for all CRC polynomials,
794 be they sixteen or thirty-two bits wide. You simply choose the
795 appropriate table. Alternatively, because the table can be
796 generated at runtime, you can start by generating the table for
797 the polynomial in question and use exactly the same "updcrc",
798 if your application needn't simultaneously handle two CRC
799 polynomials. (Note, however, that XMODEM is strange.)
800
801 3. For 16-bit CRCs, the table entries need be only 16 bits wide;
802 of course, 32-bit entries work OK if the high 16 bits are zero.
803
804 4. The values must be right-shifted by eight bits by the "updcrc"
805 logic; the shift must be unsigned (bring in zeroes). On some
806 hardware you could probably optimize the shift in assembler by
807 using byte-swap instructions.
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000808********************************************************************/
809
810static unsigned long crc_32_tab[256] = {
8110x00000000UL, 0x77073096UL, 0xee0e612cUL, 0x990951baUL, 0x076dc419UL,
8120x706af48fUL, 0xe963a535UL, 0x9e6495a3UL, 0x0edb8832UL, 0x79dcb8a4UL,
8130xe0d5e91eUL, 0x97d2d988UL, 0x09b64c2bUL, 0x7eb17cbdUL, 0xe7b82d07UL,
8140x90bf1d91UL, 0x1db71064UL, 0x6ab020f2UL, 0xf3b97148UL, 0x84be41deUL,
8150x1adad47dUL, 0x6ddde4ebUL, 0xf4d4b551UL, 0x83d385c7UL, 0x136c9856UL,
8160x646ba8c0UL, 0xfd62f97aUL, 0x8a65c9ecUL, 0x14015c4fUL, 0x63066cd9UL,
8170xfa0f3d63UL, 0x8d080df5UL, 0x3b6e20c8UL, 0x4c69105eUL, 0xd56041e4UL,
8180xa2677172UL, 0x3c03e4d1UL, 0x4b04d447UL, 0xd20d85fdUL, 0xa50ab56bUL,
8190x35b5a8faUL, 0x42b2986cUL, 0xdbbbc9d6UL, 0xacbcf940UL, 0x32d86ce3UL,
8200x45df5c75UL, 0xdcd60dcfUL, 0xabd13d59UL, 0x26d930acUL, 0x51de003aUL,
8210xc8d75180UL, 0xbfd06116UL, 0x21b4f4b5UL, 0x56b3c423UL, 0xcfba9599UL,
8220xb8bda50fUL, 0x2802b89eUL, 0x5f058808UL, 0xc60cd9b2UL, 0xb10be924UL,
8230x2f6f7c87UL, 0x58684c11UL, 0xc1611dabUL, 0xb6662d3dUL, 0x76dc4190UL,
8240x01db7106UL, 0x98d220bcUL, 0xefd5102aUL, 0x71b18589UL, 0x06b6b51fUL,
8250x9fbfe4a5UL, 0xe8b8d433UL, 0x7807c9a2UL, 0x0f00f934UL, 0x9609a88eUL,
8260xe10e9818UL, 0x7f6a0dbbUL, 0x086d3d2dUL, 0x91646c97UL, 0xe6635c01UL,
8270x6b6b51f4UL, 0x1c6c6162UL, 0x856530d8UL, 0xf262004eUL, 0x6c0695edUL,
8280x1b01a57bUL, 0x8208f4c1UL, 0xf50fc457UL, 0x65b0d9c6UL, 0x12b7e950UL,
8290x8bbeb8eaUL, 0xfcb9887cUL, 0x62dd1ddfUL, 0x15da2d49UL, 0x8cd37cf3UL,
8300xfbd44c65UL, 0x4db26158UL, 0x3ab551ceUL, 0xa3bc0074UL, 0xd4bb30e2UL,
8310x4adfa541UL, 0x3dd895d7UL, 0xa4d1c46dUL, 0xd3d6f4fbUL, 0x4369e96aUL,
8320x346ed9fcUL, 0xad678846UL, 0xda60b8d0UL, 0x44042d73UL, 0x33031de5UL,
8330xaa0a4c5fUL, 0xdd0d7cc9UL, 0x5005713cUL, 0x270241aaUL, 0xbe0b1010UL,
8340xc90c2086UL, 0x5768b525UL, 0x206f85b3UL, 0xb966d409UL, 0xce61e49fUL,
8350x5edef90eUL, 0x29d9c998UL, 0xb0d09822UL, 0xc7d7a8b4UL, 0x59b33d17UL,
8360x2eb40d81UL, 0xb7bd5c3bUL, 0xc0ba6cadUL, 0xedb88320UL, 0x9abfb3b6UL,
8370x03b6e20cUL, 0x74b1d29aUL, 0xead54739UL, 0x9dd277afUL, 0x04db2615UL,
8380x73dc1683UL, 0xe3630b12UL, 0x94643b84UL, 0x0d6d6a3eUL, 0x7a6a5aa8UL,
8390xe40ecf0bUL, 0x9309ff9dUL, 0x0a00ae27UL, 0x7d079eb1UL, 0xf00f9344UL,
8400x8708a3d2UL, 0x1e01f268UL, 0x6906c2feUL, 0xf762575dUL, 0x806567cbUL,
8410x196c3671UL, 0x6e6b06e7UL, 0xfed41b76UL, 0x89d32be0UL, 0x10da7a5aUL,
8420x67dd4accUL, 0xf9b9df6fUL, 0x8ebeeff9UL, 0x17b7be43UL, 0x60b08ed5UL,
8430xd6d6a3e8UL, 0xa1d1937eUL, 0x38d8c2c4UL, 0x4fdff252UL, 0xd1bb67f1UL,
8440xa6bc5767UL, 0x3fb506ddUL, 0x48b2364bUL, 0xd80d2bdaUL, 0xaf0a1b4cUL,
8450x36034af6UL, 0x41047a60UL, 0xdf60efc3UL, 0xa867df55UL, 0x316e8eefUL,
8460x4669be79UL, 0xcb61b38cUL, 0xbc66831aUL, 0x256fd2a0UL, 0x5268e236UL,
8470xcc0c7795UL, 0xbb0b4703UL, 0x220216b9UL, 0x5505262fUL, 0xc5ba3bbeUL,
8480xb2bd0b28UL, 0x2bb45a92UL, 0x5cb36a04UL, 0xc2d7ffa7UL, 0xb5d0cf31UL,
8490x2cd99e8bUL, 0x5bdeae1dUL, 0x9b64c2b0UL, 0xec63f226UL, 0x756aa39cUL,
8500x026d930aUL, 0x9c0906a9UL, 0xeb0e363fUL, 0x72076785UL, 0x05005713UL,
8510x95bf4a82UL, 0xe2b87a14UL, 0x7bb12baeUL, 0x0cb61b38UL, 0x92d28e9bUL,
8520xe5d5be0dUL, 0x7cdcefb7UL, 0x0bdbdf21UL, 0x86d3d2d4UL, 0xf1d4e242UL,
8530x68ddb3f8UL, 0x1fda836eUL, 0x81be16cdUL, 0xf6b9265bUL, 0x6fb077e1UL,
8540x18b74777UL, 0x88085ae6UL, 0xff0f6a70UL, 0x66063bcaUL, 0x11010b5cUL,
8550x8f659effUL, 0xf862ae69UL, 0x616bffd3UL, 0x166ccf45UL, 0xa00ae278UL,
8560xd70dd2eeUL, 0x4e048354UL, 0x3903b3c2UL, 0xa7672661UL, 0xd06016f7UL,
8570x4969474dUL, 0x3e6e77dbUL, 0xaed16a4aUL, 0xd9d65adcUL, 0x40df0b66UL,
8580x37d83bf0UL, 0xa9bcae53UL, 0xdebb9ec5UL, 0x47b2cf7fUL, 0x30b5ffe9UL,
8590xbdbdf21cUL, 0xcabac28aUL, 0x53b39330UL, 0x24b4a3a6UL, 0xbad03605UL,
8600xcdd70693UL, 0x54de5729UL, 0x23d967bfUL, 0xb3667a2eUL, 0xc4614ab8UL,
8610x5d681b02UL, 0x2a6f2b94UL, 0xb40bbe37UL, 0xc30c8ea1UL, 0x5a05df1bUL,
8620x2d02ef8dUL
863};
864
865static PyObject *
Peter Schneider-Kampa788a7f2000-07-10 09:57:19 +0000866binascii_crc32(PyObject *self, PyObject *args)
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000867{ /* By Jim Ahlstrom; All rights transferred to CNRI */
868 unsigned char *bin_data;
869 unsigned long crc = 0UL; /* initial value of CRC */
870 int len;
Tim Petersa98011c2002-07-02 20:20:08 +0000871 long result;
Tim Peters934c1a12002-07-02 22:24:50 +0000872
Guido van Rossum43713e52000-02-29 13:59:29 +0000873 if ( !PyArg_ParseTuple(args, "s#|l:crc32", &bin_data, &len, &crc) )
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000874 return NULL;
875
Tim Peters934c1a12002-07-02 22:24:50 +0000876 crc = ~ crc;
877#if SIZEOF_LONG > 4
878 /* only want the trailing 32 bits */
879 crc &= 0xFFFFFFFFUL;
880#endif
881 while (len--)
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000882 crc = crc_32_tab[(crc ^ *bin_data++) & 0xffUL] ^ (crc >> 8);
883 /* Note: (crc >> 8) MUST zero fill on left */
Tim Petersa98011c2002-07-02 20:20:08 +0000884
885 result = (long)(crc ^ 0xFFFFFFFFUL);
Tim Peters934c1a12002-07-02 22:24:50 +0000886#if SIZEOF_LONG > 4
887 /* Extend the sign bit. This is one way to ensure the result is the
888 * same across platforms. The other way would be to return an
889 * unbounded unsigned long, but the evidence suggests that lots of
890 * code outside this treats the result as if it were a signed 4-byte
891 * integer.
Tim Petersa98011c2002-07-02 20:20:08 +0000892 */
893 result |= -(result & (1L << 31));
Tim Peters934c1a12002-07-02 22:24:50 +0000894#endif
Tim Petersa98011c2002-07-02 20:20:08 +0000895 return PyInt_FromLong(result);
Guido van Rossum7d47c9e2000-02-16 21:11:52 +0000896}
897
Barry Warsawe977c212000-08-15 06:07:13 +0000898
899static PyObject *
900binascii_hexlify(PyObject *self, PyObject *args)
901{
902 char* argbuf;
903 int arglen;
904 PyObject *retval;
905 char* retbuf;
906 int i, j;
907
908 if (!PyArg_ParseTuple(args, "t#:b2a_hex", &argbuf, &arglen))
909 return NULL;
910
911 retval = PyString_FromStringAndSize(NULL, arglen*2);
912 if (!retval)
913 return NULL;
914 retbuf = PyString_AsString(retval);
915 if (!retbuf)
916 goto finally;
917
918 /* make hex version of string, taken from shamodule.c */
919 for (i=j=0; i < arglen; i++) {
920 char c;
921 c = (argbuf[i] >> 4) & 0xf;
922 c = (c>9) ? c+'a'-10 : c + '0';
923 retbuf[j++] = c;
924 c = argbuf[i] & 0xf;
925 c = (c>9) ? c+'a'-10 : c + '0';
926 retbuf[j++] = c;
927 }
928 return retval;
929
930 finally:
931 Py_DECREF(retval);
932 return NULL;
933}
934
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000935PyDoc_STRVAR(doc_hexlify,
Barry Warsawe977c212000-08-15 06:07:13 +0000936"b2a_hex(data) -> s; Hexadecimal representation of binary data.\n\
937\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000938This function is also available as \"hexlify()\".");
Barry Warsawe977c212000-08-15 06:07:13 +0000939
940
941static int
Tim Peters934c1a12002-07-02 22:24:50 +0000942to_int(int c)
Barry Warsawe977c212000-08-15 06:07:13 +0000943{
944 if (isdigit(c))
945 return c - '0';
946 else {
947 if (isupper(c))
948 c = tolower(c);
949 if (c >= 'a' && c <= 'f')
950 return c - 'a' + 10;
951 }
952 return -1;
953}
954
955
956static PyObject *
957binascii_unhexlify(PyObject *self, PyObject *args)
958{
959 char* argbuf;
960 int arglen;
961 PyObject *retval;
962 char* retbuf;
963 int i, j;
964
965 if (!PyArg_ParseTuple(args, "s#:a2b_hex", &argbuf, &arglen))
966 return NULL;
967
Barry Warsaw16168472000-08-15 06:59:58 +0000968 /* XXX What should we do about strings with an odd length? Should
969 * we add an implicit leading zero, or a trailing zero? For now,
970 * raise an exception.
Barry Warsawe977c212000-08-15 06:07:13 +0000971 */
972 if (arglen % 2) {
Barry Warsaw16168472000-08-15 06:59:58 +0000973 PyErr_SetString(PyExc_TypeError, "Odd-length string");
Barry Warsawe977c212000-08-15 06:07:13 +0000974 return NULL;
975 }
976
977 retval = PyString_FromStringAndSize(NULL, (arglen/2));
978 if (!retval)
979 return NULL;
980 retbuf = PyString_AsString(retval);
981 if (!retbuf)
982 goto finally;
983
984 for (i=j=0; i < arglen; i += 2) {
985 int top = to_int(Py_CHARMASK(argbuf[i]));
986 int bot = to_int(Py_CHARMASK(argbuf[i+1]));
987 if (top == -1 || bot == -1) {
988 PyErr_SetString(PyExc_TypeError,
Barry Warsaw16168472000-08-15 06:59:58 +0000989 "Non-hexadecimal digit found");
Barry Warsawe977c212000-08-15 06:07:13 +0000990 goto finally;
991 }
992 retbuf[j++] = (top << 4) + bot;
993 }
994 return retval;
995
996 finally:
997 Py_DECREF(retval);
998 return NULL;
999}
1000
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001001PyDoc_STRVAR(doc_unhexlify,
Barry Warsawe977c212000-08-15 06:07:13 +00001002"a2b_hex(hexstr) -> s; Binary data of hexadecimal representation.\n\
1003\n\
1004hexstr must contain an even number of hex digits (upper or lower case).\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001005This function is also available as \"unhexlify()\"");
Barry Warsawe977c212000-08-15 06:07:13 +00001006
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001007static int table_hex[128] = {
1008 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1009 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1010 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1011 0, 1, 2, 3, 4, 5, 6, 7, 8, 9,-1,-1, -1,-1,-1,-1,
1012 -1,10,11,12, 13,14,15,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1013 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1014 -1,10,11,12, 13,14,15,-1, -1,-1,-1,-1, -1,-1,-1,-1,
1015 -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1, -1,-1,-1,-1
1016};
1017
1018#define hexval(c) table_hex[(unsigned int)(c)]
1019
1020#define MAXLINESIZE 76
1021
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001022PyDoc_STRVAR(doc_a2b_qp, "Decode a string of qp-encoded data");
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001023
Tim Peters934c1a12002-07-02 22:24:50 +00001024static PyObject*
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001025binascii_a2b_qp(PyObject *self, PyObject *args, PyObject *kwargs)
1026{
1027 unsigned int in, out;
1028 char ch;
1029 unsigned char *data, *odata;
1030 unsigned int datalen = 0;
1031 PyObject *rv;
1032 static char *kwlist[] = {"data", "header", NULL};
1033 int header = 0;
1034
Tim Peters934c1a12002-07-02 22:24:50 +00001035 if (!PyArg_ParseTupleAndKeywords(args, kwargs, "s#|i", kwlist, &data,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001036 &datalen, &header))
1037 return NULL;
1038
1039 /* We allocate the output same size as input, this is overkill */
Greg Warda645b302001-10-04 14:54:53 +00001040 odata = (unsigned char *) calloc(1, datalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001041
1042 if (odata == NULL) {
1043 PyErr_NoMemory();
1044 return NULL;
1045 }
1046
1047 in = out = 0;
1048 while (in < datalen) {
1049 if (data[in] == '=') {
1050 in++;
1051 if (in >= datalen) break;
1052 /* Soft line breaks */
Tim Peters934c1a12002-07-02 22:24:50 +00001053 if ((data[in] == '\n') || (data[in] == '\r') ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001054 (data[in] == ' ') || (data[in] == '\t')) {
1055 if (data[in] != '\n') {
1056 while (in < datalen && data[in] != '\n') in++;
1057 }
1058 if (in < datalen) in++;
1059 }
1060 else if (data[in] == '=') {
1061 /* broken case from broken python qp */
1062 odata[out++] = '=';
1063 in++;
1064 }
Tim Peters934c1a12002-07-02 22:24:50 +00001065 else if (((data[in] >= 'A' && data[in] <= 'F') ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001066 (data[in] >= 'a' && data[in] <= 'f') ||
1067 (data[in] >= '0' && data[in] <= '9')) &&
1068 ((data[in+1] >= 'A' && data[in+1] <= 'F') ||
1069 (data[in+1] >= 'a' && data[in+1] <= 'f') ||
1070 (data[in+1] >= '0' && data[in+1] <= '9'))) {
1071 /* hexval */
1072 ch = hexval(data[in]) << 4;
1073 in++;
1074 ch |= hexval(data[in]);
1075 in++;
1076 odata[out++] = ch;
1077 }
1078 else {
1079 odata[out++] = '=';
1080 }
1081 }
1082 else if (header && data[in] == '_') {
1083 odata[out++] = ' ';
1084 in++;
1085 }
1086 else {
1087 odata[out] = data[in];
1088 in++;
1089 out++;
1090 }
1091 }
Greg Warda645b302001-10-04 14:54:53 +00001092 if ((rv = PyString_FromStringAndSize((char *)odata, out)) == NULL) {
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001093 free (odata);
1094 return NULL;
1095 }
1096 free (odata);
1097 return rv;
1098}
1099
Tim Peters934c1a12002-07-02 22:24:50 +00001100static int
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001101to_hex (unsigned char ch, unsigned char *s)
1102{
1103 unsigned int uvalue = ch;
1104
1105 s[1] = "0123456789ABCDEF"[uvalue % 16];
1106 uvalue = (uvalue / 16);
1107 s[0] = "0123456789ABCDEF"[uvalue % 16];
1108 return 0;
1109}
1110
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001111PyDoc_STRVAR(doc_b2a_qp,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001112"b2a_qp(data, quotetabs=0, istext=1, header=0) -> s; \n\
1113 Encode a string using quoted-printable encoding. \n\
1114\n\
1115On encoding, when istext is set, newlines are not encoded, and white \n\
1116space at end of lines is. When istext is not set, \\r and \\n (CR/LF) are \n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001117both encoded. When quotetabs is set, space and tabs are encoded.");
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001118
1119/* XXX: This is ridiculously complicated to be backward compatible
1120 * (mostly) with the quopri module. It doesn't re-create the quopri
1121 * module bug where text ending in CRLF has the CR encoded */
Tim Peters934c1a12002-07-02 22:24:50 +00001122static PyObject*
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001123binascii_b2a_qp (PyObject *self, PyObject *args, PyObject *kwargs)
1124{
1125 unsigned int in, out;
1126 unsigned char *data, *odata;
1127 unsigned int datalen = 0, odatalen = 0;
1128 PyObject *rv;
1129 unsigned int linelen = 0;
1130 static char *kwlist[] = {"data", "quotetabs", "istext", "header", NULL};
1131 int istext = 1;
1132 int quotetabs = 0;
1133 int header = 0;
1134 unsigned char ch;
1135 int crlf = 0;
1136 unsigned char *p;
1137
Tim Peters934c1a12002-07-02 22:24:50 +00001138 if (!PyArg_ParseTupleAndKeywords(args, kwargs, "s#|iii", kwlist, &data,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001139 &datalen, &quotetabs, &istext, &header))
1140 return NULL;
1141
1142 /* See if this string is using CRLF line ends */
1143 /* XXX: this function has the side effect of converting all of
1144 * the end of lines to be the same depending on this detection
1145 * here */
Greg Warda645b302001-10-04 14:54:53 +00001146 p = (unsigned char *) strchr((char *)data, '\n');
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001147 if ((p != NULL) && (p > data) && (*(p-1) == '\r'))
1148 crlf = 1;
1149
1150 /* First, scan to see how many characters need to be encoded */
1151 in = 0;
1152 while (in < datalen) {
Tim Peters934c1a12002-07-02 22:24:50 +00001153 if ((data[in] > 126) ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001154 (data[in] == '=') ||
1155 (header && data[in] == '_') ||
1156 ((data[in] == '.') && (linelen == 1)) ||
1157 (!istext && ((data[in] == '\r') || (data[in] == '\n'))) ||
1158 ((data[in] == '\t' || data[in] == ' ') && (in + 1 == datalen)) ||
Tim Peters934c1a12002-07-02 22:24:50 +00001159 ((data[in] < 33) &&
1160 (data[in] != '\r') && (data[in] != '\n') &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001161 (quotetabs && ((data[in] != '\t') || (data[in] != ' ')))))
1162 {
1163 if ((linelen + 3) >= MAXLINESIZE) {
1164 linelen = 0;
1165 if (crlf)
1166 odatalen += 3;
1167 else
1168 odatalen += 2;
1169 }
1170 linelen += 3;
1171 odatalen += 3;
1172 in++;
1173 }
1174 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001175 if (istext &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001176 ((data[in] == '\n') ||
1177 ((in+1 < datalen) && (data[in] == '\r') &&
1178 (data[in+1] == '\n'))))
1179 {
1180 linelen = 0;
1181 /* Protect against whitespace on end of line */
1182 if (in && ((data[in-1] == ' ') || (data[in-1] == '\t')))
1183 odatalen += 2;
1184 if (crlf)
1185 odatalen += 2;
1186 else
1187 odatalen += 1;
1188 if (data[in] == '\r')
1189 in += 2;
1190 else
1191 in++;
1192 }
1193 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001194 if ((in + 1 != datalen) &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001195 (data[in+1] != '\n') &&
1196 (linelen + 1) >= MAXLINESIZE) {
1197 linelen = 0;
1198 if (crlf)
1199 odatalen += 3;
1200 else
1201 odatalen += 2;
1202 }
1203 linelen++;
1204 odatalen++;
1205 in++;
1206 }
1207 }
1208 }
1209
Greg Warda645b302001-10-04 14:54:53 +00001210 odata = (unsigned char *) calloc(1, odatalen);
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001211
1212 if (odata == NULL) {
1213 PyErr_NoMemory();
1214 return NULL;
1215 }
1216
1217 in = out = linelen = 0;
1218 while (in < datalen) {
Tim Peters934c1a12002-07-02 22:24:50 +00001219 if ((data[in] > 126) ||
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001220 (data[in] == '=') ||
1221 (header && data[in] == '_') ||
1222 ((data[in] == '.') && (linelen == 1)) ||
1223 (!istext && ((data[in] == '\r') || (data[in] == '\n'))) ||
1224 ((data[in] == '\t' || data[in] == ' ') && (in + 1 == datalen)) ||
Tim Peters934c1a12002-07-02 22:24:50 +00001225 ((data[in] < 33) &&
1226 (data[in] != '\r') && (data[in] != '\n') &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001227 (quotetabs && ((data[in] != '\t') || (data[in] != ' ')))))
1228 {
1229 if ((linelen + 3 )>= MAXLINESIZE) {
1230 odata[out++] = '=';
1231 if (crlf) odata[out++] = '\r';
1232 odata[out++] = '\n';
1233 linelen = 0;
1234 }
1235 odata[out++] = '=';
1236 to_hex(data[in], &odata[out]);
1237 out += 2;
1238 in++;
1239 linelen += 3;
1240 }
1241 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001242 if (istext &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001243 ((data[in] == '\n') ||
1244 ((in+1 < datalen) && (data[in] == '\r') &&
1245 (data[in+1] == '\n'))))
1246 {
1247 linelen = 0;
1248 /* Protect against whitespace on end of line */
1249 if (out && ((odata[out-1] == ' ') || (odata[out-1] == '\t'))) {
1250 ch = odata[out-1];
1251 odata[out-1] = '=';
1252 to_hex(ch, &odata[out]);
1253 out += 2;
1254 }
Tim Peters934c1a12002-07-02 22:24:50 +00001255
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001256 if (crlf) odata[out++] = '\r';
1257 odata[out++] = '\n';
1258 if (data[in] == '\r')
1259 in += 2;
1260 else
1261 in++;
1262 }
1263 else {
Tim Peters934c1a12002-07-02 22:24:50 +00001264 if ((in + 1 != datalen) &&
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001265 (data[in+1] != '\n') &&
1266 (linelen + 1) >= MAXLINESIZE) {
1267 odata[out++] = '=';
1268 if (crlf) odata[out++] = '\r';
1269 odata[out++] = '\n';
1270 linelen = 0;
1271 }
1272 linelen++;
1273 if (header && data[in] == ' ') {
1274 odata[out++] = '_';
1275 in++;
1276 }
1277 else {
1278 odata[out++] = data[in++];
1279 }
1280 }
1281 }
1282 }
Greg Warda645b302001-10-04 14:54:53 +00001283 if ((rv = PyString_FromStringAndSize((char *)odata, out)) == NULL) {
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001284 free (odata);
1285 return NULL;
1286 }
1287 free (odata);
1288 return rv;
1289}
Barry Warsawe977c212000-08-15 06:07:13 +00001290
Jack Jansen72781191995-08-07 14:34:15 +00001291/* List of functions defined in the module */
1292
1293static struct PyMethodDef binascii_module_methods[] = {
Barry Warsawe977c212000-08-15 06:07:13 +00001294 {"a2b_uu", binascii_a2b_uu, METH_VARARGS, doc_a2b_uu},
1295 {"b2a_uu", binascii_b2a_uu, METH_VARARGS, doc_b2a_uu},
1296 {"a2b_base64", binascii_a2b_base64, METH_VARARGS, doc_a2b_base64},
1297 {"b2a_base64", binascii_b2a_base64, METH_VARARGS, doc_b2a_base64},
1298 {"a2b_hqx", binascii_a2b_hqx, METH_VARARGS, doc_a2b_hqx},
1299 {"b2a_hqx", binascii_b2a_hqx, METH_VARARGS, doc_b2a_hqx},
1300 {"b2a_hex", binascii_hexlify, METH_VARARGS, doc_hexlify},
1301 {"a2b_hex", binascii_unhexlify, METH_VARARGS, doc_unhexlify},
1302 {"hexlify", binascii_hexlify, METH_VARARGS, doc_hexlify},
1303 {"unhexlify", binascii_unhexlify, METH_VARARGS, doc_unhexlify},
1304 {"rlecode_hqx", binascii_rlecode_hqx, METH_VARARGS, doc_rlecode_hqx},
1305 {"rledecode_hqx", binascii_rledecode_hqx, METH_VARARGS,
1306 doc_rledecode_hqx},
1307 {"crc_hqx", binascii_crc_hqx, METH_VARARGS, doc_crc_hqx},
1308 {"crc32", binascii_crc32, METH_VARARGS, doc_crc32},
Tim Peters934c1a12002-07-02 22:24:50 +00001309 {"a2b_qp", (PyCFunction)binascii_a2b_qp, METH_VARARGS | METH_KEYWORDS,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001310 doc_a2b_qp},
Tim Peters934c1a12002-07-02 22:24:50 +00001311 {"b2a_qp", (PyCFunction)binascii_b2a_qp, METH_VARARGS | METH_KEYWORDS,
Martin v. Löwis16dc7f42001-09-30 20:32:11 +00001312 doc_b2a_qp},
Barry Warsawe977c212000-08-15 06:07:13 +00001313 {NULL, NULL} /* sentinel */
Jack Jansen72781191995-08-07 14:34:15 +00001314};
1315
1316
1317/* Initialization function for the module (*must* be called initbinascii) */
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001318PyDoc_STRVAR(doc_binascii, "Conversion between binary data and ASCII");
Jack Jansen72781191995-08-07 14:34:15 +00001319
Mark Hammondfe51c6d2002-08-02 02:27:13 +00001320PyMODINIT_FUNC
Thomas Woutersf3f33dc2000-07-21 06:00:07 +00001321initbinascii(void)
Jack Jansen72781191995-08-07 14:34:15 +00001322{
1323 PyObject *m, *d, *x;
1324
1325 /* Create the module and add the functions */
1326 m = Py_InitModule("binascii", binascii_module_methods);
1327
1328 d = PyModule_GetDict(m);
1329 x = PyString_FromString(doc_binascii);
1330 PyDict_SetItemString(d, "__doc__", x);
Guido van Rossum5c159bd1997-08-04 23:55:25 +00001331 Py_XDECREF(x);
Jack Jansen72781191995-08-07 14:34:15 +00001332
Guido van Rossum7dbb48a1997-10-08 15:26:07 +00001333 Error = PyErr_NewException("binascii.Error", NULL, NULL);
Jack Jansen72781191995-08-07 14:34:15 +00001334 PyDict_SetItemString(d, "Error", Error);
Guido van Rossum7dbb48a1997-10-08 15:26:07 +00001335 Incomplete = PyErr_NewException("binascii.Incomplete", NULL, NULL);
Jack Jansen72781191995-08-07 14:34:15 +00001336 PyDict_SetItemString(d, "Incomplete", Incomplete);
Jack Jansen72781191995-08-07 14:34:15 +00001337}