blob: c26111a9d5b3a5fe9edf5176447bfa60d74fb461 [file] [log] [blame]
Guido van Rossumbe0e9421993-12-24 10:32:00 +00001
Guido van Rossum1924a061998-12-18 22:02:37 +00002#include "Python.h"
Guido van Rossumb6775db1994-08-01 11:34:53 +00003
/* On SGI builds with thread support, make sure _SGI_MP_SOURCE is defined
 * before the system headers included further down are processed. */
#if defined(__sgi) && defined(WITH_THREAD) && !defined(_SGI_MP_SOURCE)
#define _SGI_MP_SOURCE
#endif

/* Convert a possibly signed character to a nonnegative int, so the result
 * is safe to pass to the <ctype.h> functions or to use as an index into a
 * 256-entry table. */
/* XXX This assumes characters are 8 bits wide */
/* NOTE(review): the two replacement lists are deliberately left exactly as
 * they were; if an included header provides the same macro, an identical
 * redefinition stays legal -- confirm before changing the expansion. */
#ifdef __CHAR_UNSIGNED__
#define Py_CHARMASK(c) (c)
#else
#define Py_CHARMASK(c) ((c) & 0xff)
#endif
15
/* strtol and strtoul, renamed (PyOS_ prefix) to avoid conflicts */
17
Thomas Wouters477c8d52006-05-27 19:21:47 +000018
19#include <ctype.h>
Thomas Wouters0e3f5912006-08-11 14:57:12 +000020#ifdef HAVE_ERRNO_H
Thomas Wouters477c8d52006-05-27 19:21:47 +000021#include <errno.h>
22#endif
23
/* Static overflow check values for bases 2 through 36.
 * smallmax[base] is the largest unsigned long i such that
 * i * base doesn't overflow unsigned long.
 * The table is indexed directly by base, so entries 0 and 1 are
 * placeholders.  It is only ever read, hence const.
 */
static const unsigned long smallmax[] = {
    0, /* bases 0 and 1 are invalid */
    0,
    ULONG_MAX / 2,
    ULONG_MAX / 3,
    ULONG_MAX / 4,
    ULONG_MAX / 5,
    ULONG_MAX / 6,
    ULONG_MAX / 7,
    ULONG_MAX / 8,
    ULONG_MAX / 9,
    ULONG_MAX / 10,
    ULONG_MAX / 11,
    ULONG_MAX / 12,
    ULONG_MAX / 13,
    ULONG_MAX / 14,
    ULONG_MAX / 15,
    ULONG_MAX / 16,
    ULONG_MAX / 17,
    ULONG_MAX / 18,
    ULONG_MAX / 19,
    ULONG_MAX / 20,
    ULONG_MAX / 21,
    ULONG_MAX / 22,
    ULONG_MAX / 23,
    ULONG_MAX / 24,
    ULONG_MAX / 25,
    ULONG_MAX / 26,
    ULONG_MAX / 27,
    ULONG_MAX / 28,
    ULONG_MAX / 29,
    ULONG_MAX / 30,
    ULONG_MAX / 31,
    ULONG_MAX / 32,
    ULONG_MAX / 33,
    ULONG_MAX / 34,
    ULONG_MAX / 35,
    ULONG_MAX / 36,
};
67
68/* maximum digits that can't ever overflow for bases 2 through 36,
69 * calculated by [int(math.floor(math.log(2**32, i))) for i in range(2, 37)].
70 * Note that this is pessimistic if sizeof(long) > 4.
71 */
Thomas Wouters0e3f5912006-08-11 14:57:12 +000072#if SIZEOF_LONG == 4
Thomas Wouters477c8d52006-05-27 19:21:47 +000073static int digitlimit[] = {
74 0, 0, 32, 20, 16, 13, 12, 11, 10, 10, /* 0 - 9 */
75 9, 9, 8, 8, 8, 8, 8, 7, 7, 7, /* 10 - 19 */
76 7, 7, 7, 7, 6, 6, 6, 6, 6, 6, /* 20 - 29 */
77 6, 6, 6, 6, 6, 6, 6}; /* 30 - 36 */
Thomas Wouters0e3f5912006-08-11 14:57:12 +000078#elif SIZEOF_LONG == 8
79/* [int(math.floor(math.log(2**64, i))) for i in range(2, 37)] */
80static int digitlimit[] = {
81 0, 0, 64, 40, 32, 27, 24, 22, 21, 20, /* 0 - 9 */
82 19, 18, 17, 17, 16, 16, 16, 15, 15, 15, /* 10 - 19 */
83 14, 14, 14, 14, 13, 13, 13, 13, 13, 13, /* 20 - 29 */
84 13, 12, 12, 12, 12, 12, 12}; /* 30 - 36 */
85#else
86#error "Need table for SIZEOF_LONG"
87#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000088
Guido van Rossumbe0e9421993-12-24 10:32:00 +000089/*
90** strtoul
91** This is a general purpose routine for converting
92** an ascii string to an integer in an arbitrary base.
93** Leading white space is ignored. If 'base' is zero
Guido van Rossumcd16bf62007-06-13 18:07:49 +000094** it looks for a leading 0b, 0o or 0x to tell which
Guido van Rossumbe0e9421993-12-24 10:32:00 +000095** base. If these are absent it defaults to 10.
96** Base must be 0 or between 2 and 36 (inclusive).
97** If 'ptr' is non-NULL it will contain a pointer to
98** the end of the scan.
99** Errors due to bad pointers will probably result in
100** exceptions - we don't check for them.
101*/
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000102unsigned long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000103PyOS_strtoul(register char *str, char **ptr, int base)
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000104{
Thomas Wouters477c8d52006-05-27 19:21:47 +0000105 register unsigned long result = 0; /* return value of the function */
106 register int c; /* current input character */
107 register int ovlimit; /* required digits to overflow */
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000108
Thomas Wouters477c8d52006-05-27 19:21:47 +0000109 /* skip leading white space */
110 while (*str && isspace(Py_CHARMASK(*str)))
111 ++str;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000112
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000113 /* check for leading 0b, 0o or 0x for auto-base or base 16 */
Thomas Wouters477c8d52006-05-27 19:21:47 +0000114 switch (base) {
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000115 case 0: /* look for leading 0b, 0o or 0x */
116 if (*str == '0') {
117 ++str;
118 if (*str == 'x' || *str == 'X') {
Georg Brandlfceab5a2008-01-19 20:08:23 +0000119 /* there must be at least one digit after 0x */
120 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
121 if (ptr)
122 *ptr = str;
123 return 0;
124 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000125 ++str;
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000126 base = 16;
127 } else if (*str == 'o' || *str == 'O') {
Georg Brandlfceab5a2008-01-19 20:08:23 +0000128 /* there must be at least one digit after 0o */
129 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
130 if (ptr)
131 *ptr = str;
132 return 0;
133 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000134 ++str;
135 base = 8;
136 } else if (*str == 'b' || *str == 'B') {
Georg Brandlfceab5a2008-01-19 20:08:23 +0000137 /* there must be at least one digit after 0b */
138 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
139 if (ptr)
140 *ptr = str;
141 return 0;
142 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000143 ++str;
144 base = 2;
145 } else {
146 /* skip all zeroes... */
147 while (*str == '0')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000148 ++str;
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000149 while (isspace(Py_CHARMASK(*str)))
150 ++str;
151 if (ptr)
152 *ptr = str;
153 return 0;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000154 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000155 }
156 else
157 base = 10;
158 break;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000159
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000160 /* even with explicit base, skip leading 0? prefix */
161 case 16:
162 if (*str == '0') {
163 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000164 if (*str == 'x' || *str == 'X') {
165 /* there must be at least one digit after 0x */
166 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
167 if (ptr)
168 *ptr = str;
169 return 0;
170 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000171 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000172 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000173 }
174 break;
175 case 8:
176 if (*str == '0') {
177 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000178 if (*str == 'o' || *str == 'O') {
179 /* there must be at least one digit after 0o */
180 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
181 if (ptr)
182 *ptr = str;
183 return 0;
184 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000185 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000186 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000187 }
188 break;
189 case 2:
190 if(*str == '0') {
191 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000192 if (*str == 'b' || *str == 'B') {
193 /* there must be at least one digit after 0b */
194 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
195 if (ptr)
196 *ptr = str;
197 return 0;
198 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000199 ++str;
Georg Brandlfceab5a2008-01-19 20:08:23 +0000200 }
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000201 }
202 break;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000203 }
204
205 /* catch silly bases */
206 if (base < 2 || base > 36) {
207 if (ptr)
208 *ptr = str;
209 return 0;
210 }
211
212 /* skip leading zeroes */
213 while (*str == '0')
214 ++str;
215
216 /* base is guaranteed to be in [2, 36] at this point */
217 ovlimit = digitlimit[base];
218
219 /* do the conversion until non-digit character encountered */
220 while ((c = _PyLong_DigitValue[Py_CHARMASK(*str)]) < base) {
221 if (ovlimit > 0) /* no overflow check required */
222 result = result * base + c;
223 else { /* requires overflow check */
224 register unsigned long temp_result;
225
226 if (ovlimit < 0) /* guaranteed overflow */
227 goto overflowed;
228
229 /* there could be an overflow */
230 /* check overflow just from shifting */
231 if (result > smallmax[base])
232 goto overflowed;
233
234 result *= base;
235
236 /* check overflow from the digit's value */
237 temp_result = result + c;
238 if (temp_result < result)
239 goto overflowed;
240
241 result = temp_result;
242 }
243
244 ++str;
245 --ovlimit;
246 }
247
248 /* set pointer to point to the last character scanned */
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000249 if (ptr)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000250 *ptr = str;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000251
Thomas Wouters477c8d52006-05-27 19:21:47 +0000252 return result;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000253
Thomas Wouters477c8d52006-05-27 19:21:47 +0000254overflowed:
255 if (ptr) {
256 /* spool through remaining digit characters */
257 while (_PyLong_DigitValue[Py_CHARMASK(*str)] < base)
258 ++str;
259 *ptr = str;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000260 }
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000261 errno = ERANGE;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000262 return (unsigned long)-1;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000263}
264
/* Checking for overflow in PyOS_strtol is a PITA; see comments
 * about PY_ABS_LONG_MIN in longobject.c.
 * PY_ABS_LONG_MIN is the magnitude of LONG_MIN as an unsigned long.  It is
 * computed in unsigned arithmetic because negating LONG_MIN as a signed
 * long would overflow.
 */
#define PY_ABS_LONG_MIN (0-(unsigned long)LONG_MIN)
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000269
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000270long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000271PyOS_strtol(char *str, char **ptr, int base)
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000272{
273 long result;
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000274 unsigned long uresult;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000275 char sign;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000276
Guido van Rossum7f7f2741995-02-10 17:01:56 +0000277 while (*str && isspace(Py_CHARMASK(*str)))
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000278 str++;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000279
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000280 sign = *str;
281 if (sign == '+' || sign == '-')
282 str++;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000283
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000284 uresult = PyOS_strtoul(str, ptr, base);
Thomas Wouters477c8d52006-05-27 19:21:47 +0000285
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000286 if (uresult <= (unsigned long)LONG_MAX) {
287 result = (long)uresult;
288 if (sign == '-')
289 result = -result;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000290 }
Thomas Wouters89f507f2006-12-13 04:49:30 +0000291 else if (sign == '-' && uresult == PY_ABS_LONG_MIN) {
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000292 result = LONG_MIN;
293 }
294 else {
295 errno = ERANGE;
296 result = LONG_MAX;
297 }
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000298 return result;
299}