/* blob: 19fa57aa144e2ac9f53f22e6cbc92fc7faa0808e */
Guido van Rossumbe0e9421993-12-24 10:32:00 +00001
Guido van Rossum1924a061998-12-18 22:02:37 +00002#include "Python.h"
Guido van Rossumb6775db1994-08-01 11:34:53 +00003
Antoine Pitroua6a4dc82017-09-07 18:56:24 +02004#if defined(__sgi) && !defined(_SGI_MP_SOURCE)
Guido van Rossume32d1531998-07-07 21:32:53 +00005#define _SGI_MP_SOURCE
6#endif
7
Guido van Rossumb6775db1994-08-01 11:34:53 +00008/* strtol and strtoul, renamed to avoid conflicts */
9
Thomas Wouters477c8d52006-05-27 19:21:47 +000010
11#include <ctype.h>
Thomas Wouters0e3f5912006-08-11 14:57:12 +000012#ifdef HAVE_ERRNO_H
Thomas Wouters477c8d52006-05-27 19:21:47 +000013#include <errno.h>
14#endif
15
/* Static overflow check values for bases 2 through 36.
 * smallmax[base] is the largest unsigned long i such that
 * i * base doesn't overflow unsigned long.  The table is indexed
 * directly by the base, so slots 0 and 1 are unused placeholders.
 */
static const unsigned long smallmax[] = {
    0, /* bases 0 and 1 are invalid */
    0,
    ULONG_MAX / 2,
    ULONG_MAX / 3,
    ULONG_MAX / 4,
    ULONG_MAX / 5,
    ULONG_MAX / 6,
    ULONG_MAX / 7,
    ULONG_MAX / 8,
    ULONG_MAX / 9,
    ULONG_MAX / 10,
    ULONG_MAX / 11,
    ULONG_MAX / 12,
    ULONG_MAX / 13,
    ULONG_MAX / 14,
    ULONG_MAX / 15,
    ULONG_MAX / 16,
    ULONG_MAX / 17,
    ULONG_MAX / 18,
    ULONG_MAX / 19,
    ULONG_MAX / 20,
    ULONG_MAX / 21,
    ULONG_MAX / 22,
    ULONG_MAX / 23,
    ULONG_MAX / 24,
    ULONG_MAX / 25,
    ULONG_MAX / 26,
    ULONG_MAX / 27,
    ULONG_MAX / 28,
    ULONG_MAX / 29,
    ULONG_MAX / 30,
    ULONG_MAX / 31,
    ULONG_MAX / 32,
    ULONG_MAX / 33,
    ULONG_MAX / 34,
    ULONG_MAX / 35,
    ULONG_MAX / 36,
};

60/* maximum digits that can't ever overflow for bases 2 through 36,
61 * calculated by [int(math.floor(math.log(2**32, i))) for i in range(2, 37)].
62 * Note that this is pessimistic if sizeof(long) > 4.
63 */
Thomas Wouters0e3f5912006-08-11 14:57:12 +000064#if SIZEOF_LONG == 4
Serhiy Storchaka2d06e842015-12-25 19:53:18 +020065static const int digitlimit[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000066 0, 0, 32, 20, 16, 13, 12, 11, 10, 10, /* 0 - 9 */
67 9, 9, 8, 8, 8, 8, 8, 7, 7, 7, /* 10 - 19 */
68 7, 7, 7, 7, 6, 6, 6, 6, 6, 6, /* 20 - 29 */
69 6, 6, 6, 6, 6, 6, 6}; /* 30 - 36 */
Thomas Wouters0e3f5912006-08-11 14:57:12 +000070#elif SIZEOF_LONG == 8
71/* [int(math.floor(math.log(2**64, i))) for i in range(2, 37)] */
Serhiy Storchaka2d06e842015-12-25 19:53:18 +020072static const int digitlimit[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000073 0, 0, 64, 40, 32, 27, 24, 22, 21, 20, /* 0 - 9 */
74 19, 18, 17, 17, 16, 16, 16, 15, 15, 15, /* 10 - 19 */
75 14, 14, 14, 14, 13, 13, 13, 13, 13, 13, /* 20 - 29 */
76 13, 12, 12, 12, 12, 12, 12}; /* 30 - 36 */
Thomas Wouters0e3f5912006-08-11 14:57:12 +000077#else
78#error "Need table for SIZEOF_LONG"
79#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000080
Guido van Rossumbe0e9421993-12-24 10:32:00 +000081/*
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000082** strtoul
83** This is a general purpose routine for converting
84** an ascii string to an integer in an arbitrary base.
85** Leading white space is ignored. If 'base' is zero
86** it looks for a leading 0b, 0o or 0x to tell which
87** base. If these are absent it defaults to 10.
88** Base must be 0 or between 2 and 36 (inclusive).
89** If 'ptr' is non-NULL it will contain a pointer to
90** the end of the scan.
91** Errors due to bad pointers will probably result in
92** exceptions - we don't check for them.
Guido van Rossumbe0e9421993-12-24 10:32:00 +000093*/
Guido van Rossumbe0e9421993-12-24 10:32:00 +000094unsigned long
Serhiy Storchakac6792272013-10-19 21:03:34 +030095PyOS_strtoul(const char *str, char **ptr, int base)
Guido van Rossumbe0e9421993-12-24 10:32:00 +000096{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +020097 unsigned long result = 0; /* return value of the function */
98 int c; /* current input character */
99 int ovlimit; /* required digits to overflow */
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000100
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000101 /* skip leading white space */
Jordon Xu2ec70102019-09-11 00:04:08 +0800102 while (*str && Py_ISSPACE(*str))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000103 ++str;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000104
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000105 /* check for leading 0b, 0o or 0x for auto-base or base 16 */
106 switch (base) {
107 case 0: /* look for leading 0b, 0o or 0x */
108 if (*str == '0') {
109 ++str;
110 if (*str == 'x' || *str == 'X') {
111 /* there must be at least one digit after 0x */
112 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
113 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300114 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000115 return 0;
116 }
117 ++str;
118 base = 16;
119 } else if (*str == 'o' || *str == 'O') {
120 /* there must be at least one digit after 0o */
121 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
122 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300123 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000124 return 0;
125 }
126 ++str;
127 base = 8;
128 } else if (*str == 'b' || *str == 'B') {
129 /* there must be at least one digit after 0b */
130 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
131 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300132 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000133 return 0;
134 }
135 ++str;
136 base = 2;
137 } else {
138 /* skip all zeroes... */
139 while (*str == '0')
140 ++str;
Jordon Xu2ec70102019-09-11 00:04:08 +0800141 while (Py_ISSPACE(*str))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000142 ++str;
143 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300144 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000145 return 0;
146 }
147 }
148 else
149 base = 10;
150 break;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000151
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000152 /* even with explicit base, skip leading 0? prefix */
153 case 16:
154 if (*str == '0') {
155 ++str;
156 if (*str == 'x' || *str == 'X') {
157 /* there must be at least one digit after 0x */
158 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
159 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300160 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000161 return 0;
162 }
163 ++str;
164 }
165 }
166 break;
167 case 8:
168 if (*str == '0') {
169 ++str;
170 if (*str == 'o' || *str == 'O') {
171 /* there must be at least one digit after 0o */
172 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
173 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300174 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000175 return 0;
176 }
177 ++str;
178 }
179 }
180 break;
181 case 2:
182 if(*str == '0') {
183 ++str;
184 if (*str == 'b' || *str == 'B') {
185 /* there must be at least one digit after 0b */
186 if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
187 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300188 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000189 return 0;
190 }
191 ++str;
192 }
193 }
194 break;
195 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000196
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000197 /* catch silly bases */
198 if (base < 2 || base > 36) {
199 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300200 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000201 return 0;
202 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000203
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000204 /* skip leading zeroes */
205 while (*str == '0')
206 ++str;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000207
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000208 /* base is guaranteed to be in [2, 36] at this point */
209 ovlimit = digitlimit[base];
Thomas Wouters477c8d52006-05-27 19:21:47 +0000210
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000211 /* do the conversion until non-digit character encountered */
212 while ((c = _PyLong_DigitValue[Py_CHARMASK(*str)]) < base) {
213 if (ovlimit > 0) /* no overflow check required */
214 result = result * base + c;
215 else { /* requires overflow check */
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200216 unsigned long temp_result;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000217
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000218 if (ovlimit < 0) /* guaranteed overflow */
219 goto overflowed;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000220
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000221 /* there could be an overflow */
222 /* check overflow just from shifting */
223 if (result > smallmax[base])
224 goto overflowed;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000225
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000226 result *= base;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000227
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000228 /* check overflow from the digit's value */
229 temp_result = result + c;
230 if (temp_result < result)
231 goto overflowed;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000232
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000233 result = temp_result;
234 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000235
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000236 ++str;
237 --ovlimit;
238 }
Thomas Wouters477c8d52006-05-27 19:21:47 +0000239
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000240 /* set pointer to point to the last character scanned */
241 if (ptr)
Serhiy Storchakac6792272013-10-19 21:03:34 +0300242 *ptr = (char *)str;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000243
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000244 return result;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000245
Thomas Wouters477c8d52006-05-27 19:21:47 +0000246overflowed:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000247 if (ptr) {
248 /* spool through remaining digit characters */
249 while (_PyLong_DigitValue[Py_CHARMASK(*str)] < base)
250 ++str;
Serhiy Storchakac6792272013-10-19 21:03:34 +0300251 *ptr = (char *)str;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000252 }
253 errno = ERANGE;
254 return (unsigned long)-1;
Guido van Rossumbe0e9421993-12-24 10:32:00 +0000255}
256
/* Checking for overflow in PyOS_strtol is a PITA; see comments
 * about PY_ABS_LONG_MIN in longobject.c.
 *
 * PY_ABS_LONG_MIN is the magnitude of LONG_MIN as an unsigned long,
 * computed in unsigned arithmetic so that no signed negation is needed.
 */
#define PY_ABS_LONG_MIN         (0-(unsigned long)LONG_MIN)

/*
 * Signed counterpart of PyOS_strtoul.
 *
 * Skips leading white space and an optional '+' or '-' sign, then hands
 * the rest of the string (together with 'ptr' and 'base', unchanged) to
 * PyOS_strtoul and applies the sign to its result.
 *
 * Returns the converted value.  If the magnitude does not fit in a long,
 * errno is set to ERANGE and LONG_MAX is returned -- for negative input
 * as well as positive.
 */
long
PyOS_strtol(const char *str, char **ptr, int base)
{
    long result;
    unsigned long uresult;
    char sign;

    while (*str && Py_ISSPACE(*str))
        str++;

    sign = *str;
    if (sign == '+' || sign == '-')
        str++;

    uresult = PyOS_strtoul(str, ptr, base);

    if (uresult <= (unsigned long)LONG_MAX) {
        /* fits in a long, so negating it cannot overflow either */
        result = (long)uresult;
        if (sign == '-')
            result = -result;
    }
    else if (sign == '-' && uresult == PY_ABS_LONG_MIN) {
        /* the one magnitude above LONG_MAX that is still representable */
        result = LONG_MIN;
    }
    else {
        errno = ERANGE;
        result = LONG_MAX;
    }
    return result;
}