mystrtoul.c 6.37 KB
Newer Older
Guido van Rossum's avatar
Guido van Rossum committed
1

Guido van Rossum's avatar
Guido van Rossum committed
2
#include "Python.h"
3

4 5 6 7
#if defined(__sgi) && defined(WITH_THREAD) && !defined(_SGI_MP_SOURCE)
#define _SGI_MP_SOURCE
#endif

8 9
/* strtol and strtoul, renamed to avoid conflicts */

10 11

#include <ctype.h>
12
#ifdef HAVE_ERRNO_H
13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63
#include <errno.h>
#endif

/* Static overflow check values for bases 2 through 36.
 * smallmax[base] is the largest unsigned long i such that
 * i * base doesn't overflow unsigned long.
 */
static unsigned long smallmax[] = {
	0, /* bases 0 and 1 are invalid */
	0,
	ULONG_MAX / 2,
	ULONG_MAX / 3,
	ULONG_MAX / 4,
	ULONG_MAX / 5,
	ULONG_MAX / 6,
	ULONG_MAX / 7,
	ULONG_MAX / 8,
	ULONG_MAX / 9,
	ULONG_MAX / 10,
	ULONG_MAX / 11,
	ULONG_MAX / 12,
	ULONG_MAX / 13,
	ULONG_MAX / 14,
	ULONG_MAX / 15,
	ULONG_MAX / 16,
	ULONG_MAX / 17,
	ULONG_MAX / 18,
	ULONG_MAX / 19,
	ULONG_MAX / 20,
	ULONG_MAX / 21,
	ULONG_MAX / 22,
	ULONG_MAX / 23,
	ULONG_MAX / 24,
	ULONG_MAX / 25,
	ULONG_MAX / 26,
	ULONG_MAX / 27,
	ULONG_MAX / 28,
	ULONG_MAX / 29,
	ULONG_MAX / 30,
	ULONG_MAX / 31,
	ULONG_MAX / 32,
	ULONG_MAX / 33,
	ULONG_MAX / 34,
	ULONG_MAX / 35,
	ULONG_MAX / 36,
};

/* maximum digits that can't ever overflow for bases 2 through 36,
 * calculated by [int(math.floor(math.log(2**32, i))) for i in range(2, 37)].
 * Note that this is pessimistic if sizeof(long) > 4.
 */
64
#if SIZEOF_LONG == 4
65 66 67 68 69
static int digitlimit[] = {
	0,  0, 32, 20, 16, 13, 12, 11, 10, 10,  /*  0 -  9 */
	9,  9,  8,  8,  8,  8,  8,  7,  7,  7,  /* 10 - 19 */
	7,  7,  7,  7,  6,  6,  6,  6,  6,  6,  /* 20 - 29 */
	6,  6,  6,  6,  6,  6,  6};             /* 30 - 36 */
70 71 72 73 74 75 76 77 78 79
#elif SIZEOF_LONG == 8
/* [int(math.floor(math.log(2**64, i))) for i in range(2, 37)] */
static int digitlimit[] = {
	 0,   0, 64, 40, 32, 27, 24, 22, 21, 20,  /*  0 -  9 */
	19,  18, 17, 17, 16, 16, 16, 15, 15, 15,  /* 10 - 19 */
	14,  14, 14, 14, 13, 13, 13, 13, 13, 13,  /* 20 - 29 */
	13,  12, 12, 12, 12, 12, 12};             /* 30 - 36 */
#else
#error "Need table for SIZEOF_LONG"
#endif
80

Guido van Rossum's avatar
Guido van Rossum committed
81 82 83 84 85
/*
**	strtoul
**		This is a general purpose routine for converting
**		an ascii string to an integer in an arbitrary base.
**		Leading white space is ignored.  If 'base' is zero
86 87 88
**		it looks for a leading 0, 0b, 0B, 0o, 0O, 0x or 0X
**		to tell which base.  If these are absent it defaults
**		to 10. Base must be 0 or between 2 and 36 (inclusive).
Guido van Rossum's avatar
Guido van Rossum committed
89 90 91 92 93 94
**		If 'ptr' is non-NULL it will contain a pointer to
**		the end of the scan.
**		Errors due to bad pointers will probably result in
**		exceptions - we don't check for them.
*/
unsigned long
95
PyOS_strtoul(register char *str, char **ptr, int base)
Guido van Rossum's avatar
Guido van Rossum committed
96
{
97 98 99
	register unsigned long result = 0; /* return value of the function */
	register int c;	 	/* current input character */
	register int ovlimit; 	/* required digits to overflow */
Guido van Rossum's avatar
Guido van Rossum committed
100

101 102 103
	/* skip leading white space */
	while (*str && isspace(Py_CHARMASK(*str)))
		++str;
Guido van Rossum's avatar
Guido van Rossum committed
104

105 106
	/* check for leading 0 or 0x for auto-base or base 16 */
	switch (base) {
107
	case 0:		/* look for leading 0, 0b, 0o or 0x */
108 109 110 111
		if (*str == '0') {
			++str;
			if (*str == 'x' || *str == 'X') {
				/* there must be at least one digit after 0x */
112
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
113 114 115
					if (ptr)
						*ptr = str;
					return 0;
116
				}
117 118
				++str;
				base = 16;
119 120
			} else if (*str == 'o' || *str == 'O') {
				/* there must be at least one digit after 0o */
121
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
122 123 124 125 126 127 128 129
					if (ptr)
						*ptr = str;
					return 0;
				}
				++str;
				base = 8;
			} else if (*str == 'b' || *str == 'B') {
				/* there must be at least one digit after 0b */
130
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
131 132 133 134 135 136 137
					if (ptr)
						*ptr = str;
					return 0;
				}
				++str;
				base = 2;
			} else {
138
				base = 8;
139
			}
140 141 142 143 144
		}
		else
			base = 10;
		break;

145 146 147 148 149
	case 2:	/* skip leading 0b or 0B */
		if (*str == '0') {
			++str;
			if (*str == 'b' || *str == 'B') {
				/* there must be at least one digit after 0b */
150
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 2) {
151 152 153 154 155 156 157 158 159 160 161 162 163 164
					if (ptr)
						*ptr = str;
					return 0;
				}
				++str;
			}
		}
		break;

	case 8:	/* skip leading 0o or 0O */
		if (*str == '0') {
			++str;
			if (*str == 'o' || *str == 'O') {
				/* there must be at least one digit after 0o */
165
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 8) {
166 167 168 169 170 171 172 173 174
					if (ptr)
						*ptr = str;
					return 0;
				}
				++str;
			}
		}
		break;

175 176 177 178 179
	case 16:	/* skip leading 0x or 0X */
		if (*str == '0') {
			++str;
			if (*str == 'x' || *str == 'X') {
				/* there must be at least one digit after 0x */
180
				if (_PyLong_DigitValue[Py_CHARMASK(str[1])] >= 16) {
181 182 183 184
					if (ptr)
						*ptr = str;
					return 0;
				}
185 186
				++str;
			}
187 188
		}
		break;
Guido van Rossum's avatar
Guido van Rossum committed
189
	}
190 191 192 193 194 195

	/* catch silly bases */
	if (base < 2 || base > 36) {
		if (ptr)
			*ptr = str;
		return 0;
Guido van Rossum's avatar
Guido van Rossum committed
196
	}
197 198 199 200 201 202 203 204 205

	/* skip leading zeroes */
	while (*str == '0')
		++str;

	/* base is guaranteed to be in [2, 36] at this point */
	ovlimit = digitlimit[base];

	/* do the conversion until non-digit character encountered */
206
	while ((c = _PyLong_DigitValue[Py_CHARMASK(*str)]) < base) {
207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231
		if (ovlimit > 0) /* no overflow check required */
			result = result * base + c;
		else { /* requires overflow check */
			register unsigned long temp_result;

			if (ovlimit < 0) /* guaranteed overflow */
				goto overflowed;

			/* there could be an overflow */
			/* check overflow just from shifting */
			if (result > smallmax[base])
				goto overflowed;

			result *= base;

			/* check overflow from the digit's value */
			temp_result = result + c;
			if (temp_result < result)
				goto overflowed;

			result = temp_result;
		}

		++str;
		--ovlimit;
232
	}
233 234 235 236 237 238 239 240 241 242

	/* set pointer to point to the last character scanned */
	if (ptr)
		*ptr = str;

	return result;

overflowed:
	if (ptr) {
		/* spool through remaining digit characters */
243
		while (_PyLong_DigitValue[Py_CHARMASK(*str)] < base)
244 245
			++str;
		*ptr = str;
246
	}
Guido van Rossum's avatar
Guido van Rossum committed
247
	errno = ERANGE;
248
	return (unsigned long)-1;
Guido van Rossum's avatar
Guido van Rossum committed
249 250
}

251 252
/* Checking for overflow in PyOS_strtol is a PITA; see comments
 * about PY_ABS_LONG_MIN in longobject.c.
253
 */
254
#define PY_ABS_LONG_MIN		(0-(unsigned long)LONG_MIN)
255

Guido van Rossum's avatar
Guido van Rossum committed
256
long
257
PyOS_strtol(char *str, char **ptr, int base)
Guido van Rossum's avatar
Guido van Rossum committed
258 259
{
	long result;
260
	unsigned long uresult;
Guido van Rossum's avatar
Guido van Rossum committed
261
	char sign;
262

Guido van Rossum's avatar
Guido van Rossum committed
263
	while (*str && isspace(Py_CHARMASK(*str)))
Guido van Rossum's avatar
Guido van Rossum committed
264
		str++;
265

Guido van Rossum's avatar
Guido van Rossum committed
266 267 268
	sign = *str;
	if (sign == '+' || sign == '-')
		str++;
269

270
	uresult = PyOS_strtoul(str, ptr, base);
271

272 273 274 275 276
	if (uresult <= (unsigned long)LONG_MAX) {
		result = (long)uresult;
		if (sign == '-')
			result = -result;
	}
277
	else if (sign == '-' && uresult == PY_ABS_LONG_MIN) {
278 279 280
		result = LONG_MIN;
	}
	else {
Guido van Rossum's avatar
Guido van Rossum committed
281
		errno = ERANGE;
282
		result = LONG_MAX;
Guido van Rossum's avatar
Guido van Rossum committed
283 284 285
	}
	return result;
}