str2int.c source code [MariaDB/strings/str2int.c]

1	/ Copyright (c) 2000 TXT DataKonsult Ab & Monty Program Ab*
2	Copyright (c) 2009-2011, Monty Program Ab
3
4	Redistribution and use in source and binary forms, with or without
5	modification, are permitted provided that the following conditions are
6	met:
7
8	1. Redistributions of source code must retain the above copyright
9	notice, this list of conditions and the following disclaimer.
10
11	2. Redistributions in binary form must the following disclaimer in
12	the documentation and/or other materials provided with the
13	distribution.
14
15	THIS SOFTWARE IS PROVIDED BY <COPYRIGHT HOLDER> ``AS IS'' AND ANY
16	EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17	IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
18	PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL <COPYRIGHT HOLDER> OR
19	CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
20	SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
21	LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
22	USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23	ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24	OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
25	OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26	SUCH DAMAGE.
27	*/
28
29	/*
30	str2int(src, radix, lower, upper, &val)
31	converts the string pointed to by src to an integer and stores it in
32	val. It skips leading spaces and tabs (but not newlines, formfeeds,
33	backspaces), then it accepts an optional sign and a sequence of digits
34	in the specified radix. The result should satisfy lower <= val <= upper.*
35	The result is a pointer to the first character after the number;
36	trailing spaces will NOT be skipped.
37
38	If an error is detected, the result will be NullS, the value put
39	in val will be 0, and errno will be set to
40	EDOM if there are no digits
41	ERANGE if the result would overflow or otherwise fail to lie
42	within the specified bounds.
43	Check that the bounds are right for your machine.
44	This looks amazingly complicated for what you probably thought was an
45	easy task. Coping with integer overflow and the asymmetric range of
46	twos complement machines is anything but easy.
47
48	So that users of atoi and atol can check whether an error occurred,
49	I have taken a wholly unprecedented step: errno is CLEARED if this
50	call has no problems.
51	*/
52
53	#include "strings_def.h"
54	#include <m_ctype.h>
55	#include "my_sys.h" /* defines errno */
56	#include <errno.h>
57
58	#define char_val(X) (X >= '0' && X <= '9' ? X-'0' :\
59	X >= 'A' && X <= 'Z' ? X-'A'+10 :\
60	X >= 'a' && X <= 'z' ? X-'a'+10 :\
61	'\177')
62
63	char str2int(register* const char src, register* int radix, long int lower,
64	long int upper, long int *val)
65	{
66	int sign; / is number negative (+1) or positive (-1) /
67	int n; / number of digits yet to be converted /
68	long limit; / "largest" possible valid input /
69	long scale; / the amount to multiply next digit by /
70	long sofar; / the running value /
71	register int d; / (negative of) next digit /
72	char *start;
73	int digits[`32`]; / Room for numbers /
74
75	/ Make sure val is sensible in case of error /*
76
77	*val = `0`;
78
79	/ Check that the radix is in the range 2..36 /
80
81	#ifndef DBUG_OFF
82	if (radix < `2` \|\| radix > `36`) {
83	errno=EDOM;
84	return NullS;
85	}
86	#endif
87
88	/ The basic problem is: how do we handle the conversion of*
89	a number without resorting to machine-specific code to
90	check for overflow? Obviously, we have to ensure that
91	no calculation can overflow. We are guaranteed that the
92	"lower" and "upper" arguments are valid machine integers.
93	On sign-and-magnitude, twos-complement, and ones-complement
94	machines all, if +\|n\| is representable, so is -\|n\|, but on
95	twos complement machines the converse is not true. So the
96	"maximum" representable number has a negative representative.
97	Limit is set to MY_MIN(-\|lower\|,-\|upper\|); this is the "largest"
98	number we are concerned with. /*
99
100	/ Calculate Limit using Scale as a scratch variable /
101
102	if ((limit = lower) > `0`) limit = -limit;
103	if ((scale = upper) > `0`) scale = -scale;
104	if (scale < limit) limit = scale;
105
106	/ Skip leading spaces and check for a sign.*
107	Note: because on a 2s complement machine MinLong is a valid
108	integer but \|MinLong\| is not, we have to keep the current
109	converted value (and the scale!) as negative* numbers,*
110	so the sign is the opposite of what you might expect.
111	*/
112	while (my_isspace(&my_charset_latin1,*src)) src++;
113	sign = -`1`;
114	if (src == `'+'`) src++; else*
115	if (*src == `'-'`) src++, sign = `1`;
116
117	/ Skip leading zeros so that we never compute a power of radix*
118	in scale that we won't have a need for. Otherwise sticking
119	enough 0s in front of a number could cause the multiplication
120	to overflow when it neededn't.
121	*/
122	start=(char*) src;
123	while (*src == `'0'`) src++;
124
125	/ Move over the remaining digits. We have to convert from left*
126	to left in order to avoid overflow. Answer is after last digit.
127	*/
128
129	for (n = `0`; (digits[n]=char_val(*src)) < radix && n < `20`; n++,src++) ;
130
131	/ Check that there is at least one digit /
132
133	if (start == src) {
134	errno=EDOM;
135	return NullS;
136	}
137
138	/ The invariant we want to maintain is that src is just*
139	to the right of n digits, we've converted k digits to
140	sofar, scale = -radixk, and scale < sofar < 0. Now
141	if the final number is to be within the original
142	Limit, we must have (to the left)scale+sofar >= Limit,*
143	or (to the left)scale >= Limit-sofar, i.e. the digits*
144	to the left of src must form an integer <= (Limit-sofar)/(scale).
145	In particular, this is true of the next digit. In our
146	incremental calculation of Limit,
147
148	IT IS VITAL that (-\|N\|)/(-\|D\|) = \|N\|/\|D\|
149	*/
150
151	for (sofar = `0`, scale = -`1`; --n >= `1`;)
152	{
153	if ((long) -(d=digits[n]) < limit) {
154	errno=ERANGE;
155	return NullS;
156	}
157	limit = (limit+d)/radix, sofar += dscale; scale = radix;
158	}
159	if (n == `0`)
160	{
161	if ((long) -(d=digits[n]) < limit) / get last digit /
162	{
163	errno=ERANGE;
164	return NullS;
165	}
166	sofar+=d*scale;
167	}
168
169	/ Now it might still happen that sofar = -32768 or its equivalent,*
170	so we can't just multiply by the sign and check that the result
171	is in the range lower..upper. All of this caution is a right
172	pain in the neck. If only there were a standard routine which
173	says generate thus and such a signal on integer overflow...
174	But not enough machines can do it SIGH.
175	*/
176	if (sign < `0`)
177	{
178	if (sofar < -LONG_MAX \|\| (sofar= -sofar) > upper)
179	{
180	errno=ERANGE;
181	return NullS;
182	}
183	}
184	else if (sofar < lower)
185	{
186	errno=ERANGE;
187	return NullS;
188	}
189	*val = sofar;
190	errno=`0`; / indicate that all went well /
191	return (char*) src;
192	}
193
194	/ These are so slow compared with ordinary, optimized atoi /
195
196	#ifdef WANT_OUR_ATOI
197
198	int atoi(const char *src)
199	{
200	long val;
201	str2int(src, `10`, (long) INT_MIN, (long) INT_MAX, &val);
202	return (int) val;
203	}
204
205
206	long atol(const char *src)
207	{
208	long val;
209	str2int(src, `10`, LONG_MIN, LONG_MAX, &val);
210	return val;
211	}
212
213	#endif /* WANT_OUR_ATOI */
214

Browse the source code of MariaDB/strings/str2int.c