1 /*
2 FUNCTION
3    <<wcstoll>>, <<wcstoll_l>>---wide string to long long
4 
5 INDEX
6 	wcstoll
7 
8 INDEX
9 	wcstoll_l
10 
11 INDEX
12 	_wcstoll_r
13 
14 SYNOPSIS
15 	#include <wchar.h>
16         long long wcstoll(const wchar_t *__restrict <[s]>,
17 			  wchar_t **__restrict <[ptr]>,int <[base]>);
18 
19 	#include <wchar.h>
20         long long wcstoll_l(const wchar_t *__restrict <[s]>,
21 			    wchar_t **__restrict <[ptr]>, int <[base]>,
22 			    locale_t <[locale]>);
23 
24         long long _wcstoll_r(void *<[reent]>, const wchar_t *<[s]>,
25 			     wchar_t **<[ptr]>, int <[base]>);
26 
27 DESCRIPTION
28 The function <<wcstoll>> converts the wide string <<*<[s]>>> to
29 a <<long long>>. First, it breaks down the string into three parts:
30 leading whitespace, which is ignored; a subject string consisting
31 of characters resembling an integer in the radix specified by <[base]>;
32 and a trailing portion consisting of zero or more unparseable characters,
33 and always including the terminating null character. Then, it attempts
34 to convert the subject string into a <<long long>> and returns the
35 result.
36 
37 If the value of <[base]> is 0, the subject string is expected to look
38 like a normal C integer constant: an optional sign, a possible `<<0x>>'
39 indicating a hexadecimal base, and a number. If <[base]> is between
40 2 and 36, the expected form of the subject is a sequence of letters
41 and digits representing an integer in the radix specified by <[base]>,
42 with an optional plus or minus sign. The letters <<a>>--<<z>> (or,
43 equivalently, <<A>>--<<Z>>) are used to signify values from 10 to 35;
44 only letters whose ascribed values are less than <[base]> are
45 permitted. If <[base]> is 16, a leading <<0x>> is permitted.
46 
47 The subject sequence is the longest initial sequence of the input
48 string that has the expected form, starting with the first
49 non-whitespace character.  If the string is empty or consists entirely
50 of whitespace, or if the first non-whitespace character is not a
51 permissible letter or digit, the subject string is empty.
52 
53 If the subject string is acceptable, and the value of <[base]> is zero,
54 <<wcstoll>> attempts to determine the radix from the input string. A
55 string with a leading <<0x>> is treated as a hexadecimal value; a string with
56 a leading 0 and no <<x>> is treated as octal; all other strings are
57 treated as decimal. If <[base]> is between 2 and 36, it is used as the
58 conversion radix, as described above. If the subject string begins with
59 a minus sign, the value is negated. Finally, a pointer to the first
60 character past the converted subject string is stored in <[ptr]>, if
61 <[ptr]> is not <<NULL>>.
62 
63 If the subject string is empty (or not in acceptable form), no conversion
64 is performed and the value of <[s]> is stored in <[ptr]> (if <[ptr]> is
65 not <<NULL>>).
66 
67 The alternate function <<_wcstoll_r>> is a reentrant version.  The
68 extra argument <[reent]> is a pointer to a reentrancy structure.
69 
<<wcstoll_l>> is like <<wcstoll>> but performs the conversion based on the
locale specified by the locale object <[locale]>.  If <[locale]> is
LC_GLOBAL_LOCALE or not a valid locale object, the behaviour is undefined.
73 
74 RETURNS
75 <<wcstoll>>, <<wcstoll_l>> return the converted value, if any. If no
76 conversion was made, 0 is returned.
77 
<<wcstoll>>, <<wcstoll_l>> return <<LLONG_MAX>> or <<LLONG_MIN>>
if the magnitude of the converted value is too large, and set <<errno>>
to <<ERANGE>>.
81 
82 PORTABILITY
83 <<wcstoll>> is ANSI.
84 <<wcstoll_l>> is a GNU extension.
85 
86 No supporting OS subroutines are required.
87 */
88 
89 /*-
90  * Copyright (c) 1990 The Regents of the University of California.
91  * All rights reserved.
92  *
93  * Redistribution and use in source and binary forms, with or without
94  * modification, are permitted provided that the following conditions
95  * are met:
96  * 1. Redistributions of source code must retain the above copyright
97  *    notice, this list of conditions and the following disclaimer.
98  * 2. Redistributions in binary form must reproduce the above copyright
99  *    notice, this list of conditions and the following disclaimer in the
100  *    documentation and/or other materials provided with the distribution.
101  * 3. Neither the name of the University nor the names of its contributors
102  *    may be used to endorse or promote products derived from this software
103  *    without specific prior written permission.
104  *
105  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
106  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
107  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
108  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
109  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
110  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
111  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
112  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
113  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
114  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
115  * SUCH DAMAGE.
116  */
117 
118 #define _GNU_SOURCE
119 #include <_ansi.h>
120 #include <limits.h>
121 #include <wctype.h>
122 #include <errno.h>
123 #include <wchar.h>
124 #include "../locale/setlocale.h"
125 
126 /*
127  * Convert a wide string to a long long integer.
128  */
129 #ifndef _REENT_ONLY
130 
/*
 * Map a wide character to its digit value: L'0'..L'9' give 0..9,
 * L'A'..L'Z' and L'a'..L'z' give 10..35.  Any other character
 * yields -1.
 */
static int
wcstoll_digit_value (wchar_t c)
{
	if (c >= L'0' && c <= L'9')
		return (int) (c - L'0');
	if (c >= L'A' && c <= L'Z')
		return (int) (c - L'A') + 10;
	if (c >= L'a' && c <= L'z')
		return (int) (c - L'a') + 10;
	return -1;
}

/*
 * Convert the initial part of the wide string nptr to a long long.
 *
 * nptr    wide string to parse; leading characters for which
 *         iswspace_l(c, loc) is true are skipped, then an optional
 *         '+' or '-' sign is accepted.
 * endptr  if not NULL, receives a pointer to the first character
 *         after the converted digits, or nptr itself when no digit
 *         was converted.
 * base    0, or a radix in 2..36.  With base 0 the radix is taken
 *         from the prefix: "0x"/"0X" means 16, a leading "0" means 8,
 *         anything else means 10.  With base 16 an optional
 *         "0x"/"0X" prefix is skipped.
 * loc     locale object handed to iswspace_l().
 *
 * Returns the converted value, or 0 if no conversion was performed.
 * If the value does not fit, LLONG_MAX or LLONG_MIN (by sign) is
 * returned and errno is set to ERANGE.  If base is not 0 or 2..36,
 * 0 is returned, nptr is stored through endptr and errno is set to
 * EINVAL.
 */
long long
wcstoll_l (const wchar_t *nptr, wchar_t **endptr,
	    int base, locale_t loc)
{
	const wchar_t *s = nptr;
	unsigned long long acc = 0;
	unsigned long long cutoff;
	long long result;
	wchar_t c;
	int neg = 0;
	int any = 0;
	int cutlim;
	int digit;

	/* Radixes other than 0 and 2..36 have no defined digit set. */
	if (base < 0 || base == 1 || base > 36) {
		errno = EINVAL;
		if (endptr != NULL)
			*endptr = (wchar_t *) nptr;
		return 0;
	}

	/*
	 * Skip white space and pick up leading +/- sign if any.
	 * s always points one past the character held in c.
	 */
	do {
		c = *s++;
	} while (iswspace_l(c, loc));
	if (c == L'-') {
		neg = 1;
		c = *s++;
	} else if (c == L'+')
		c = *s++;

	/*
	 * Accept a "0x"/"0X" prefix only when a hexadecimal digit
	 * follows it.  Otherwise the subject sequence is just the "0"
	 * and the 'x' must be left unconsumed, so that e.g. "0xg"
	 * converts to 0 with *endptr pointing at the 'x'.
	 */
	if ((base == 0 || base == 16) &&
	    c == L'0' && (*s == L'x' || *s == L'X')) {
		digit = wcstoll_digit_value (s[1]);
		if (digit >= 0 && digit < 16) {
			c = s[1];
			s += 2;
			base = 16;
		}
	}
	if (base == 0)
		base = c == L'0' ? 8 : 10;

	/*
	 * cutoff is the largest magnitude that can still be multiplied
	 * by base without exceeding the limit for the chosen sign, and
	 * cutlim is the largest digit that may follow when the
	 * accumulator equals cutoff.  For a 32-bit range and base 10
	 * that would be cutoff 214748364 and cutlim 7 (positive) or
	 * 8 (negative).
	 *
	 * any is 1 once a digit has been consumed and -1 once the
	 * value has overflowed; digits keep being consumed after an
	 * overflow so that endptr ends up past the whole number.
	 */
	cutoff = neg ? -(unsigned long long) LLONG_MIN
		     : (unsigned long long) LLONG_MAX;
	cutlim = (int) (cutoff % (unsigned long long) base);
	cutoff /= (unsigned long long) base;
	for (;; c = *s++) {
		digit = wcstoll_digit_value (c);
		if (digit < 0 || digit >= base)
			break;
		if (any < 0 || acc > cutoff ||
		    (acc == cutoff && digit > cutlim))
			any = -1;
		else {
			any = 1;
			acc = acc * (unsigned long long) base
			    + (unsigned long long) digit;
		}
	}

	if (any < 0) {
		errno = ERANGE;
		result = neg ? LLONG_MIN : LLONG_MAX;
	} else if (!neg) {
		result = (long long) acc;
	} else if (acc > (unsigned long long) LLONG_MAX) {
		/* Only reachable for the magnitude of LLONG_MIN itself. */
		result = LLONG_MIN;
	} else {
		result = -(long long) acc;
	}

	if (endptr != NULL)
		*endptr = (wchar_t *) (any ? s - 1 : nptr);
	return result;
}
211 
/*
 * Convert the wide string s to a long long in the given base,
 * storing the end-of-number position through ptr when ptr is not
 * NULL.  This simply forwards to wcstoll_l() with the locale object
 * returned by __get_current_locale().
 */
long long
wcstoll (const wchar_t *__restrict s,
	wchar_t **__restrict ptr,
	int base)
{
	locale_t current = __get_current_locale ();

	return wcstoll_l (s, ptr, base, current);
}
219 
220 #endif
221