1 /*
2 FUNCTION
3 <<wcstoll>>, <<wcstoll_l>>---wide string to long long
4
5 INDEX
6 wcstoll
7
8 INDEX
9 wcstoll_l
10
11 INDEX
12 _wcstoll_r
13
14 SYNOPSIS
15 #include <wchar.h>
16 long long wcstoll(const wchar_t *__restrict <[s]>,
17 wchar_t **__restrict <[ptr]>,int <[base]>);
18
19 #include <wchar.h>
20 long long wcstoll_l(const wchar_t *__restrict <[s]>,
21 wchar_t **__restrict <[ptr]>, int <[base]>,
22 locale_t <[locale]>);
23
24 long long _wcstoll_r(void *<[reent]>, const wchar_t *<[s]>,
25 wchar_t **<[ptr]>, int <[base]>);
26
27 DESCRIPTION
28 The function <<wcstoll>> converts the wide string <<*<[s]>>> to
29 a <<long long>>. First, it breaks down the string into three parts:
30 leading whitespace, which is ignored; a subject string consisting
31 of characters resembling an integer in the radix specified by <[base]>;
32 and a trailing portion consisting of zero or more unparseable characters,
33 and always including the terminating null character. Then, it attempts
34 to convert the subject string into a <<long long>> and returns the
35 result.
36
37 If the value of <[base]> is 0, the subject string is expected to look
38 like a normal C integer constant: an optional sign, a possible `<<0x>>'
39 indicating a hexadecimal base, and a number. If <[base]> is between
40 2 and 36, the expected form of the subject is a sequence of letters
41 and digits representing an integer in the radix specified by <[base]>,
42 with an optional plus or minus sign. The letters <<a>>--<<z>> (or,
43 equivalently, <<A>>--<<Z>>) are used to signify values from 10 to 35;
44 only letters whose ascribed values are less than <[base]> are
45 permitted. If <[base]> is 16, a leading <<0x>> is permitted.
46
47 The subject sequence is the longest initial sequence of the input
48 string that has the expected form, starting with the first
49 non-whitespace character. If the string is empty or consists entirely
50 of whitespace, or if the first non-whitespace character is not a
51 permissible letter or digit, the subject string is empty.
52
53 If the subject string is acceptable, and the value of <[base]> is zero,
54 <<wcstoll>> attempts to determine the radix from the input string. A
55 string with a leading <<0x>> is treated as a hexadecimal value; a string with
56 a leading 0 and no <<x>> is treated as octal; all other strings are
57 treated as decimal. If <[base]> is between 2 and 36, it is used as the
58 conversion radix, as described above. If the subject string begins with
59 a minus sign, the value is negated. Finally, a pointer to the first
60 character past the converted subject string is stored in <[ptr]>, if
61 <[ptr]> is not <<NULL>>.
62
63 If the subject string is empty (or not in acceptable form), no conversion
64 is performed and the value of <[s]> is stored in <[ptr]> (if <[ptr]> is
65 not <<NULL>>).
66
67 The alternate function <<_wcstoll_r>> is a reentrant version. The
68 extra argument <[reent]> is a pointer to a reentrancy structure.
69
<<wcstoll_l>> is like <<wcstoll>> but performs the conversion based on the
locale specified by the locale object <[locale]>.  If <[locale]> is
LC_GLOBAL_LOCALE or not a valid locale object, the behaviour is undefined.
73
74 RETURNS
75 <<wcstoll>>, <<wcstoll_l>> return the converted value, if any. If no
76 conversion was made, 0 is returned.
77
<<wcstoll>>, <<wcstoll_l>> return <<LLONG_MAX>> or <<LLONG_MIN>>
if the magnitude of the converted value is too large, and set <<errno>>
to <<ERANGE>>.
81
82 PORTABILITY
83 <<wcstoll>> is ANSI.
84 <<wcstoll_l>> is a GNU extension.
85
86 No supporting OS subroutines are required.
87 */
88
89 /*-
90 * Copyright (c) 1990 The Regents of the University of California.
91 * All rights reserved.
92 *
93 * Redistribution and use in source and binary forms, with or without
94 * modification, are permitted provided that the following conditions
95 * are met:
96 * 1. Redistributions of source code must retain the above copyright
97 * notice, this list of conditions and the following disclaimer.
98 * 2. Redistributions in binary form must reproduce the above copyright
99 * notice, this list of conditions and the following disclaimer in the
100 * documentation and/or other materials provided with the distribution.
101 * 3. Neither the name of the University nor the names of its contributors
102 * may be used to endorse or promote products derived from this software
103 * without specific prior written permission.
104 *
105 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
106 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
107 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
108 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
109 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
110 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
111 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
112 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
113 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
114 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
115 * SUCH DAMAGE.
116 */
117
118 #define _GNU_SOURCE
119 #include <_ansi.h>
120 #include <limits.h>
121 #include <wctype.h>
122 #include <errno.h>
123 #include <wchar.h>
124 #include "../locale/setlocale.h"
125
126 /*
127 * Convert a wide string to a long long integer.
128 */
129 #ifndef _REENT_ONLY
130
/*
 * Map a wide character to its digit value: L'0'..L'9' give 0..9 and
 * L'A'..L'Z' / L'a'..L'z' give 10..35.  Any other character gives -1.
 * The caller is responsible for comparing the result against the radix.
 */
static int
wc_digit_value (wchar_t c)
{
	if (c >= L'0' && c <= L'9')
		return (int) (c - L'0');
	if (c >= L'A' && c <= L'Z')
		return (int) (c - L'A') + 10;
	if (c >= L'a' && c <= L'z')
		return (int) (c - L'a') + 10;
	return -1;
}

/*
 * Convert the initial portion of the wide string nptr to a long long.
 *
 * nptr   - wide string to parse; leading characters for which
 *          iswspace_l(c, loc) is true are skipped.
 * endptr - if not NULL, receives a pointer to the first character after
 *          the converted digits, or nptr itself when nothing was converted.
 * base   - conversion radix, 2..36, or 0 to infer it from the prefix
 *          ("0x"/"0X" -> 16, leading "0" -> 8, otherwise 10).
 * loc    - locale object used only for whitespace classification.
 *
 * Returns the converted value, or 0 if no conversion was performed.
 * On overflow returns LLONG_MAX or LLONG_MIN (depending on the sign) and
 * sets errno to ERANGE.  If base is negative, 1, or greater than 36, no
 * conversion is performed and errno is set to EINVAL.
 */
long long
wcstoll_l (const wchar_t *nptr, wchar_t **endptr,
	   int base, locale_t loc)
{
	const wchar_t *s = nptr;
	unsigned long long acc = 0;
	unsigned long long cutoff;
	wchar_t c;
	int neg = 0;
	int any = 0;
	int cutlim;
	int digit;

	/* Reject radices that cannot be represented with 0-9 and a-z. */
	if (base < 0 || base == 1 || base > 36) {
		errno = EINVAL;
		if (endptr != NULL)
			*endptr = (wchar_t *) nptr;
		return 0;
	}

	/*
	 * Skip white space and pick up leading +/- sign if any.
	 * If base is 0, allow 0x for hex and 0 for octal, else
	 * assume decimal; if base is already 16, allow 0x.
	 */
	do {
		c = *s++;
	} while (iswspace_l (c, loc));
	if (c == L'-') {
		neg = 1;
		c = *s++;
	} else if (c == L'+')
		c = *s++;

	/*
	 * Only swallow the "0x" prefix when a hexadecimal digit follows it.
	 * Otherwise (e.g. "0x" or "0xg") the subject sequence is just the
	 * "0", and the end pointer must be left at the 'x'.
	 */
	if ((base == 0 || base == 16) &&
	    c == L'0' && (*s == L'x' || *s == L'X') &&
	    (digit = wc_digit_value (s[1])) >= 0 && digit < 16) {
		c = s[1];
		s += 2;
		base = 16;
	}
	if (base == 0)
		base = c == L'0' ? 8 : 10;

	/*
	 * cutoff is the largest magnitude that can still be multiplied by
	 * base without exceeding the limit (LLONG_MAX, or |LLONG_MIN| for
	 * negative input); cutlim is the largest digit that may follow an
	 * accumulator equal to cutoff.  For a 32-bit range and base 10 this
	 * would be cutoff 214748364 and cutlim 7 (or 8 when negative).
	 *
	 * any becomes 1 once a digit is consumed and -1 on overflow; after
	 * overflow the remaining digits are still consumed so that the end
	 * pointer lands past the whole number.
	 */
	cutoff = neg ? -(unsigned long long) LLONG_MIN : LLONG_MAX;
	cutlim = (int) (cutoff % (unsigned long long) base);
	cutoff /= (unsigned long long) base;
	for (;; c = *s++) {
		digit = wc_digit_value (c);
		if (digit < 0 || digit >= base)
			break;
		if (any < 0 || acc > cutoff || (acc == cutoff && digit > cutlim))
			any = -1;
		else {
			any = 1;
			acc *= base;
			acc += digit;
		}
	}
	if (any < 0) {
		acc = neg ? LLONG_MIN : LLONG_MAX;
		errno = ERANGE;
	} else if (neg)
		acc = -acc;
	/* s is one past the character that stopped the scan. */
	if (endptr != NULL)
		*endptr = (wchar_t *) (any ? s - 1 : nptr);
	return (long long) acc;
}
211
/*
 * Convert the wide string s to a long long in the given base, using the
 * locale object returned by __get_current_locale().  All of the parsing
 * is delegated to wcstoll_l(); ptr and base are passed through unchanged.
 */
long long
wcstoll (const wchar_t *__restrict s,
	 wchar_t **__restrict ptr,
	 int base)
{
	locale_t current = __get_current_locale ();

	return wcstoll_l (s, ptr, base, current);
}
219
220 #endif
221