1 /*
2 FUNCTION
3 <<wcstol>>, <<wcstol_l>>---wide string to long
4
5 INDEX
6 wcstol
7
8 INDEX
9 wcstol_l
10
11 INDEX
12 _wcstol_r
13
14 SYNOPSIS
15 #include <wchar.h>
16 long wcstol(const wchar_t *__restrict <[s]>,
17 wchar_t **__restrict <[ptr]>, int <[base]>);
18
19 #include <wchar.h>
20 long wcstol_l(const wchar_t *__restrict <[s]>,
21 wchar_t **__restrict <[ptr]>, int <[base]>,
22 locale_t <[locale]>);
23
24 long _wcstol_r(void *<[reent]>, const wchar_t *<[s]>,
25 wchar_t **<[ptr]>, int <[base]>);
26
27 DESCRIPTION
28 The function <<wcstol>> converts the wide string <<*<[s]>>> to
29 a <<long>>. First, it breaks down the string into three parts:
30 leading whitespace, which is ignored; a subject string consisting
31 of characters resembling an integer in the radix specified by <[base]>;
32 and a trailing portion consisting of zero or more unparseable characters,
33 and always including the terminating null character. Then, it attempts
34 to convert the subject string into a <<long>> and returns the
35 result.
36
37 If the value of <[base]> is 0, the subject string is expected to look
38 like a normal C integer constant: an optional sign, a possible `<<0x>>'
39 indicating a hexadecimal base, and a number. If <[base]> is between
40 2 and 36, the expected form of the subject is a sequence of letters
41 and digits representing an integer in the radix specified by <[base]>,
42 with an optional plus or minus sign. The letters <<a>>--<<z>> (or,
43 equivalently, <<A>>--<<Z>>) are used to signify values from 10 to 35;
44 only letters whose ascribed values are less than <[base]> are
45 permitted. If <[base]> is 16, a leading <<0x>> is permitted.
46
47 The subject sequence is the longest initial sequence of the input
48 string that has the expected form, starting with the first
49 non-whitespace character. If the string is empty or consists entirely
50 of whitespace, or if the first non-whitespace character is not a
51 permissible letter or digit, the subject string is empty.
52
53 If the subject string is acceptable, and the value of <[base]> is zero,
54 <<wcstol>> attempts to determine the radix from the input string. A
55 string with a leading <<0x>> is treated as a hexadecimal value; a string with
56 a leading 0 and no <<x>> is treated as octal; all other strings are
57 treated as decimal. If <[base]> is between 2 and 36, it is used as the
58 conversion radix, as described above. If the subject string begins with
59 a minus sign, the value is negated. Finally, a pointer to the first
60 character past the converted subject string is stored in <[ptr]>, if
61 <[ptr]> is not <<NULL>>.
62
63 If the subject string is empty (or not in acceptable form), no conversion
64 is performed and the value of <[s]> is stored in <[ptr]> (if <[ptr]> is
65 not <<NULL>>).
66
67 The alternate function <<_wcstol_r>> is a reentrant version. The
68 extra argument <[reent]> is a pointer to a reentrancy structure.
69
<<wcstol_l>> is like <<wcstol>> but performs the conversion based on the
locale specified by the locale object <[locale]>.  If <[locale]> is
LC_GLOBAL_LOCALE or not a valid locale object, the behaviour is undefined.
73
74 RETURNS
75 <<wcstol>>, <<wcstol_l>> return the converted value, if any. If no
76 conversion was made, 0 is returned.
77
<<wcstol>>, <<wcstol_l>> return <<LONG_MAX>> or <<LONG_MIN>> if the
magnitude of the converted value is too large, and set <<errno>>
to <<ERANGE>>.
81
82 PORTABILITY
83 <<wcstol>> is ANSI.
84 <<wcstol_l>> is a GNU extension.
85
86 No supporting OS subroutines are required.
87 */
88
89 /*-
90 * Copyright (c) 1990 The Regents of the University of California.
91 * All rights reserved.
92 *
93 * Redistribution and use in source and binary forms, with or without
94 * modification, are permitted provided that the following conditions
95 * are met:
96 * 1. Redistributions of source code must retain the above copyright
97 * notice, this list of conditions and the following disclaimer.
98 * 2. Redistributions in binary form must reproduce the above copyright
99 * notice, this list of conditions and the following disclaimer in the
100 * documentation and/or other materials provided with the distribution.
101 * 3. Neither the name of the University nor the names of its contributors
102 * may be used to endorse or promote products derived from this software
103 * without specific prior written permission.
104 *
105 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
106 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
107 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
108 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
109 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
110 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
111 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
112 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
113 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
114 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
115 * SUCH DAMAGE.
116 */
117
118
119 #define _GNU_SOURCE
120 #include <limits.h>
121 #include <wctype.h>
122 #include <errno.h>
123 #include <wchar.h>
124 #include "../locale/setlocale.h"
125
/*
 * Return the numeric value of a wide digit character: L'0'..L'9' map to
 * 0..9, and L'a'..L'z' / L'A'..L'Z' map to 10..35.  Any other character
 * yields -1.  The caller is responsible for comparing against the radix.
 */
static int
wcstol_digit_value (wchar_t c)
{
	if (c >= L'0' && c <= L'9')
		return (int) (c - L'0');
	if (c >= L'A' && c <= L'Z')
		return (int) (c - L'A') + 10;
	if (c >= L'a' && c <= L'z')
		return (int) (c - L'a') + 10;
	return -1;
}

/*
 * Convert a wide string to a long integer.
 *
 * nptr    wide string to parse; leading characters for which
 *         iswspace_l (c, loc) is true are skipped.
 * endptr  if not NULL, receives a pointer to the first character that was
 *         not consumed, or nptr itself when no digits were converted.
 * base    conversion radix; 0 selects hexadecimal, octal or decimal from
 *         the prefix of the input, and 16 accepts an optional 0x/0X prefix.
 * loc     locale object, used only for the whitespace classification.
 *
 * Returns the converted value.  If the magnitude is too large, returns
 * LONG_MAX (or LONG_MIN for negative input) and sets errno to ERANGE.
 * Returns 0 if no conversion could be performed.
 */
long
wcstol_l (const wchar_t *nptr, wchar_t **endptr,
	  int base, locale_t loc)
{
	const wchar_t *s = nptr;
	unsigned long acc = 0;
	unsigned long cutoff;
	wchar_t c;
	int neg = 0;
	int any = 0;
	int cutlim;
	int digit;

	/*
	 * Skip white space and pick up leading +/- sign if any.
	 * If base is 0, allow 0x for hex and 0 for octal, else
	 * assume decimal; if base is already 16, allow 0x.
	 */
	do {
		c = *s++;
	} while (iswspace_l (c, loc));
	if (c == L'-') {
		neg = 1;
		c = *s++;
	} else if (c == L'+') {
		c = *s++;
	}

	if ((base == 0 || base == 16)
	    && c == L'0' && (*s == L'x' || *s == L'X')) {
		/*
		 * Only treat "0x" as a prefix when a hexadecimal digit
		 * follows it.  Otherwise the subject sequence is just the
		 * "0", and the end pointer must be left on the 'x'.
		 * Reading s[1] is safe: *s is 'x'/'X', so s[1] is at worst
		 * the terminating null character.
		 */
		digit = wcstol_digit_value (s[1]);
		if (digit >= 0 && digit < 16) {
			c = s[1];
			s += 2;
			base = 16;
		}
	}
	if (base == 0)
		base = c == L'0' ? 8 : 10;

	/*
	 * Compute the cutoff value between legal numbers and illegal
	 * numbers.  That is the largest legal value, divided by the
	 * base.  An input number that is greater than this value, if
	 * followed by a legal input character, is too big.  One that
	 * is equal to this value may be valid or not; the limit
	 * between valid and invalid numbers is then based on the last
	 * digit.  For instance, if the range for longs is
	 * [-2147483648..2147483647] and the input base is 10,
	 * cutoff will be set to 214748364 and cutlim to either
	 * 7 (neg==0) or 8 (neg==1), meaning that if we have accumulated
	 * a value > 214748364, or equal but the next digit is > 7 (or 8),
	 * the number is too big, and we will return a range error.
	 *
	 * Set any if any `digits' consumed; make it negative to indicate
	 * overflow.
	 */
	cutoff = neg ? -(unsigned long) LONG_MIN : LONG_MAX;
	cutlim = cutoff % (unsigned long) base;
	cutoff /= (unsigned long) base;

	for (;; c = *s++) {
		digit = wcstol_digit_value (c);
		if (digit < 0 || digit >= base)
			break;
		if (any < 0 || acc > cutoff
		    || (acc == cutoff && digit > cutlim)) {
			/* Keep consuming digits, but remember the overflow. */
			any = -1;
		} else {
			any = 1;
			acc *= base;
			acc += digit;
		}
	}

	if (any < 0) {
		acc = neg ? LONG_MIN : LONG_MAX;
		/*
		 * This function has no reentrancy pointer, so report the
		 * range error through errno directly.
		 */
		errno = ERANGE;
	} else if (neg) {
		acc = -acc;
	}

	/* s is one past the character that stopped the scan. */
	if (endptr != 0)
		*endptr = (wchar_t *) (any ? s - 1 : nptr);
	return (acc);
}
209
210
/*
 * Convert a wide string to a long integer by passing the result of
 * __get_current_locale () to wcstol_l as the locale argument.
 * The arguments and the return value are those of wcstol_l.
 */
long
wcstol (const wchar_t *__restrict s, wchar_t **__restrict ptr, int base)
{
	locale_t current = __get_current_locale ();

	return wcstol_l (s, ptr, base, current);
}
218