1 
2 /* @(#)e_rem_pio2.c 5.1 93/09/24 */
3 /*
4  * ====================================================
5  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
6  *
7  * Developed at SunPro, a Sun Microsystems, Inc. business.
8  * Permission to use, copy, modify, and distribute this
9  * software is freely granted, provided that this notice
10  * is preserved.
11  * ====================================================
12  *
13  */
14 
/* __rem_pio2(x,y)
 *
 * Return the remainder of x rem pi/2 in y[0]+y[1].
 * Arguments too large for the direct reduction are handed to
 * __kernel_rem_pio2().
 */
20 
21 #include "fdlibm.h"
22 
23 #ifdef _NEED_FLOAT64
24 
/*
 * Binary expansion of 2/pi, stored as 66 chunks of 24 bits each
 * (6 hex digits per entry, 396 hex digits / about 476 decimal digits
 * in total).  Entry 0 holds the most significant chunk.  The table is
 * handed to __kernel_rem_pio2() for the reduction of huge arguments.
 */
static const __int32_t two_over_pi[] = {
    0xA2F983, 0x6E4E44, 0x1529FC, 0x2757D1, 0xF534DD, 0xC0DB62, /*  0.. 5 */
    0x95993C, 0x439041, 0xFE5163, 0xABDEBB, 0xC561B7, 0x246E3A, /*  6..11 */
    0x424DD2, 0xE00649, 0x2EEA09, 0xD1921C, 0xFE1DEB, 0x1CB129, /* 12..17 */
    0xA73EE8, 0x8235F5, 0x2EBB44, 0x84E99C, 0x7026B4, 0x5F7E41, /* 18..23 */
    0x3991D6, 0x398353, 0x39F49C, 0x845F8B, 0xBDF928, 0x3B1FF8, /* 24..29 */
    0x97FFDE, 0x05980F, 0xEF2F11, 0x8B5A0A, 0x6D1F6D, 0x367ECF, /* 30..35 */
    0x27CB09, 0xB74F46, 0x3F669E, 0x5FEA2D, 0x7527BA, 0xC7EBE5, /* 36..41 */
    0xF17B3D, 0x0739F7, 0x8A5292, 0xEA6BFB, 0x5FB11F, 0x8D5D08, /* 42..47 */
    0x560330, 0x46FC7B, 0x6BABF0, 0xCFBC20, 0x9AF436, 0x1DA9E3, /* 48..53 */
    0x91615E, 0xE61B08, 0x659985, 0x5F14A0, 0x68408D, 0xFFD880, /* 54..59 */
    0x4D7327, 0x310606, 0x1556CA, 0x73A8C9, 0x60E27B, 0xC08C6B, /* 60..65 */
};
40 
/*
 * High-order 32 bits of the double n*(pi/2) for n = 1..32, indexed by
 * n-1.  __rem_pio2() compares the high word of |x| against the entry for
 * its quotient n to detect arguments that sit close to a multiple of
 * pi/2, where the quick one-step reduction could lose bits to
 * cancellation.
 */
static const __int32_t npio2_hw[] = {
    0x3FF921FB, 0x400921FB, 0x4012D97C, 0x401921FB, /* n =  1.. 4 */
    0x401F6A7A, 0x4022D97C, 0x4025FDBB, 0x402921FB, /* n =  5.. 8 */
    0x402C463A, 0x402F6A7A, 0x4031475C, 0x4032D97C, /* n =  9..12 */
    0x40346B9C, 0x4035FDBB, 0x40378FDB, 0x403921FB, /* n = 13..16 */
    0x403AB41B, 0x403C463A, 0x403DD85A, 0x403F6A7A, /* n = 17..20 */
    0x40407E4C, 0x4041475C, 0x4042106C, 0x4042D97C, /* n = 21..24 */
    0x4043A28C, 0x40446B9C, 0x404534AC, 0x4045FDBB, /* n = 25..28 */
    0x4046C6CB, 0x40478FDB, 0x404858EB, 0x404921FB, /* n = 29..32 */
};
49 
50 /*
51  * invpio2:  53 bits of 2/pi
52  * pio2_1:   first  33 bit of pi/2
53  * pio2_1t:  pi/2 - pio2_1
54  * pio2_2:   second 33 bit of pi/2
55  * pio2_2t:  pi/2 - (pio2_1+pio2_2)
56  * pio2_3:   third  33 bit of pi/2
57  * pio2_3t:  pi/2 - (pio2_1+pio2_2+pio2_3)
58  */
59 
60 static const __float64
61     zero = _F_64(0.00000000000000000000e+00), /* 0x00000000, 0x00000000 */
62     half = _F_64(5.00000000000000000000e-01), /* 0x3FE00000, 0x00000000 */
63     two24 = _F_64(1.67772160000000000000e+07), /* 0x41700000, 0x00000000 */
64     invpio2 = _F_64(6.36619772367581382433e-01), /* 0x3FE45F30, 0x6DC9C883 */
65     pio2_1 = _F_64(1.57079632673412561417e+00), /* 0x3FF921FB, 0x54400000 */
66     pio2_1t = _F_64(6.07710050650619224932e-11), /* 0x3DD0B461, 0x1A626331 */
67     pio2_2 = _F_64(6.07710050630396597660e-11), /* 0x3DD0B461, 0x1A600000 */
68     pio2_2t = _F_64(2.02226624879595063154e-21), /* 0x3BA3198A, 0x2E037073 */
69     pio2_3 = _F_64(2.02226624871116645580e-21), /* 0x3BA3198A, 0x2E000000 */
70     pio2_3t = _F_64(8.47842766036889956997e-32); /* 0x397B839A, 0x252049C1 */
71 
72 __int32_t
__rem_pio2(__float64 x,__float64 * y)73 __rem_pio2(__float64 x, __float64 *y)
74 {
75     __float64 z = _F_64(0.0), w, t, r, fn;
76     __float64 tx[3];
77     __int32_t i, j, n, ix, hx;
78     int e0, nx;
79     __uint32_t low;
80 
81     GET_HIGH_WORD(hx, x); /* high word of x */
82     ix = hx & 0x7fffffff;
83     if (ix <= 0x3fe921fb) /* |x| ~<= pi/4 , no need for reduction */
84     {
85         y[0] = x;
86         y[1] = 0;
87         return 0;
88     }
89     if (ix < 0x4002d97c) { /* |x| < 3pi/4, special case with n=+-1 */
90         if (hx > 0) {
91             z = x - pio2_1;
92             if (ix != 0x3ff921fb) { /* 33+53 bit pi is good enough */
93                 y[0] = z - pio2_1t;
94                 y[1] = (z - y[0]) - pio2_1t;
95             } else { /* near pi/2, use 33+33+53 bit pi */
96                 z -= pio2_2;
97                 y[0] = z - pio2_2t;
98                 y[1] = (z - y[0]) - pio2_2t;
99             }
100             return 1;
101         } else { /* negative x */
102             z = x + pio2_1;
103             if (ix != 0x3ff921fb) { /* 33+53 bit pi is good enough */
104                 y[0] = z + pio2_1t;
105                 y[1] = (z - y[0]) + pio2_1t;
106             } else { /* near pi/2, use 33+33+53 bit pi */
107                 z += pio2_2;
108                 y[0] = z + pio2_2t;
109                 y[1] = (z - y[0]) + pio2_2t;
110             }
111             return -1;
112         }
113     }
114     if (ix <= 0x413921fb) { /* |x| ~<= 2^19*(pi/2), medium size */
115         t = _NAME_64(fabs)(x);
116         n = (__int32_t)(t * invpio2 + half);
117         fn = (__float64)n;
118         r = t - fn * pio2_1;
119         w = fn * pio2_1t; /* 1st round good to 85 bit */
120         if (n < 32 && ix != npio2_hw[n - 1]) {
121             y[0] = r - w; /* quick check no cancellation */
122         } else {
123             __uint32_t high;
124             j = ix >> 20;
125             y[0] = r - w;
126             GET_HIGH_WORD(high, y[0]);
127             i = j - ((high >> 20) & 0x7ff);
128             if (i > 16) { /* 2nd iteration needed, good to 118 */
129                 t = r;
130                 w = fn * pio2_2;
131                 r = t - w;
132                 w = fn * pio2_2t - ((t - r) - w);
133                 y[0] = r - w;
134                 GET_HIGH_WORD(high, y[0]);
135                 i = j - ((high >> 20) & 0x7ff);
136                 if (i > 49) { /* 3rd iteration need, 151 bits acc */
137                     t = r; /* will cover all possible cases */
138                     w = fn * pio2_3;
139                     r = t - w;
140                     w = fn * pio2_3t - ((t - r) - w);
141                     y[0] = r - w;
142                 }
143             }
144         }
145         y[1] = (r - y[0]) - w;
146         if (hx < 0) {
147             y[0] = -y[0];
148             y[1] = -y[1];
149             return -n;
150         } else
151             return n;
152     }
153     /*
154      * all other (large) arguments
155      */
156     if (ix >= 0x7ff00000) { /* x is inf or NaN */
157         y[0] = y[1] = x - x;
158         return 0;
159     }
160     /* set z = scalbn(|x|,ilogb(x)-23) */
161     GET_LOW_WORD(low, x);
162     SET_LOW_WORD(z, low);
163     e0 = (int)((ix >> 20) - 1046); /* e0 = ilogb(z)-23; */
164     SET_HIGH_WORD(z, ix - ((__int32_t)e0 << 20));
165     for (i = 0; i < 2; i++) {
166         tx[i] = (__float64)((__int32_t)(z));
167         z = (z - tx[i]) * two24;
168     }
169     tx[2] = z;
170     nx = 3;
171     while (tx[nx - 1] == zero)
172         nx--; /* skip zero term */
173     n = __kernel_rem_pio2(tx, y, e0, nx, 2, two_over_pi);
174     if (hx < 0) {
175         y[0] = -y[0];
176         y[1] = -y[1];
177         return -n;
178     }
179     return n;
180 }
181 
182 #endif /* _NEED_FLOAT64 */
183