annotate src/share/vm/runtime/sharedRuntimeTrig.cpp @ 1091:6aa7255741f3

6906727: UseCompressedOops: some card-marking fixes related to object arrays Summary: Introduced a new write_ref_array(HeapWords* start, size_t count) method that does the requisite MemRegion range calculation so (some of the) clients of the erstwhile write_ref_array(MemRegion mr) do not need to worry. This removed all external uses of array_size(), which was also simplified and made private. Asserts were added to catch other possible issues. Further, less essential, fixes stemming from this investigation are deferred to CR 6904516 (to follow shortly in hs17). Reviewed-by: kvn, coleenp, jmasa
author ysr
date Thu, 03 Dec 2009 15:01:57 -0800
parents a61af66fc99e
children fb57d4cf76c2
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
2 * Copyright 2001-2005 Sun Microsystems, Inc. All Rights Reserved.
a61af66fc99e Initial load
duke
parents:
diff changeset
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
a61af66fc99e Initial load
duke
parents:
diff changeset
4 *
a61af66fc99e Initial load
duke
parents:
diff changeset
5 * This code is free software; you can redistribute it and/or modify it
a61af66fc99e Initial load
duke
parents:
diff changeset
6 * under the terms of the GNU General Public License version 2 only, as
a61af66fc99e Initial load
duke
parents:
diff changeset
7 * published by the Free Software Foundation.
a61af66fc99e Initial load
duke
parents:
diff changeset
8 *
a61af66fc99e Initial load
duke
parents:
diff changeset
9 * This code is distributed in the hope that it will be useful, but WITHOUT
a61af66fc99e Initial load
duke
parents:
diff changeset
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
a61af66fc99e Initial load
duke
parents:
diff changeset
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
a61af66fc99e Initial load
duke
parents:
diff changeset
12 * version 2 for more details (a copy is included in the LICENSE file that
a61af66fc99e Initial load
duke
parents:
diff changeset
13 * accompanied this code).
a61af66fc99e Initial load
duke
parents:
diff changeset
14 *
a61af66fc99e Initial load
duke
parents:
diff changeset
15 * You should have received a copy of the GNU General Public License version
a61af66fc99e Initial load
duke
parents:
diff changeset
16 * 2 along with this work; if not, write to the Free Software Foundation,
a61af66fc99e Initial load
duke
parents:
diff changeset
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
a61af66fc99e Initial load
duke
parents:
diff changeset
18 *
a61af66fc99e Initial load
duke
parents:
diff changeset
19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
a61af66fc99e Initial load
duke
parents:
diff changeset
20 * CA 95054 USA or visit www.sun.com if you need additional information or
a61af66fc99e Initial load
duke
parents:
diff changeset
21 * have any questions.
a61af66fc99e Initial load
duke
parents:
diff changeset
22 *
a61af66fc99e Initial load
duke
parents:
diff changeset
23 */
a61af66fc99e Initial load
duke
parents:
diff changeset
24
a61af66fc99e Initial load
duke
parents:
diff changeset
25 #include "incls/_precompiled.incl"
a61af66fc99e Initial load
duke
parents:
diff changeset
26 #include "incls/_sharedRuntimeTrig.cpp.incl"
a61af66fc99e Initial load
duke
parents:
diff changeset
27
a61af66fc99e Initial load
duke
parents:
diff changeset
28 // This file contains copies of the fdlibm routines used by
a61af66fc99e Initial load
duke
parents:
diff changeset
29 // StrictMath. It turns out that it is almost always required to use
a61af66fc99e Initial load
duke
parents:
diff changeset
30 // these runtime routines; the Intel CPU doesn't meet the Java
a61af66fc99e Initial load
duke
parents:
diff changeset
31 // specification for sin/cos outside a certain limited argument range,
a61af66fc99e Initial load
duke
parents:
diff changeset
32 // and the SPARC CPU doesn't appear to have sin/cos instructions. It
a61af66fc99e Initial load
duke
parents:
diff changeset
33 // also turns out that avoiding the indirect call through function
a61af66fc99e Initial load
duke
parents:
diff changeset
34 // pointer out to libjava.so in SharedRuntime speeds these routines up
a61af66fc99e Initial load
duke
parents:
diff changeset
35 // by roughly 15% on both Win32/x86 and Solaris/SPARC.
a61af66fc99e Initial load
duke
parents:
diff changeset
36
a61af66fc99e Initial load
duke
parents:
diff changeset
37 // Enabling optimizations in this file causes incorrect code to be
a61af66fc99e Initial load
duke
parents:
diff changeset
38 // generated; can not figure out how to turn down optimization for one
a61af66fc99e Initial load
duke
parents:
diff changeset
39 // file in the IDE on Windows
a61af66fc99e Initial load
duke
parents:
diff changeset
40 #ifdef WIN32
a61af66fc99e Initial load
duke
parents:
diff changeset
41 # pragma optimize ( "", off )
a61af66fc99e Initial load
duke
parents:
diff changeset
42 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
43
a61af66fc99e Initial load
duke
parents:
diff changeset
44 #include <math.h>
a61af66fc99e Initial load
duke
parents:
diff changeset
45
a61af66fc99e Initial load
duke
parents:
diff changeset
46 // VM_LITTLE_ENDIAN is #defined appropriately in the Makefiles
a61af66fc99e Initial load
duke
parents:
diff changeset
47 // [jk] this is not 100% correct because the float word order may different
a61af66fc99e Initial load
duke
parents:
diff changeset
48 // from the byte order (e.g. on ARM)
a61af66fc99e Initial load
duke
parents:
diff changeset
49 #ifdef VM_LITTLE_ENDIAN
a61af66fc99e Initial load
duke
parents:
diff changeset
50 # define __HI(x) *(1+(int*)&x)
a61af66fc99e Initial load
duke
parents:
diff changeset
51 # define __LO(x) *(int*)&x
a61af66fc99e Initial load
duke
parents:
diff changeset
52 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
53 # define __HI(x) *(int*)&x
a61af66fc99e Initial load
duke
parents:
diff changeset
54 # define __LO(x) *(1+(int*)&x)
a61af66fc99e Initial load
duke
parents:
diff changeset
55 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
56
a61af66fc99e Initial load
duke
parents:
diff changeset
57 static double copysignA(double x, double y) {
a61af66fc99e Initial load
duke
parents:
diff changeset
58 __HI(x) = (__HI(x)&0x7fffffff)|(__HI(y)&0x80000000);
a61af66fc99e Initial load
duke
parents:
diff changeset
59 return x;
a61af66fc99e Initial load
duke
parents:
diff changeset
60 }
a61af66fc99e Initial load
duke
parents:
diff changeset
61
a61af66fc99e Initial load
duke
parents:
diff changeset
62 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
63 * scalbn (double x, int n)
a61af66fc99e Initial load
duke
parents:
diff changeset
64 * scalbn(x,n) returns x* 2**n computed by exponent
a61af66fc99e Initial load
duke
parents:
diff changeset
65 * manipulation rather than by actually performing an
a61af66fc99e Initial load
duke
parents:
diff changeset
66 * exponentiation or a multiplication.
a61af66fc99e Initial load
duke
parents:
diff changeset
67 */
a61af66fc99e Initial load
duke
parents:
diff changeset
68
a61af66fc99e Initial load
duke
parents:
diff changeset
69 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
70 two54 = 1.80143985094819840000e+16, /* 0x43500000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
71 twom54 = 5.55111512312578270212e-17, /* 0x3C900000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
72 hugeX = 1.0e+300,
a61af66fc99e Initial load
duke
parents:
diff changeset
73 tiny = 1.0e-300;
a61af66fc99e Initial load
duke
parents:
diff changeset
74
a61af66fc99e Initial load
duke
parents:
diff changeset
75 static double scalbnA (double x, int n) {
a61af66fc99e Initial load
duke
parents:
diff changeset
76 int k,hx,lx;
a61af66fc99e Initial load
duke
parents:
diff changeset
77 hx = __HI(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
78 lx = __LO(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
79 k = (hx&0x7ff00000)>>20; /* extract exponent */
a61af66fc99e Initial load
duke
parents:
diff changeset
80 if (k==0) { /* 0 or subnormal x */
a61af66fc99e Initial load
duke
parents:
diff changeset
81 if ((lx|(hx&0x7fffffff))==0) return x; /* +-0 */
a61af66fc99e Initial load
duke
parents:
diff changeset
82 x *= two54;
a61af66fc99e Initial load
duke
parents:
diff changeset
83 hx = __HI(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
84 k = ((hx&0x7ff00000)>>20) - 54;
a61af66fc99e Initial load
duke
parents:
diff changeset
85 if (n< -50000) return tiny*x; /*underflow*/
a61af66fc99e Initial load
duke
parents:
diff changeset
86 }
a61af66fc99e Initial load
duke
parents:
diff changeset
87 if (k==0x7ff) return x+x; /* NaN or Inf */
a61af66fc99e Initial load
duke
parents:
diff changeset
88 k = k+n;
a61af66fc99e Initial load
duke
parents:
diff changeset
89 if (k > 0x7fe) return hugeX*copysignA(hugeX,x); /* overflow */
a61af66fc99e Initial load
duke
parents:
diff changeset
90 if (k > 0) /* normal result */
a61af66fc99e Initial load
duke
parents:
diff changeset
91 {__HI(x) = (hx&0x800fffff)|(k<<20); return x;}
a61af66fc99e Initial load
duke
parents:
diff changeset
92 if (k <= -54) {
a61af66fc99e Initial load
duke
parents:
diff changeset
93 if (n > 50000) /* in case integer overflow in n+k */
a61af66fc99e Initial load
duke
parents:
diff changeset
94 return hugeX*copysignA(hugeX,x); /*overflow*/
a61af66fc99e Initial load
duke
parents:
diff changeset
95 else return tiny*copysignA(tiny,x); /*underflow*/
a61af66fc99e Initial load
duke
parents:
diff changeset
96 }
a61af66fc99e Initial load
duke
parents:
diff changeset
97 k += 54; /* subnormal result */
a61af66fc99e Initial load
duke
parents:
diff changeset
98 __HI(x) = (hx&0x800fffff)|(k<<20);
a61af66fc99e Initial load
duke
parents:
diff changeset
99 return x*twom54;
a61af66fc99e Initial load
duke
parents:
diff changeset
100 }
a61af66fc99e Initial load
duke
parents:
diff changeset
101
a61af66fc99e Initial load
duke
parents:
diff changeset
102 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
103 * __kernel_rem_pio2(x,y,e0,nx,prec,ipio2)
a61af66fc99e Initial load
duke
parents:
diff changeset
104 * double x[],y[]; int e0,nx,prec; int ipio2[];
a61af66fc99e Initial load
duke
parents:
diff changeset
105 *
a61af66fc99e Initial load
duke
parents:
diff changeset
106 * __kernel_rem_pio2 return the last three digits of N with
a61af66fc99e Initial load
duke
parents:
diff changeset
107 * y = x - N*pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
108 * so that |y| < pi/2.
a61af66fc99e Initial load
duke
parents:
diff changeset
109 *
a61af66fc99e Initial load
duke
parents:
diff changeset
110 * The method is to compute the integer (mod 8) and fraction parts of
a61af66fc99e Initial load
duke
parents:
diff changeset
111 * (2/pi)*x without doing the full multiplication. In general we
a61af66fc99e Initial load
duke
parents:
diff changeset
112 * skip the part of the product that are known to be a huge integer (
a61af66fc99e Initial load
duke
parents:
diff changeset
113 * more accurately, = 0 mod 8 ). Thus the number of operations are
a61af66fc99e Initial load
duke
parents:
diff changeset
114 * independent of the exponent of the input.
a61af66fc99e Initial load
duke
parents:
diff changeset
115 *
a61af66fc99e Initial load
duke
parents:
diff changeset
116 * (2/pi) is represented by an array of 24-bit integers in ipio2[].
a61af66fc99e Initial load
duke
parents:
diff changeset
117 *
a61af66fc99e Initial load
duke
parents:
diff changeset
118 * Input parameters:
a61af66fc99e Initial load
duke
parents:
diff changeset
119 * x[] The input value (must be positive) is broken into nx
a61af66fc99e Initial load
duke
parents:
diff changeset
120 * pieces of 24-bit integers in double precision format.
a61af66fc99e Initial load
duke
parents:
diff changeset
121 * x[i] will be the i-th 24 bit of x. The scaled exponent
a61af66fc99e Initial load
duke
parents:
diff changeset
122 * of x[0] is given in input parameter e0 (i.e., x[0]*2^e0
a61af66fc99e Initial load
duke
parents:
diff changeset
123 * match x's up to 24 bits.
a61af66fc99e Initial load
duke
parents:
diff changeset
124 *
a61af66fc99e Initial load
duke
parents:
diff changeset
125 * Example of breaking a double positive z into x[0]+x[1]+x[2]:
a61af66fc99e Initial load
duke
parents:
diff changeset
126 * e0 = ilogb(z)-23
a61af66fc99e Initial load
duke
parents:
diff changeset
127 * z = scalbn(z,-e0)
a61af66fc99e Initial load
duke
parents:
diff changeset
128 * for i = 0,1,2
a61af66fc99e Initial load
duke
parents:
diff changeset
129 * x[i] = floor(z)
a61af66fc99e Initial load
duke
parents:
diff changeset
130 * z = (z-x[i])*2**24
a61af66fc99e Initial load
duke
parents:
diff changeset
131 *
a61af66fc99e Initial load
duke
parents:
diff changeset
132 *
a61af66fc99e Initial load
duke
parents:
diff changeset
133 * y[] ouput result in an array of double precision numbers.
a61af66fc99e Initial load
duke
parents:
diff changeset
134 * The dimension of y[] is:
a61af66fc99e Initial load
duke
parents:
diff changeset
135 * 24-bit precision 1
a61af66fc99e Initial load
duke
parents:
diff changeset
136 * 53-bit precision 2
a61af66fc99e Initial load
duke
parents:
diff changeset
137 * 64-bit precision 2
a61af66fc99e Initial load
duke
parents:
diff changeset
138 * 113-bit precision 3
a61af66fc99e Initial load
duke
parents:
diff changeset
139 * The actual value is the sum of them. Thus for 113-bit
a61af66fc99e Initial load
duke
parents:
diff changeset
140 * precsion, one may have to do something like:
a61af66fc99e Initial load
duke
parents:
diff changeset
141 *
a61af66fc99e Initial load
duke
parents:
diff changeset
142 * long double t,w,r_head, r_tail;
a61af66fc99e Initial load
duke
parents:
diff changeset
143 * t = (long double)y[2] + (long double)y[1];
a61af66fc99e Initial load
duke
parents:
diff changeset
144 * w = (long double)y[0];
a61af66fc99e Initial load
duke
parents:
diff changeset
145 * r_head = t+w;
a61af66fc99e Initial load
duke
parents:
diff changeset
146 * r_tail = w - (r_head - t);
a61af66fc99e Initial load
duke
parents:
diff changeset
147 *
a61af66fc99e Initial load
duke
parents:
diff changeset
148 * e0 The exponent of x[0]
a61af66fc99e Initial load
duke
parents:
diff changeset
149 *
a61af66fc99e Initial load
duke
parents:
diff changeset
150 * nx dimension of x[]
a61af66fc99e Initial load
duke
parents:
diff changeset
151 *
a61af66fc99e Initial load
duke
parents:
diff changeset
152 * prec an interger indicating the precision:
a61af66fc99e Initial load
duke
parents:
diff changeset
153 * 0 24 bits (single)
a61af66fc99e Initial load
duke
parents:
diff changeset
154 * 1 53 bits (double)
a61af66fc99e Initial load
duke
parents:
diff changeset
155 * 2 64 bits (extended)
a61af66fc99e Initial load
duke
parents:
diff changeset
156 * 3 113 bits (quad)
a61af66fc99e Initial load
duke
parents:
diff changeset
157 *
a61af66fc99e Initial load
duke
parents:
diff changeset
158 * ipio2[]
a61af66fc99e Initial load
duke
parents:
diff changeset
159 * integer array, contains the (24*i)-th to (24*i+23)-th
a61af66fc99e Initial load
duke
parents:
diff changeset
160 * bit of 2/pi after binary point. The corresponding
a61af66fc99e Initial load
duke
parents:
diff changeset
161 * floating value is
a61af66fc99e Initial load
duke
parents:
diff changeset
162 *
a61af66fc99e Initial load
duke
parents:
diff changeset
163 * ipio2[i] * 2^(-24(i+1)).
a61af66fc99e Initial load
duke
parents:
diff changeset
164 *
a61af66fc99e Initial load
duke
parents:
diff changeset
165 * External function:
a61af66fc99e Initial load
duke
parents:
diff changeset
166 * double scalbn(), floor();
a61af66fc99e Initial load
duke
parents:
diff changeset
167 *
a61af66fc99e Initial load
duke
parents:
diff changeset
168 *
a61af66fc99e Initial load
duke
parents:
diff changeset
169 * Here is the description of some local variables:
a61af66fc99e Initial load
duke
parents:
diff changeset
170 *
a61af66fc99e Initial load
duke
parents:
diff changeset
171 * jk jk+1 is the initial number of terms of ipio2[] needed
a61af66fc99e Initial load
duke
parents:
diff changeset
172 * in the computation. The recommended value is 2,3,4,
a61af66fc99e Initial load
duke
parents:
diff changeset
173 * 6 for single, double, extended,and quad.
a61af66fc99e Initial load
duke
parents:
diff changeset
174 *
a61af66fc99e Initial load
duke
parents:
diff changeset
175 * jz local integer variable indicating the number of
a61af66fc99e Initial load
duke
parents:
diff changeset
176 * terms of ipio2[] used.
a61af66fc99e Initial load
duke
parents:
diff changeset
177 *
a61af66fc99e Initial load
duke
parents:
diff changeset
178 * jx nx - 1
a61af66fc99e Initial load
duke
parents:
diff changeset
179 *
a61af66fc99e Initial load
duke
parents:
diff changeset
180 * jv index for pointing to the suitable ipio2[] for the
a61af66fc99e Initial load
duke
parents:
diff changeset
181 * computation. In general, we want
a61af66fc99e Initial load
duke
parents:
diff changeset
182 * ( 2^e0*x[0] * ipio2[jv-1]*2^(-24jv) )/8
a61af66fc99e Initial load
duke
parents:
diff changeset
183 * is an integer. Thus
a61af66fc99e Initial load
duke
parents:
diff changeset
184 * e0-3-24*jv >= 0 or (e0-3)/24 >= jv
a61af66fc99e Initial load
duke
parents:
diff changeset
185 * Hence jv = max(0,(e0-3)/24).
a61af66fc99e Initial load
duke
parents:
diff changeset
186 *
a61af66fc99e Initial load
duke
parents:
diff changeset
187 * jp jp+1 is the number of terms in PIo2[] needed, jp = jk.
a61af66fc99e Initial load
duke
parents:
diff changeset
188 *
a61af66fc99e Initial load
duke
parents:
diff changeset
189 * q[] double array with integral value, representing the
a61af66fc99e Initial load
duke
parents:
diff changeset
190 * 24-bits chunk of the product of x and 2/pi.
a61af66fc99e Initial load
duke
parents:
diff changeset
191 *
a61af66fc99e Initial load
duke
parents:
diff changeset
192 * q0 the corresponding exponent of q[0]. Note that the
a61af66fc99e Initial load
duke
parents:
diff changeset
193 * exponent for q[i] would be q0-24*i.
a61af66fc99e Initial load
duke
parents:
diff changeset
194 *
a61af66fc99e Initial load
duke
parents:
diff changeset
195 * PIo2[] double precision array, obtained by cutting pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
196 * into 24 bits chunks.
a61af66fc99e Initial load
duke
parents:
diff changeset
197 *
a61af66fc99e Initial load
duke
parents:
diff changeset
198 * f[] ipio2[] in floating point
a61af66fc99e Initial load
duke
parents:
diff changeset
199 *
a61af66fc99e Initial load
duke
parents:
diff changeset
200 * iq[] integer array by breaking up q[] in 24-bits chunk.
a61af66fc99e Initial load
duke
parents:
diff changeset
201 *
a61af66fc99e Initial load
duke
parents:
diff changeset
202 * fq[] final product of x*(2/pi) in fq[0],..,fq[jk]
a61af66fc99e Initial load
duke
parents:
diff changeset
203 *
a61af66fc99e Initial load
duke
parents:
diff changeset
204 * ih integer. If >0 it indicats q[] is >= 0.5, hence
a61af66fc99e Initial load
duke
parents:
diff changeset
205 * it also indicates the *sign* of the result.
a61af66fc99e Initial load
duke
parents:
diff changeset
206 *
a61af66fc99e Initial load
duke
parents:
diff changeset
207 */
a61af66fc99e Initial load
duke
parents:
diff changeset
208
a61af66fc99e Initial load
duke
parents:
diff changeset
209
a61af66fc99e Initial load
duke
parents:
diff changeset
210 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
211 * Constants:
a61af66fc99e Initial load
duke
parents:
diff changeset
212 * The hexadecimal values are the intended ones for the following
a61af66fc99e Initial load
duke
parents:
diff changeset
213 * constants. The decimal values may be used, provided that the
a61af66fc99e Initial load
duke
parents:
diff changeset
214 * compiler will convert from decimal to binary accurately enough
a61af66fc99e Initial load
duke
parents:
diff changeset
215 * to produce the hexadecimal values shown.
a61af66fc99e Initial load
duke
parents:
diff changeset
216 */
a61af66fc99e Initial load
duke
parents:
diff changeset
217
a61af66fc99e Initial load
duke
parents:
diff changeset
218
a61af66fc99e Initial load
duke
parents:
diff changeset
219 static const int init_jk[] = {2,3,4,6}; /* initial value for jk */
a61af66fc99e Initial load
duke
parents:
diff changeset
220
a61af66fc99e Initial load
duke
parents:
diff changeset
221 static const double PIo2[] = {
a61af66fc99e Initial load
duke
parents:
diff changeset
222 1.57079625129699707031e+00, /* 0x3FF921FB, 0x40000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
223 7.54978941586159635335e-08, /* 0x3E74442D, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
224 5.39030252995776476554e-15, /* 0x3CF84698, 0x80000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
225 3.28200341580791294123e-22, /* 0x3B78CC51, 0x60000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
226 1.27065575308067607349e-29, /* 0x39F01B83, 0x80000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
227 1.22933308981111328932e-36, /* 0x387A2520, 0x40000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
228 2.73370053816464559624e-44, /* 0x36E38222, 0x80000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
229 2.16741683877804819444e-51, /* 0x3569F31D, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
230 };
a61af66fc99e Initial load
duke
parents:
diff changeset
231
a61af66fc99e Initial load
duke
parents:
diff changeset
232 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
233 zeroB = 0.0,
a61af66fc99e Initial load
duke
parents:
diff changeset
234 one = 1.0,
a61af66fc99e Initial load
duke
parents:
diff changeset
235 two24B = 1.67772160000000000000e+07, /* 0x41700000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
236 twon24 = 5.96046447753906250000e-08; /* 0x3E700000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
237
a61af66fc99e Initial load
duke
parents:
diff changeset
238 static int __kernel_rem_pio2(double *x, double *y, int e0, int nx, int prec, const int *ipio2) {
a61af66fc99e Initial load
duke
parents:
diff changeset
239 int jz,jx,jv,jp,jk,carry,n,iq[20],i,j,k,m,q0,ih;
a61af66fc99e Initial load
duke
parents:
diff changeset
240 double z,fw,f[20],fq[20],q[20];
a61af66fc99e Initial load
duke
parents:
diff changeset
241
a61af66fc99e Initial load
duke
parents:
diff changeset
242 /* initialize jk*/
a61af66fc99e Initial load
duke
parents:
diff changeset
243 jk = init_jk[prec];
a61af66fc99e Initial load
duke
parents:
diff changeset
244 jp = jk;
a61af66fc99e Initial load
duke
parents:
diff changeset
245
a61af66fc99e Initial load
duke
parents:
diff changeset
246 /* determine jx,jv,q0, note that 3>q0 */
a61af66fc99e Initial load
duke
parents:
diff changeset
247 jx = nx-1;
a61af66fc99e Initial load
duke
parents:
diff changeset
248 jv = (e0-3)/24; if(jv<0) jv=0;
a61af66fc99e Initial load
duke
parents:
diff changeset
249 q0 = e0-24*(jv+1);
a61af66fc99e Initial load
duke
parents:
diff changeset
250
a61af66fc99e Initial load
duke
parents:
diff changeset
251 /* set up f[0] to f[jx+jk] where f[jx+jk] = ipio2[jv+jk] */
a61af66fc99e Initial load
duke
parents:
diff changeset
252 j = jv-jx; m = jx+jk;
a61af66fc99e Initial load
duke
parents:
diff changeset
253 for(i=0;i<=m;i++,j++) f[i] = (j<0)? zeroB : (double) ipio2[j];
a61af66fc99e Initial load
duke
parents:
diff changeset
254
a61af66fc99e Initial load
duke
parents:
diff changeset
255 /* compute q[0],q[1],...q[jk] */
a61af66fc99e Initial load
duke
parents:
diff changeset
256 for (i=0;i<=jk;i++) {
a61af66fc99e Initial load
duke
parents:
diff changeset
257 for(j=0,fw=0.0;j<=jx;j++) fw += x[j]*f[jx+i-j]; q[i] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
258 }
a61af66fc99e Initial load
duke
parents:
diff changeset
259
a61af66fc99e Initial load
duke
parents:
diff changeset
260 jz = jk;
a61af66fc99e Initial load
duke
parents:
diff changeset
261 recompute:
a61af66fc99e Initial load
duke
parents:
diff changeset
262 /* distill q[] into iq[] reversingly */
a61af66fc99e Initial load
duke
parents:
diff changeset
263 for(i=0,j=jz,z=q[jz];j>0;i++,j--) {
a61af66fc99e Initial load
duke
parents:
diff changeset
264 fw = (double)((int)(twon24* z));
a61af66fc99e Initial load
duke
parents:
diff changeset
265 iq[i] = (int)(z-two24B*fw);
a61af66fc99e Initial load
duke
parents:
diff changeset
266 z = q[j-1]+fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
267 }
a61af66fc99e Initial load
duke
parents:
diff changeset
268
a61af66fc99e Initial load
duke
parents:
diff changeset
269 /* compute n */
a61af66fc99e Initial load
duke
parents:
diff changeset
270 z = scalbnA(z,q0); /* actual value of z */
a61af66fc99e Initial load
duke
parents:
diff changeset
271 z -= 8.0*floor(z*0.125); /* trim off integer >= 8 */
a61af66fc99e Initial load
duke
parents:
diff changeset
272 n = (int) z;
a61af66fc99e Initial load
duke
parents:
diff changeset
273 z -= (double)n;
a61af66fc99e Initial load
duke
parents:
diff changeset
274 ih = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
275 if(q0>0) { /* need iq[jz-1] to determine n */
a61af66fc99e Initial load
duke
parents:
diff changeset
276 i = (iq[jz-1]>>(24-q0)); n += i;
a61af66fc99e Initial load
duke
parents:
diff changeset
277 iq[jz-1] -= i<<(24-q0);
a61af66fc99e Initial load
duke
parents:
diff changeset
278 ih = iq[jz-1]>>(23-q0);
a61af66fc99e Initial load
duke
parents:
diff changeset
279 }
a61af66fc99e Initial load
duke
parents:
diff changeset
280 else if(q0==0) ih = iq[jz-1]>>23;
a61af66fc99e Initial load
duke
parents:
diff changeset
281 else if(z>=0.5) ih=2;
a61af66fc99e Initial load
duke
parents:
diff changeset
282
a61af66fc99e Initial load
duke
parents:
diff changeset
283 if(ih>0) { /* q > 0.5 */
a61af66fc99e Initial load
duke
parents:
diff changeset
284 n += 1; carry = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
285 for(i=0;i<jz ;i++) { /* compute 1-q */
a61af66fc99e Initial load
duke
parents:
diff changeset
286 j = iq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
287 if(carry==0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
288 if(j!=0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
289 carry = 1; iq[i] = 0x1000000- j;
a61af66fc99e Initial load
duke
parents:
diff changeset
290 }
a61af66fc99e Initial load
duke
parents:
diff changeset
291 } else iq[i] = 0xffffff - j;
a61af66fc99e Initial load
duke
parents:
diff changeset
292 }
a61af66fc99e Initial load
duke
parents:
diff changeset
293 if(q0>0) { /* rare case: chance is 1 in 12 */
a61af66fc99e Initial load
duke
parents:
diff changeset
294 switch(q0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
295 case 1:
a61af66fc99e Initial load
duke
parents:
diff changeset
296 iq[jz-1] &= 0x7fffff; break;
a61af66fc99e Initial load
duke
parents:
diff changeset
297 case 2:
a61af66fc99e Initial load
duke
parents:
diff changeset
298 iq[jz-1] &= 0x3fffff; break;
a61af66fc99e Initial load
duke
parents:
diff changeset
299 }
a61af66fc99e Initial load
duke
parents:
diff changeset
300 }
a61af66fc99e Initial load
duke
parents:
diff changeset
301 if(ih==2) {
a61af66fc99e Initial load
duke
parents:
diff changeset
302 z = one - z;
a61af66fc99e Initial load
duke
parents:
diff changeset
303 if(carry!=0) z -= scalbnA(one,q0);
a61af66fc99e Initial load
duke
parents:
diff changeset
304 }
a61af66fc99e Initial load
duke
parents:
diff changeset
305 }
a61af66fc99e Initial load
duke
parents:
diff changeset
306
a61af66fc99e Initial load
duke
parents:
diff changeset
307 /* check if recomputation is needed */
a61af66fc99e Initial load
duke
parents:
diff changeset
308 if(z==zeroB) {
a61af66fc99e Initial load
duke
parents:
diff changeset
309 j = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
310 for (i=jz-1;i>=jk;i--) j |= iq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
311 if(j==0) { /* need recomputation */
a61af66fc99e Initial load
duke
parents:
diff changeset
312 for(k=1;iq[jk-k]==0;k++); /* k = no. of terms needed */
a61af66fc99e Initial load
duke
parents:
diff changeset
313
a61af66fc99e Initial load
duke
parents:
diff changeset
314 for(i=jz+1;i<=jz+k;i++) { /* add q[jz+1] to q[jz+k] */
a61af66fc99e Initial load
duke
parents:
diff changeset
315 f[jx+i] = (double) ipio2[jv+i];
a61af66fc99e Initial load
duke
parents:
diff changeset
316 for(j=0,fw=0.0;j<=jx;j++) fw += x[j]*f[jx+i-j];
a61af66fc99e Initial load
duke
parents:
diff changeset
317 q[i] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
318 }
a61af66fc99e Initial load
duke
parents:
diff changeset
319 jz += k;
a61af66fc99e Initial load
duke
parents:
diff changeset
320 goto recompute;
a61af66fc99e Initial load
duke
parents:
diff changeset
321 }
a61af66fc99e Initial load
duke
parents:
diff changeset
322 }
a61af66fc99e Initial load
duke
parents:
diff changeset
323
a61af66fc99e Initial load
duke
parents:
diff changeset
324 /* chop off zero terms */
a61af66fc99e Initial load
duke
parents:
diff changeset
325 if(z==0.0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
326 jz -= 1; q0 -= 24;
a61af66fc99e Initial load
duke
parents:
diff changeset
327 while(iq[jz]==0) { jz--; q0-=24;}
a61af66fc99e Initial load
duke
parents:
diff changeset
328 } else { /* break z into 24-bit if neccessary */
a61af66fc99e Initial load
duke
parents:
diff changeset
329 z = scalbnA(z,-q0);
a61af66fc99e Initial load
duke
parents:
diff changeset
330 if(z>=two24B) {
a61af66fc99e Initial load
duke
parents:
diff changeset
331 fw = (double)((int)(twon24*z));
a61af66fc99e Initial load
duke
parents:
diff changeset
332 iq[jz] = (int)(z-two24B*fw);
a61af66fc99e Initial load
duke
parents:
diff changeset
333 jz += 1; q0 += 24;
a61af66fc99e Initial load
duke
parents:
diff changeset
334 iq[jz] = (int) fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
335 } else iq[jz] = (int) z ;
a61af66fc99e Initial load
duke
parents:
diff changeset
336 }
a61af66fc99e Initial load
duke
parents:
diff changeset
337
a61af66fc99e Initial load
duke
parents:
diff changeset
338 /* convert integer "bit" chunk to floating-point value */
a61af66fc99e Initial load
duke
parents:
diff changeset
339 fw = scalbnA(one,q0);
a61af66fc99e Initial load
duke
parents:
diff changeset
340 for(i=jz;i>=0;i--) {
a61af66fc99e Initial load
duke
parents:
diff changeset
341 q[i] = fw*(double)iq[i]; fw*=twon24;
a61af66fc99e Initial load
duke
parents:
diff changeset
342 }
a61af66fc99e Initial load
duke
parents:
diff changeset
343
a61af66fc99e Initial load
duke
parents:
diff changeset
344 /* compute PIo2[0,...,jp]*q[jz,...,0] */
a61af66fc99e Initial load
duke
parents:
diff changeset
345 for(i=jz;i>=0;i--) {
a61af66fc99e Initial load
duke
parents:
diff changeset
346 for(fw=0.0,k=0;k<=jp&&k<=jz-i;k++) fw += PIo2[k]*q[i+k];
a61af66fc99e Initial load
duke
parents:
diff changeset
347 fq[jz-i] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
348 }
a61af66fc99e Initial load
duke
parents:
diff changeset
349
a61af66fc99e Initial load
duke
parents:
diff changeset
350 /* compress fq[] into y[] */
a61af66fc99e Initial load
duke
parents:
diff changeset
351 switch(prec) {
a61af66fc99e Initial load
duke
parents:
diff changeset
352 case 0:
a61af66fc99e Initial load
duke
parents:
diff changeset
353 fw = 0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
354 for (i=jz;i>=0;i--) fw += fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
355 y[0] = (ih==0)? fw: -fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
356 break;
a61af66fc99e Initial load
duke
parents:
diff changeset
357 case 1:
a61af66fc99e Initial load
duke
parents:
diff changeset
358 case 2:
a61af66fc99e Initial load
duke
parents:
diff changeset
359 fw = 0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
360 for (i=jz;i>=0;i--) fw += fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
361 y[0] = (ih==0)? fw: -fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
362 fw = fq[0]-fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
363 for (i=1;i<=jz;i++) fw += fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
364 y[1] = (ih==0)? fw: -fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
365 break;
a61af66fc99e Initial load
duke
parents:
diff changeset
366 case 3: /* painful */
a61af66fc99e Initial load
duke
parents:
diff changeset
367 for (i=jz;i>0;i--) {
a61af66fc99e Initial load
duke
parents:
diff changeset
368 fw = fq[i-1]+fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
369 fq[i] += fq[i-1]-fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
370 fq[i-1] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
371 }
a61af66fc99e Initial load
duke
parents:
diff changeset
372 for (i=jz;i>1;i--) {
a61af66fc99e Initial load
duke
parents:
diff changeset
373 fw = fq[i-1]+fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
374 fq[i] += fq[i-1]-fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
375 fq[i-1] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
376 }
a61af66fc99e Initial load
duke
parents:
diff changeset
377 for (fw=0.0,i=jz;i>=2;i--) fw += fq[i];
a61af66fc99e Initial load
duke
parents:
diff changeset
378 if(ih==0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
379 y[0] = fq[0]; y[1] = fq[1]; y[2] = fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
380 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
381 y[0] = -fq[0]; y[1] = -fq[1]; y[2] = -fw;
a61af66fc99e Initial load
duke
parents:
diff changeset
382 }
a61af66fc99e Initial load
duke
parents:
diff changeset
383 }
a61af66fc99e Initial load
duke
parents:
diff changeset
384 return n&7;
a61af66fc99e Initial load
duke
parents:
diff changeset
385 }
a61af66fc99e Initial load
duke
parents:
diff changeset
386
a61af66fc99e Initial load
duke
parents:
diff changeset
387
a61af66fc99e Initial load
duke
parents:
diff changeset
388 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
389 * ====================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
390 * Copyright 13 Dec 1993 Sun Microsystems, Inc. All Rights Reserved.
a61af66fc99e Initial load
duke
parents:
diff changeset
391 *
a61af66fc99e Initial load
duke
parents:
diff changeset
392 * Developed at SunPro, a Sun Microsystems, Inc. business.
a61af66fc99e Initial load
duke
parents:
diff changeset
393 * Permission to use, copy, modify, and distribute this
a61af66fc99e Initial load
duke
parents:
diff changeset
394 * software is freely granted, provided that this notice
a61af66fc99e Initial load
duke
parents:
diff changeset
395 * is preserved.
a61af66fc99e Initial load
duke
parents:
diff changeset
396 * ====================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
397 *
a61af66fc99e Initial load
duke
parents:
diff changeset
398 */
a61af66fc99e Initial load
duke
parents:
diff changeset
399
a61af66fc99e Initial load
duke
parents:
diff changeset
400 /* __ieee754_rem_pio2(x,y)
a61af66fc99e Initial load
duke
parents:
diff changeset
401 *
a61af66fc99e Initial load
duke
parents:
diff changeset
402 * return the remainder of x rem pi/2 in y[0]+y[1]
a61af66fc99e Initial load
duke
parents:
diff changeset
403 * use __kernel_rem_pio2()
a61af66fc99e Initial load
duke
parents:
diff changeset
404 */
a61af66fc99e Initial load
duke
parents:
diff changeset
405
a61af66fc99e Initial load
duke
parents:
diff changeset
406 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
407 * Table of constants for 2/pi, 396 Hex digits (476 decimal) of 2/pi
a61af66fc99e Initial load
duke
parents:
diff changeset
408 */
a61af66fc99e Initial load
duke
parents:
diff changeset
409 static const int two_over_pi[] = {
a61af66fc99e Initial load
duke
parents:
diff changeset
410 0xA2F983, 0x6E4E44, 0x1529FC, 0x2757D1, 0xF534DD, 0xC0DB62,
a61af66fc99e Initial load
duke
parents:
diff changeset
411 0x95993C, 0x439041, 0xFE5163, 0xABDEBB, 0xC561B7, 0x246E3A,
a61af66fc99e Initial load
duke
parents:
diff changeset
412 0x424DD2, 0xE00649, 0x2EEA09, 0xD1921C, 0xFE1DEB, 0x1CB129,
a61af66fc99e Initial load
duke
parents:
diff changeset
413 0xA73EE8, 0x8235F5, 0x2EBB44, 0x84E99C, 0x7026B4, 0x5F7E41,
a61af66fc99e Initial load
duke
parents:
diff changeset
414 0x3991D6, 0x398353, 0x39F49C, 0x845F8B, 0xBDF928, 0x3B1FF8,
a61af66fc99e Initial load
duke
parents:
diff changeset
415 0x97FFDE, 0x05980F, 0xEF2F11, 0x8B5A0A, 0x6D1F6D, 0x367ECF,
a61af66fc99e Initial load
duke
parents:
diff changeset
416 0x27CB09, 0xB74F46, 0x3F669E, 0x5FEA2D, 0x7527BA, 0xC7EBE5,
a61af66fc99e Initial load
duke
parents:
diff changeset
417 0xF17B3D, 0x0739F7, 0x8A5292, 0xEA6BFB, 0x5FB11F, 0x8D5D08,
a61af66fc99e Initial load
duke
parents:
diff changeset
418 0x560330, 0x46FC7B, 0x6BABF0, 0xCFBC20, 0x9AF436, 0x1DA9E3,
a61af66fc99e Initial load
duke
parents:
diff changeset
419 0x91615E, 0xE61B08, 0x659985, 0x5F14A0, 0x68408D, 0xFFD880,
a61af66fc99e Initial load
duke
parents:
diff changeset
420 0x4D7327, 0x310606, 0x1556CA, 0x73A8C9, 0x60E27B, 0xC08C6B,
a61af66fc99e Initial load
duke
parents:
diff changeset
421 };
a61af66fc99e Initial load
duke
parents:
diff changeset
422
a61af66fc99e Initial load
duke
parents:
diff changeset
423 static const int npio2_hw[] = {
a61af66fc99e Initial load
duke
parents:
diff changeset
424 0x3FF921FB, 0x400921FB, 0x4012D97C, 0x401921FB, 0x401F6A7A, 0x4022D97C,
a61af66fc99e Initial load
duke
parents:
diff changeset
425 0x4025FDBB, 0x402921FB, 0x402C463A, 0x402F6A7A, 0x4031475C, 0x4032D97C,
a61af66fc99e Initial load
duke
parents:
diff changeset
426 0x40346B9C, 0x4035FDBB, 0x40378FDB, 0x403921FB, 0x403AB41B, 0x403C463A,
a61af66fc99e Initial load
duke
parents:
diff changeset
427 0x403DD85A, 0x403F6A7A, 0x40407E4C, 0x4041475C, 0x4042106C, 0x4042D97C,
a61af66fc99e Initial load
duke
parents:
diff changeset
428 0x4043A28C, 0x40446B9C, 0x404534AC, 0x4045FDBB, 0x4046C6CB, 0x40478FDB,
a61af66fc99e Initial load
duke
parents:
diff changeset
429 0x404858EB, 0x404921FB,
a61af66fc99e Initial load
duke
parents:
diff changeset
430 };
a61af66fc99e Initial load
duke
parents:
diff changeset
431
a61af66fc99e Initial load
duke
parents:
diff changeset
432 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
433 * invpio2: 53 bits of 2/pi
a61af66fc99e Initial load
duke
parents:
diff changeset
434 * pio2_1: first 33 bit of pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
435 * pio2_1t: pi/2 - pio2_1
a61af66fc99e Initial load
duke
parents:
diff changeset
436 * pio2_2: second 33 bit of pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
437 * pio2_2t: pi/2 - (pio2_1+pio2_2)
a61af66fc99e Initial load
duke
parents:
diff changeset
438 * pio2_3: third 33 bit of pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
439 * pio2_3t: pi/2 - (pio2_1+pio2_2+pio2_3)
a61af66fc99e Initial load
duke
parents:
diff changeset
440 */
a61af66fc99e Initial load
duke
parents:
diff changeset
441
a61af66fc99e Initial load
duke
parents:
diff changeset
442 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
443 zeroA = 0.00000000000000000000e+00, /* 0x00000000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
444 half = 5.00000000000000000000e-01, /* 0x3FE00000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
445 two24A = 1.67772160000000000000e+07, /* 0x41700000, 0x00000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
446 invpio2 = 6.36619772367581382433e-01, /* 0x3FE45F30, 0x6DC9C883 */
a61af66fc99e Initial load
duke
parents:
diff changeset
447 pio2_1 = 1.57079632673412561417e+00, /* 0x3FF921FB, 0x54400000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
448 pio2_1t = 6.07710050650619224932e-11, /* 0x3DD0B461, 0x1A626331 */
a61af66fc99e Initial load
duke
parents:
diff changeset
449 pio2_2 = 6.07710050630396597660e-11, /* 0x3DD0B461, 0x1A600000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
450 pio2_2t = 2.02226624879595063154e-21, /* 0x3BA3198A, 0x2E037073 */
a61af66fc99e Initial load
duke
parents:
diff changeset
451 pio2_3 = 2.02226624871116645580e-21, /* 0x3BA3198A, 0x2E000000 */
a61af66fc99e Initial load
duke
parents:
diff changeset
452 pio2_3t = 8.47842766036889956997e-32; /* 0x397B839A, 0x252049C1 */
a61af66fc99e Initial load
duke
parents:
diff changeset
453
a61af66fc99e Initial load
duke
parents:
diff changeset
454 static int __ieee754_rem_pio2(double x, double *y) {
a61af66fc99e Initial load
duke
parents:
diff changeset
455 double z,w,t,r,fn;
a61af66fc99e Initial load
duke
parents:
diff changeset
456 double tx[3];
a61af66fc99e Initial load
duke
parents:
diff changeset
457 int e0,i,j,nx,n,ix,hx,i0;
a61af66fc99e Initial load
duke
parents:
diff changeset
458
a61af66fc99e Initial load
duke
parents:
diff changeset
459 i0 = ((*(int*)&two24A)>>30)^1; /* high word index */
a61af66fc99e Initial load
duke
parents:
diff changeset
460 hx = *(i0+(int*)&x); /* high word of x */
a61af66fc99e Initial load
duke
parents:
diff changeset
461 ix = hx&0x7fffffff;
a61af66fc99e Initial load
duke
parents:
diff changeset
462 if(ix<=0x3fe921fb) /* |x| ~<= pi/4 , no need for reduction */
a61af66fc99e Initial load
duke
parents:
diff changeset
463 {y[0] = x; y[1] = 0; return 0;}
a61af66fc99e Initial load
duke
parents:
diff changeset
464 if(ix<0x4002d97c) { /* |x| < 3pi/4, special case with n=+-1 */
a61af66fc99e Initial load
duke
parents:
diff changeset
465 if(hx>0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
466 z = x - pio2_1;
a61af66fc99e Initial load
duke
parents:
diff changeset
467 if(ix!=0x3ff921fb) { /* 33+53 bit pi is good enough */
a61af66fc99e Initial load
duke
parents:
diff changeset
468 y[0] = z - pio2_1t;
a61af66fc99e Initial load
duke
parents:
diff changeset
469 y[1] = (z-y[0])-pio2_1t;
a61af66fc99e Initial load
duke
parents:
diff changeset
470 } else { /* near pi/2, use 33+33+53 bit pi */
a61af66fc99e Initial load
duke
parents:
diff changeset
471 z -= pio2_2;
a61af66fc99e Initial load
duke
parents:
diff changeset
472 y[0] = z - pio2_2t;
a61af66fc99e Initial load
duke
parents:
diff changeset
473 y[1] = (z-y[0])-pio2_2t;
a61af66fc99e Initial load
duke
parents:
diff changeset
474 }
a61af66fc99e Initial load
duke
parents:
diff changeset
475 return 1;
a61af66fc99e Initial load
duke
parents:
diff changeset
476 } else { /* negative x */
a61af66fc99e Initial load
duke
parents:
diff changeset
477 z = x + pio2_1;
a61af66fc99e Initial load
duke
parents:
diff changeset
478 if(ix!=0x3ff921fb) { /* 33+53 bit pi is good enough */
a61af66fc99e Initial load
duke
parents:
diff changeset
479 y[0] = z + pio2_1t;
a61af66fc99e Initial load
duke
parents:
diff changeset
480 y[1] = (z-y[0])+pio2_1t;
a61af66fc99e Initial load
duke
parents:
diff changeset
481 } else { /* near pi/2, use 33+33+53 bit pi */
a61af66fc99e Initial load
duke
parents:
diff changeset
482 z += pio2_2;
a61af66fc99e Initial load
duke
parents:
diff changeset
483 y[0] = z + pio2_2t;
a61af66fc99e Initial load
duke
parents:
diff changeset
484 y[1] = (z-y[0])+pio2_2t;
a61af66fc99e Initial load
duke
parents:
diff changeset
485 }
a61af66fc99e Initial load
duke
parents:
diff changeset
486 return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
487 }
a61af66fc99e Initial load
duke
parents:
diff changeset
488 }
a61af66fc99e Initial load
duke
parents:
diff changeset
489 if(ix<=0x413921fb) { /* |x| ~<= 2^19*(pi/2), medium size */
a61af66fc99e Initial load
duke
parents:
diff changeset
490 t = fabsd(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
491 n = (int) (t*invpio2+half);
a61af66fc99e Initial load
duke
parents:
diff changeset
492 fn = (double)n;
a61af66fc99e Initial load
duke
parents:
diff changeset
493 r = t-fn*pio2_1;
a61af66fc99e Initial load
duke
parents:
diff changeset
494 w = fn*pio2_1t; /* 1st round good to 85 bit */
a61af66fc99e Initial load
duke
parents:
diff changeset
495 if(n<32&&ix!=npio2_hw[n-1]) {
a61af66fc99e Initial load
duke
parents:
diff changeset
496 y[0] = r-w; /* quick check no cancellation */
a61af66fc99e Initial load
duke
parents:
diff changeset
497 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
498 j = ix>>20;
a61af66fc99e Initial load
duke
parents:
diff changeset
499 y[0] = r-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
500 i = j-(((*(i0+(int*)&y[0]))>>20)&0x7ff);
a61af66fc99e Initial load
duke
parents:
diff changeset
501 if(i>16) { /* 2nd iteration needed, good to 118 */
a61af66fc99e Initial load
duke
parents:
diff changeset
502 t = r;
a61af66fc99e Initial load
duke
parents:
diff changeset
503 w = fn*pio2_2;
a61af66fc99e Initial load
duke
parents:
diff changeset
504 r = t-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
505 w = fn*pio2_2t-((t-r)-w);
a61af66fc99e Initial load
duke
parents:
diff changeset
506 y[0] = r-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
507 i = j-(((*(i0+(int*)&y[0]))>>20)&0x7ff);
a61af66fc99e Initial load
duke
parents:
diff changeset
508 if(i>49) { /* 3rd iteration need, 151 bits acc */
a61af66fc99e Initial load
duke
parents:
diff changeset
509 t = r; /* will cover all possible cases */
a61af66fc99e Initial load
duke
parents:
diff changeset
510 w = fn*pio2_3;
a61af66fc99e Initial load
duke
parents:
diff changeset
511 r = t-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
512 w = fn*pio2_3t-((t-r)-w);
a61af66fc99e Initial load
duke
parents:
diff changeset
513 y[0] = r-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
514 }
a61af66fc99e Initial load
duke
parents:
diff changeset
515 }
a61af66fc99e Initial load
duke
parents:
diff changeset
516 }
a61af66fc99e Initial load
duke
parents:
diff changeset
517 y[1] = (r-y[0])-w;
a61af66fc99e Initial load
duke
parents:
diff changeset
518 if(hx<0) {y[0] = -y[0]; y[1] = -y[1]; return -n;}
a61af66fc99e Initial load
duke
parents:
diff changeset
519 else return n;
a61af66fc99e Initial load
duke
parents:
diff changeset
520 }
a61af66fc99e Initial load
duke
parents:
diff changeset
521 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
522 * all other (large) arguments
a61af66fc99e Initial load
duke
parents:
diff changeset
523 */
a61af66fc99e Initial load
duke
parents:
diff changeset
524 if(ix>=0x7ff00000) { /* x is inf or NaN */
a61af66fc99e Initial load
duke
parents:
diff changeset
525 y[0]=y[1]=x-x; return 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
526 }
a61af66fc99e Initial load
duke
parents:
diff changeset
527 /* set z = scalbn(|x|,ilogb(x)-23) */
a61af66fc99e Initial load
duke
parents:
diff changeset
528 *(1-i0+(int*)&z) = *(1-i0+(int*)&x);
a61af66fc99e Initial load
duke
parents:
diff changeset
529 e0 = (ix>>20)-1046; /* e0 = ilogb(z)-23; */
a61af66fc99e Initial load
duke
parents:
diff changeset
530 *(i0+(int*)&z) = ix - (e0<<20);
a61af66fc99e Initial load
duke
parents:
diff changeset
531 for(i=0;i<2;i++) {
a61af66fc99e Initial load
duke
parents:
diff changeset
532 tx[i] = (double)((int)(z));
a61af66fc99e Initial load
duke
parents:
diff changeset
533 z = (z-tx[i])*two24A;
a61af66fc99e Initial load
duke
parents:
diff changeset
534 }
a61af66fc99e Initial load
duke
parents:
diff changeset
535 tx[2] = z;
a61af66fc99e Initial load
duke
parents:
diff changeset
536 nx = 3;
a61af66fc99e Initial load
duke
parents:
diff changeset
537 while(tx[nx-1]==zeroA) nx--; /* skip zero term */
a61af66fc99e Initial load
duke
parents:
diff changeset
538 n = __kernel_rem_pio2(tx,y,e0,nx,2,two_over_pi);
a61af66fc99e Initial load
duke
parents:
diff changeset
539 if(hx<0) {y[0] = -y[0]; y[1] = -y[1]; return -n;}
a61af66fc99e Initial load
duke
parents:
diff changeset
540 return n;
a61af66fc99e Initial load
duke
parents:
diff changeset
541 }
a61af66fc99e Initial load
duke
parents:
diff changeset
542
a61af66fc99e Initial load
duke
parents:
diff changeset
543
a61af66fc99e Initial load
duke
parents:
diff changeset
544 /* __kernel_sin( x, y, iy)
a61af66fc99e Initial load
duke
parents:
diff changeset
545 * kernel sin function on [-pi/4, pi/4], pi/4 ~ 0.7854
a61af66fc99e Initial load
duke
parents:
diff changeset
546 * Input x is assumed to be bounded by ~pi/4 in magnitude.
a61af66fc99e Initial load
duke
parents:
diff changeset
547 * Input y is the tail of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
548 * Input iy indicates whether y is 0. (if iy=0, y assume to be 0).
a61af66fc99e Initial load
duke
parents:
diff changeset
549 *
a61af66fc99e Initial load
duke
parents:
diff changeset
550 * Algorithm
a61af66fc99e Initial load
duke
parents:
diff changeset
551 * 1. Since sin(-x) = -sin(x), we need only to consider positive x.
a61af66fc99e Initial load
duke
parents:
diff changeset
552 * 2. if x < 2^-27 (hx<0x3e400000 0), return x with inexact if x!=0.
a61af66fc99e Initial load
duke
parents:
diff changeset
553 * 3. sin(x) is approximated by a polynomial of degree 13 on
a61af66fc99e Initial load
duke
parents:
diff changeset
554 * [0,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
555 * 3 13
a61af66fc99e Initial load
duke
parents:
diff changeset
556 * sin(x) ~ x + S1*x + ... + S6*x
a61af66fc99e Initial load
duke
parents:
diff changeset
557 * where
a61af66fc99e Initial load
duke
parents:
diff changeset
558 *
a61af66fc99e Initial load
duke
parents:
diff changeset
559 * |sin(x) 2 4 6 8 10 12 | -58
a61af66fc99e Initial load
duke
parents:
diff changeset
560 * |----- - (1+S1*x +S2*x +S3*x +S4*x +S5*x +S6*x )| <= 2
a61af66fc99e Initial load
duke
parents:
diff changeset
561 * | x |
a61af66fc99e Initial load
duke
parents:
diff changeset
562 *
a61af66fc99e Initial load
duke
parents:
diff changeset
563 * 4. sin(x+y) = sin(x) + sin'(x')*y
a61af66fc99e Initial load
duke
parents:
diff changeset
564 * ~ sin(x) + (1-x*x/2)*y
a61af66fc99e Initial load
duke
parents:
diff changeset
565 * For better accuracy, let
a61af66fc99e Initial load
duke
parents:
diff changeset
566 * 3 2 2 2 2
a61af66fc99e Initial load
duke
parents:
diff changeset
567 * r = x *(S2+x *(S3+x *(S4+x *(S5+x *S6))))
a61af66fc99e Initial load
duke
parents:
diff changeset
568 * then 3 2
a61af66fc99e Initial load
duke
parents:
diff changeset
569 * sin(x) = x + (S1*x + (x *(r-y/2)+y))
a61af66fc99e Initial load
duke
parents:
diff changeset
570 */
a61af66fc99e Initial load
duke
parents:
diff changeset
571
a61af66fc99e Initial load
duke
parents:
diff changeset
572 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
573 S1 = -1.66666666666666324348e-01, /* 0xBFC55555, 0x55555549 */
a61af66fc99e Initial load
duke
parents:
diff changeset
574 S2 = 8.33333333332248946124e-03, /* 0x3F811111, 0x1110F8A6 */
a61af66fc99e Initial load
duke
parents:
diff changeset
575 S3 = -1.98412698298579493134e-04, /* 0xBF2A01A0, 0x19C161D5 */
a61af66fc99e Initial load
duke
parents:
diff changeset
576 S4 = 2.75573137070700676789e-06, /* 0x3EC71DE3, 0x57B1FE7D */
a61af66fc99e Initial load
duke
parents:
diff changeset
577 S5 = -2.50507602534068634195e-08, /* 0xBE5AE5E6, 0x8A2B9CEB */
a61af66fc99e Initial load
duke
parents:
diff changeset
578 S6 = 1.58969099521155010221e-10; /* 0x3DE5D93A, 0x5ACFD57C */
a61af66fc99e Initial load
duke
parents:
diff changeset
579
a61af66fc99e Initial load
duke
parents:
diff changeset
580 static double __kernel_sin(double x, double y, int iy)
a61af66fc99e Initial load
duke
parents:
diff changeset
581 {
a61af66fc99e Initial load
duke
parents:
diff changeset
582 double z,r,v;
a61af66fc99e Initial load
duke
parents:
diff changeset
583 int ix;
a61af66fc99e Initial load
duke
parents:
diff changeset
584 ix = __HI(x)&0x7fffffff; /* high word of x */
a61af66fc99e Initial load
duke
parents:
diff changeset
585 if(ix<0x3e400000) /* |x| < 2**-27 */
a61af66fc99e Initial load
duke
parents:
diff changeset
586 {if((int)x==0) return x;} /* generate inexact */
a61af66fc99e Initial load
duke
parents:
diff changeset
587 z = x*x;
a61af66fc99e Initial load
duke
parents:
diff changeset
588 v = z*x;
a61af66fc99e Initial load
duke
parents:
diff changeset
589 r = S2+z*(S3+z*(S4+z*(S5+z*S6)));
a61af66fc99e Initial load
duke
parents:
diff changeset
590 if(iy==0) return x+v*(S1+z*r);
a61af66fc99e Initial load
duke
parents:
diff changeset
591 else return x-((z*(half*y-v*r)-y)-v*S1);
a61af66fc99e Initial load
duke
parents:
diff changeset
592 }
a61af66fc99e Initial load
duke
parents:
diff changeset
593
a61af66fc99e Initial load
duke
parents:
diff changeset
594 /*
a61af66fc99e Initial load
duke
parents:
diff changeset
595 * __kernel_cos( x, y )
a61af66fc99e Initial load
duke
parents:
diff changeset
596 * kernel cos function on [-pi/4, pi/4], pi/4 ~ 0.785398164
a61af66fc99e Initial load
duke
parents:
diff changeset
597 * Input x is assumed to be bounded by ~pi/4 in magnitude.
a61af66fc99e Initial load
duke
parents:
diff changeset
598 * Input y is the tail of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
599 *
a61af66fc99e Initial load
duke
parents:
diff changeset
600 * Algorithm
a61af66fc99e Initial load
duke
parents:
diff changeset
601 * 1. Since cos(-x) = cos(x), we need only to consider positive x.
a61af66fc99e Initial load
duke
parents:
diff changeset
602 * 2. if x < 2^-27 (hx<0x3e400000 0), return 1 with inexact if x!=0.
a61af66fc99e Initial load
duke
parents:
diff changeset
603 * 3. cos(x) is approximated by a polynomial of degree 14 on
a61af66fc99e Initial load
duke
parents:
diff changeset
604 * [0,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
605 * 4 14
a61af66fc99e Initial load
duke
parents:
diff changeset
606 * cos(x) ~ 1 - x*x/2 + C1*x + ... + C6*x
a61af66fc99e Initial load
duke
parents:
diff changeset
607 * where the remez error is
a61af66fc99e Initial load
duke
parents:
diff changeset
608 *
a61af66fc99e Initial load
duke
parents:
diff changeset
609 * | 2 4 6 8 10 12 14 | -58
a61af66fc99e Initial load
duke
parents:
diff changeset
610 * |cos(x)-(1-.5*x +C1*x +C2*x +C3*x +C4*x +C5*x +C6*x )| <= 2
a61af66fc99e Initial load
duke
parents:
diff changeset
611 * | |
a61af66fc99e Initial load
duke
parents:
diff changeset
612 *
a61af66fc99e Initial load
duke
parents:
diff changeset
613 * 4 6 8 10 12 14
a61af66fc99e Initial load
duke
parents:
diff changeset
614 * 4. let r = C1*x +C2*x +C3*x +C4*x +C5*x +C6*x , then
a61af66fc99e Initial load
duke
parents:
diff changeset
615 * cos(x) = 1 - x*x/2 + r
a61af66fc99e Initial load
duke
parents:
diff changeset
616 * since cos(x+y) ~ cos(x) - sin(x)*y
a61af66fc99e Initial load
duke
parents:
diff changeset
617 * ~ cos(x) - x*y,
a61af66fc99e Initial load
duke
parents:
diff changeset
618 * a correction term is necessary in cos(x) and hence
a61af66fc99e Initial load
duke
parents:
diff changeset
619 * cos(x+y) = 1 - (x*x/2 - (r - x*y))
a61af66fc99e Initial load
duke
parents:
diff changeset
620 * For better accuracy when x > 0.3, let qx = |x|/4 with
a61af66fc99e Initial load
duke
parents:
diff changeset
621 * the last 32 bits mask off, and if x > 0.78125, let qx = 0.28125.
a61af66fc99e Initial load
duke
parents:
diff changeset
622 * Then
a61af66fc99e Initial load
duke
parents:
diff changeset
623 * cos(x+y) = (1-qx) - ((x*x/2-qx) - (r-x*y)).
a61af66fc99e Initial load
duke
parents:
diff changeset
624 * Note that 1-qx and (x*x/2-qx) is EXACT here, and the
a61af66fc99e Initial load
duke
parents:
diff changeset
625 * magnitude of the latter is at least a quarter of x*x/2,
a61af66fc99e Initial load
duke
parents:
diff changeset
626 * thus, reducing the rounding error in the subtraction.
a61af66fc99e Initial load
duke
parents:
diff changeset
627 */
a61af66fc99e Initial load
duke
parents:
diff changeset
628
a61af66fc99e Initial load
duke
parents:
diff changeset
629 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
630 C1 = 4.16666666666666019037e-02, /* 0x3FA55555, 0x5555554C */
a61af66fc99e Initial load
duke
parents:
diff changeset
631 C2 = -1.38888888888741095749e-03, /* 0xBF56C16C, 0x16C15177 */
a61af66fc99e Initial load
duke
parents:
diff changeset
632 C3 = 2.48015872894767294178e-05, /* 0x3EFA01A0, 0x19CB1590 */
a61af66fc99e Initial load
duke
parents:
diff changeset
633 C4 = -2.75573143513906633035e-07, /* 0xBE927E4F, 0x809C52AD */
a61af66fc99e Initial load
duke
parents:
diff changeset
634 C5 = 2.08757232129817482790e-09, /* 0x3E21EE9E, 0xBDB4B1C4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
635 C6 = -1.13596475577881948265e-11; /* 0xBDA8FAE9, 0xBE8838D4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
636
a61af66fc99e Initial load
duke
parents:
diff changeset
637 static double __kernel_cos(double x, double y)
a61af66fc99e Initial load
duke
parents:
diff changeset
638 {
a61af66fc99e Initial load
duke
parents:
diff changeset
639 double a,hz,z,r,qx;
a61af66fc99e Initial load
duke
parents:
diff changeset
640 int ix;
a61af66fc99e Initial load
duke
parents:
diff changeset
641 ix = __HI(x)&0x7fffffff; /* ix = |x|'s high word*/
a61af66fc99e Initial load
duke
parents:
diff changeset
642 if(ix<0x3e400000) { /* if x < 2**27 */
a61af66fc99e Initial load
duke
parents:
diff changeset
643 if(((int)x)==0) return one; /* generate inexact */
a61af66fc99e Initial load
duke
parents:
diff changeset
644 }
a61af66fc99e Initial load
duke
parents:
diff changeset
645 z = x*x;
a61af66fc99e Initial load
duke
parents:
diff changeset
646 r = z*(C1+z*(C2+z*(C3+z*(C4+z*(C5+z*C6)))));
a61af66fc99e Initial load
duke
parents:
diff changeset
647 if(ix < 0x3FD33333) /* if |x| < 0.3 */
a61af66fc99e Initial load
duke
parents:
diff changeset
648 return one - (0.5*z - (z*r - x*y));
a61af66fc99e Initial load
duke
parents:
diff changeset
649 else {
a61af66fc99e Initial load
duke
parents:
diff changeset
650 if(ix > 0x3fe90000) { /* x > 0.78125 */
a61af66fc99e Initial load
duke
parents:
diff changeset
651 qx = 0.28125;
a61af66fc99e Initial load
duke
parents:
diff changeset
652 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
653 __HI(qx) = ix-0x00200000; /* x/4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
654 __LO(qx) = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
655 }
a61af66fc99e Initial load
duke
parents:
diff changeset
656 hz = 0.5*z-qx;
a61af66fc99e Initial load
duke
parents:
diff changeset
657 a = one-qx;
a61af66fc99e Initial load
duke
parents:
diff changeset
658 return a - (hz - (z*r-x*y));
a61af66fc99e Initial load
duke
parents:
diff changeset
659 }
a61af66fc99e Initial load
duke
parents:
diff changeset
660 }
a61af66fc99e Initial load
duke
parents:
diff changeset
661
a61af66fc99e Initial load
duke
parents:
diff changeset
662 /* __kernel_tan( x, y, k )
a61af66fc99e Initial load
duke
parents:
diff changeset
663 * kernel tan function on [-pi/4, pi/4], pi/4 ~ 0.7854
a61af66fc99e Initial load
duke
parents:
diff changeset
664 * Input x is assumed to be bounded by ~pi/4 in magnitude.
a61af66fc99e Initial load
duke
parents:
diff changeset
665 * Input y is the tail of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
666 * Input k indicates whether tan (if k=1) or
a61af66fc99e Initial load
duke
parents:
diff changeset
667 * -1/tan (if k= -1) is returned.
a61af66fc99e Initial load
duke
parents:
diff changeset
668 *
a61af66fc99e Initial load
duke
parents:
diff changeset
669 * Algorithm
a61af66fc99e Initial load
duke
parents:
diff changeset
670 * 1. Since tan(-x) = -tan(x), we need only to consider positive x.
a61af66fc99e Initial load
duke
parents:
diff changeset
671 * 2. if x < 2^-28 (hx<0x3e300000 0), return x with inexact if x!=0.
a61af66fc99e Initial load
duke
parents:
diff changeset
672 * 3. tan(x) is approximated by a odd polynomial of degree 27 on
a61af66fc99e Initial load
duke
parents:
diff changeset
673 * [0,0.67434]
a61af66fc99e Initial load
duke
parents:
diff changeset
674 * 3 27
a61af66fc99e Initial load
duke
parents:
diff changeset
675 * tan(x) ~ x + T1*x + ... + T13*x
a61af66fc99e Initial load
duke
parents:
diff changeset
676 * where
a61af66fc99e Initial load
duke
parents:
diff changeset
677 *
a61af66fc99e Initial load
duke
parents:
diff changeset
678 * |tan(x) 2 4 26 | -59.2
a61af66fc99e Initial load
duke
parents:
diff changeset
679 * |----- - (1+T1*x +T2*x +.... +T13*x )| <= 2
a61af66fc99e Initial load
duke
parents:
diff changeset
680 * | x |
a61af66fc99e Initial load
duke
parents:
diff changeset
681 *
a61af66fc99e Initial load
duke
parents:
diff changeset
682 * Note: tan(x+y) = tan(x) + tan'(x)*y
a61af66fc99e Initial load
duke
parents:
diff changeset
683 * ~ tan(x) + (1+x*x)*y
a61af66fc99e Initial load
duke
parents:
diff changeset
684 * Therefore, for better accuracy in computing tan(x+y), let
a61af66fc99e Initial load
duke
parents:
diff changeset
685 * 3 2 2 2 2
a61af66fc99e Initial load
duke
parents:
diff changeset
686 * r = x *(T2+x *(T3+x *(...+x *(T12+x *T13))))
a61af66fc99e Initial load
duke
parents:
diff changeset
687 * then
a61af66fc99e Initial load
duke
parents:
diff changeset
688 * 3 2
a61af66fc99e Initial load
duke
parents:
diff changeset
689 * tan(x+y) = x + (T1*x + (x *(r+y)+y))
a61af66fc99e Initial load
duke
parents:
diff changeset
690 *
a61af66fc99e Initial load
duke
parents:
diff changeset
691 * 4. For x in [0.67434,pi/4], let y = pi/4 - x, then
a61af66fc99e Initial load
duke
parents:
diff changeset
692 * tan(x) = tan(pi/4-y) = (1-tan(y))/(1+tan(y))
a61af66fc99e Initial load
duke
parents:
diff changeset
693 * = 1 - 2*(tan(y) - (tan(y)^2)/(1+tan(y)))
a61af66fc99e Initial load
duke
parents:
diff changeset
694 */
a61af66fc99e Initial load
duke
parents:
diff changeset
695
a61af66fc99e Initial load
duke
parents:
diff changeset
696 static const double
a61af66fc99e Initial load
duke
parents:
diff changeset
697 pio4 = 7.85398163397448278999e-01, /* 0x3FE921FB, 0x54442D18 */
a61af66fc99e Initial load
duke
parents:
diff changeset
698 pio4lo= 3.06161699786838301793e-17, /* 0x3C81A626, 0x33145C07 */
a61af66fc99e Initial load
duke
parents:
diff changeset
699 T[] = {
a61af66fc99e Initial load
duke
parents:
diff changeset
700 3.33333333333334091986e-01, /* 0x3FD55555, 0x55555563 */
a61af66fc99e Initial load
duke
parents:
diff changeset
701 1.33333333333201242699e-01, /* 0x3FC11111, 0x1110FE7A */
a61af66fc99e Initial load
duke
parents:
diff changeset
702 5.39682539762260521377e-02, /* 0x3FABA1BA, 0x1BB341FE */
a61af66fc99e Initial load
duke
parents:
diff changeset
703 2.18694882948595424599e-02, /* 0x3F9664F4, 0x8406D637 */
a61af66fc99e Initial load
duke
parents:
diff changeset
704 8.86323982359930005737e-03, /* 0x3F8226E3, 0xE96E8493 */
a61af66fc99e Initial load
duke
parents:
diff changeset
705 3.59207910759131235356e-03, /* 0x3F6D6D22, 0xC9560328 */
a61af66fc99e Initial load
duke
parents:
diff changeset
706 1.45620945432529025516e-03, /* 0x3F57DBC8, 0xFEE08315 */
a61af66fc99e Initial load
duke
parents:
diff changeset
707 5.88041240820264096874e-04, /* 0x3F4344D8, 0xF2F26501 */
a61af66fc99e Initial load
duke
parents:
diff changeset
708 2.46463134818469906812e-04, /* 0x3F3026F7, 0x1A8D1068 */
a61af66fc99e Initial load
duke
parents:
diff changeset
709 7.81794442939557092300e-05, /* 0x3F147E88, 0xA03792A6 */
a61af66fc99e Initial load
duke
parents:
diff changeset
710 7.14072491382608190305e-05, /* 0x3F12B80F, 0x32F0A7E9 */
a61af66fc99e Initial load
duke
parents:
diff changeset
711 -1.85586374855275456654e-05, /* 0xBEF375CB, 0xDB605373 */
a61af66fc99e Initial load
duke
parents:
diff changeset
712 2.59073051863633712884e-05, /* 0x3EFB2A70, 0x74BF7AD4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
713 };
a61af66fc99e Initial load
duke
parents:
diff changeset
714
a61af66fc99e Initial load
duke
parents:
diff changeset
715 static double __kernel_tan(double x, double y, int iy)
a61af66fc99e Initial load
duke
parents:
diff changeset
716 {
a61af66fc99e Initial load
duke
parents:
diff changeset
717 double z,r,v,w,s;
a61af66fc99e Initial load
duke
parents:
diff changeset
718 int ix,hx;
a61af66fc99e Initial load
duke
parents:
diff changeset
719 hx = __HI(x); /* high word of x */
a61af66fc99e Initial load
duke
parents:
diff changeset
720 ix = hx&0x7fffffff; /* high word of |x| */
a61af66fc99e Initial load
duke
parents:
diff changeset
721 if(ix<0x3e300000) { /* x < 2**-28 */
a61af66fc99e Initial load
duke
parents:
diff changeset
722 if((int)x==0) { /* generate inexact */
a61af66fc99e Initial load
duke
parents:
diff changeset
723 if (((ix | __LO(x)) | (iy + 1)) == 0)
a61af66fc99e Initial load
duke
parents:
diff changeset
724 return one / fabsd(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
725 else {
a61af66fc99e Initial load
duke
parents:
diff changeset
726 if (iy == 1)
a61af66fc99e Initial load
duke
parents:
diff changeset
727 return x;
a61af66fc99e Initial load
duke
parents:
diff changeset
728 else { /* compute -1 / (x+y) carefully */
a61af66fc99e Initial load
duke
parents:
diff changeset
729 double a, t;
a61af66fc99e Initial load
duke
parents:
diff changeset
730
a61af66fc99e Initial load
duke
parents:
diff changeset
731 z = w = x + y;
a61af66fc99e Initial load
duke
parents:
diff changeset
732 __LO(z) = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
733 v = y - (z - x);
a61af66fc99e Initial load
duke
parents:
diff changeset
734 t = a = -one / w;
a61af66fc99e Initial load
duke
parents:
diff changeset
735 __LO(t) = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
736 s = one + t * z;
a61af66fc99e Initial load
duke
parents:
diff changeset
737 return t + a * (s + t * v);
a61af66fc99e Initial load
duke
parents:
diff changeset
738 }
a61af66fc99e Initial load
duke
parents:
diff changeset
739 }
a61af66fc99e Initial load
duke
parents:
diff changeset
740 }
a61af66fc99e Initial load
duke
parents:
diff changeset
741 }
a61af66fc99e Initial load
duke
parents:
diff changeset
742 if(ix>=0x3FE59428) { /* |x|>=0.6744 */
a61af66fc99e Initial load
duke
parents:
diff changeset
743 if(hx<0) {x = -x; y = -y;}
a61af66fc99e Initial load
duke
parents:
diff changeset
744 z = pio4-x;
a61af66fc99e Initial load
duke
parents:
diff changeset
745 w = pio4lo-y;
a61af66fc99e Initial load
duke
parents:
diff changeset
746 x = z+w; y = 0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
747 }
a61af66fc99e Initial load
duke
parents:
diff changeset
748 z = x*x;
a61af66fc99e Initial load
duke
parents:
diff changeset
749 w = z*z;
a61af66fc99e Initial load
duke
parents:
diff changeset
750 /* Break x^5*(T[1]+x^2*T[2]+...) into
a61af66fc99e Initial load
duke
parents:
diff changeset
751 * x^5(T[1]+x^4*T[3]+...+x^20*T[11]) +
a61af66fc99e Initial load
duke
parents:
diff changeset
752 * x^5(x^2*(T[2]+x^4*T[4]+...+x^22*[T12]))
a61af66fc99e Initial load
duke
parents:
diff changeset
753 */
a61af66fc99e Initial load
duke
parents:
diff changeset
754 r = T[1]+w*(T[3]+w*(T[5]+w*(T[7]+w*(T[9]+w*T[11]))));
a61af66fc99e Initial load
duke
parents:
diff changeset
755 v = z*(T[2]+w*(T[4]+w*(T[6]+w*(T[8]+w*(T[10]+w*T[12])))));
a61af66fc99e Initial load
duke
parents:
diff changeset
756 s = z*x;
a61af66fc99e Initial load
duke
parents:
diff changeset
757 r = y + z*(s*(r+v)+y);
a61af66fc99e Initial load
duke
parents:
diff changeset
758 r += T[0]*s;
a61af66fc99e Initial load
duke
parents:
diff changeset
759 w = x+r;
a61af66fc99e Initial load
duke
parents:
diff changeset
760 if(ix>=0x3FE59428) {
a61af66fc99e Initial load
duke
parents:
diff changeset
761 v = (double)iy;
a61af66fc99e Initial load
duke
parents:
diff changeset
762 return (double)(1-((hx>>30)&2))*(v-2.0*(x-(w*w/(w+v)-r)));
a61af66fc99e Initial load
duke
parents:
diff changeset
763 }
a61af66fc99e Initial load
duke
parents:
diff changeset
764 if(iy==1) return w;
a61af66fc99e Initial load
duke
parents:
diff changeset
765 else { /* if allow error up to 2 ulp,
a61af66fc99e Initial load
duke
parents:
diff changeset
766 simply return -1.0/(x+r) here */
a61af66fc99e Initial load
duke
parents:
diff changeset
767 /* compute -1.0/(x+r) accurately */
a61af66fc99e Initial load
duke
parents:
diff changeset
768 double a,t;
a61af66fc99e Initial load
duke
parents:
diff changeset
769 z = w;
a61af66fc99e Initial load
duke
parents:
diff changeset
770 __LO(z) = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
771 v = r-(z - x); /* z+v = r+x */
a61af66fc99e Initial load
duke
parents:
diff changeset
772 t = a = -1.0/w; /* a = -1.0/w */
a61af66fc99e Initial load
duke
parents:
diff changeset
773 __LO(t) = 0;
a61af66fc99e Initial load
duke
parents:
diff changeset
774 s = 1.0+t*z;
a61af66fc99e Initial load
duke
parents:
diff changeset
775 return t+a*(s+t*v);
a61af66fc99e Initial load
duke
parents:
diff changeset
776 }
a61af66fc99e Initial load
duke
parents:
diff changeset
777 }
a61af66fc99e Initial load
duke
parents:
diff changeset
778
a61af66fc99e Initial load
duke
parents:
diff changeset
779
a61af66fc99e Initial load
duke
parents:
diff changeset
780 //----------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
781 //
a61af66fc99e Initial load
duke
parents:
diff changeset
782 // Routines for new sin/cos implementation
a61af66fc99e Initial load
duke
parents:
diff changeset
783 //
a61af66fc99e Initial load
duke
parents:
diff changeset
784 //----------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
785
a61af66fc99e Initial load
duke
parents:
diff changeset
786 /* sin(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
787 * Return sine function of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
788 *
a61af66fc99e Initial load
duke
parents:
diff changeset
789 * kernel function:
a61af66fc99e Initial load
duke
parents:
diff changeset
790 * __kernel_sin ... sine function on [-pi/4,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
791 * __kernel_cos ... cose function on [-pi/4,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
792 * __ieee754_rem_pio2 ... argument reduction routine
a61af66fc99e Initial load
duke
parents:
diff changeset
793 *
a61af66fc99e Initial load
duke
parents:
diff changeset
794 * Method.
a61af66fc99e Initial load
duke
parents:
diff changeset
795 * Let S,C and T denote the sin, cos and tan respectively on
a61af66fc99e Initial load
duke
parents:
diff changeset
796 * [-PI/4, +PI/4]. Reduce the argument x to y1+y2 = x-k*pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
797 * in [-pi/4 , +pi/4], and let n = k mod 4.
a61af66fc99e Initial load
duke
parents:
diff changeset
798 * We have
a61af66fc99e Initial load
duke
parents:
diff changeset
799 *
a61af66fc99e Initial load
duke
parents:
diff changeset
800 * n sin(x) cos(x) tan(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
801 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
802 * 0 S C T
a61af66fc99e Initial load
duke
parents:
diff changeset
803 * 1 C -S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
804 * 2 -S -C T
a61af66fc99e Initial load
duke
parents:
diff changeset
805 * 3 -C S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
806 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
807 *
a61af66fc99e Initial load
duke
parents:
diff changeset
808 * Special cases:
a61af66fc99e Initial load
duke
parents:
diff changeset
809 * Let trig be any of sin, cos, or tan.
a61af66fc99e Initial load
duke
parents:
diff changeset
810 * trig(+-INF) is NaN, with signals;
a61af66fc99e Initial load
duke
parents:
diff changeset
811 * trig(NaN) is that NaN;
a61af66fc99e Initial load
duke
parents:
diff changeset
812 *
a61af66fc99e Initial load
duke
parents:
diff changeset
813 * Accuracy:
a61af66fc99e Initial load
duke
parents:
diff changeset
814 * TRIG(x) returns trig(x) nearly rounded
a61af66fc99e Initial load
duke
parents:
diff changeset
815 */
a61af66fc99e Initial load
duke
parents:
diff changeset
816
a61af66fc99e Initial load
duke
parents:
diff changeset
817 JRT_LEAF(jdouble, SharedRuntime::dsin(jdouble x))
a61af66fc99e Initial load
duke
parents:
diff changeset
818 double y[2],z=0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
819 int n, ix;
a61af66fc99e Initial load
duke
parents:
diff changeset
820
a61af66fc99e Initial load
duke
parents:
diff changeset
821 /* High word of x. */
a61af66fc99e Initial load
duke
parents:
diff changeset
822 ix = __HI(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
823
a61af66fc99e Initial load
duke
parents:
diff changeset
824 /* |x| ~< pi/4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
825 ix &= 0x7fffffff;
a61af66fc99e Initial load
duke
parents:
diff changeset
826 if(ix <= 0x3fe921fb) return __kernel_sin(x,z,0);
a61af66fc99e Initial load
duke
parents:
diff changeset
827
a61af66fc99e Initial load
duke
parents:
diff changeset
828 /* sin(Inf or NaN) is NaN */
a61af66fc99e Initial load
duke
parents:
diff changeset
829 else if (ix>=0x7ff00000) return x-x;
a61af66fc99e Initial load
duke
parents:
diff changeset
830
a61af66fc99e Initial load
duke
parents:
diff changeset
831 /* argument reduction needed */
a61af66fc99e Initial load
duke
parents:
diff changeset
832 else {
a61af66fc99e Initial load
duke
parents:
diff changeset
833 n = __ieee754_rem_pio2(x,y);
a61af66fc99e Initial load
duke
parents:
diff changeset
834 switch(n&3) {
a61af66fc99e Initial load
duke
parents:
diff changeset
835 case 0: return __kernel_sin(y[0],y[1],1);
a61af66fc99e Initial load
duke
parents:
diff changeset
836 case 1: return __kernel_cos(y[0],y[1]);
a61af66fc99e Initial load
duke
parents:
diff changeset
837 case 2: return -__kernel_sin(y[0],y[1],1);
a61af66fc99e Initial load
duke
parents:
diff changeset
838 default:
a61af66fc99e Initial load
duke
parents:
diff changeset
839 return -__kernel_cos(y[0],y[1]);
a61af66fc99e Initial load
duke
parents:
diff changeset
840 }
a61af66fc99e Initial load
duke
parents:
diff changeset
841 }
a61af66fc99e Initial load
duke
parents:
diff changeset
842 JRT_END
a61af66fc99e Initial load
duke
parents:
diff changeset
843
a61af66fc99e Initial load
duke
parents:
diff changeset
844 /* cos(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
845 * Return cosine function of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
846 *
a61af66fc99e Initial load
duke
parents:
diff changeset
847 * kernel function:
a61af66fc99e Initial load
duke
parents:
diff changeset
848 * __kernel_sin ... sine function on [-pi/4,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
849 * __kernel_cos ... cosine function on [-pi/4,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
850 * __ieee754_rem_pio2 ... argument reduction routine
a61af66fc99e Initial load
duke
parents:
diff changeset
851 *
a61af66fc99e Initial load
duke
parents:
diff changeset
852 * Method.
a61af66fc99e Initial load
duke
parents:
diff changeset
853 * Let S,C and T denote the sin, cos and tan respectively on
a61af66fc99e Initial load
duke
parents:
diff changeset
854 * [-PI/4, +PI/4]. Reduce the argument x to y1+y2 = x-k*pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
855 * in [-pi/4 , +pi/4], and let n = k mod 4.
a61af66fc99e Initial load
duke
parents:
diff changeset
856 * We have
a61af66fc99e Initial load
duke
parents:
diff changeset
857 *
a61af66fc99e Initial load
duke
parents:
diff changeset
858 * n sin(x) cos(x) tan(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
859 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
860 * 0 S C T
a61af66fc99e Initial load
duke
parents:
diff changeset
861 * 1 C -S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
862 * 2 -S -C T
a61af66fc99e Initial load
duke
parents:
diff changeset
863 * 3 -C S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
864 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
865 *
a61af66fc99e Initial load
duke
parents:
diff changeset
866 * Special cases:
a61af66fc99e Initial load
duke
parents:
diff changeset
867 * Let trig be any of sin, cos, or tan.
a61af66fc99e Initial load
duke
parents:
diff changeset
868 * trig(+-INF) is NaN, with signals;
a61af66fc99e Initial load
duke
parents:
diff changeset
869 * trig(NaN) is that NaN;
a61af66fc99e Initial load
duke
parents:
diff changeset
870 *
a61af66fc99e Initial load
duke
parents:
diff changeset
871 * Accuracy:
a61af66fc99e Initial load
duke
parents:
diff changeset
872 * TRIG(x) returns trig(x) nearly rounded
a61af66fc99e Initial load
duke
parents:
diff changeset
873 */
a61af66fc99e Initial load
duke
parents:
diff changeset
874
a61af66fc99e Initial load
duke
parents:
diff changeset
875 JRT_LEAF(jdouble, SharedRuntime::dcos(jdouble x))
a61af66fc99e Initial load
duke
parents:
diff changeset
876 double y[2],z=0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
877 int n, ix;
a61af66fc99e Initial load
duke
parents:
diff changeset
878
a61af66fc99e Initial load
duke
parents:
diff changeset
879 /* High word of x. */
a61af66fc99e Initial load
duke
parents:
diff changeset
880 ix = __HI(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
881
a61af66fc99e Initial load
duke
parents:
diff changeset
882 /* |x| ~< pi/4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
883 ix &= 0x7fffffff;
a61af66fc99e Initial load
duke
parents:
diff changeset
884 if(ix <= 0x3fe921fb) return __kernel_cos(x,z);
a61af66fc99e Initial load
duke
parents:
diff changeset
885
a61af66fc99e Initial load
duke
parents:
diff changeset
886 /* cos(Inf or NaN) is NaN */
a61af66fc99e Initial load
duke
parents:
diff changeset
887 else if (ix>=0x7ff00000) return x-x;
a61af66fc99e Initial load
duke
parents:
diff changeset
888
a61af66fc99e Initial load
duke
parents:
diff changeset
889 /* argument reduction needed */
a61af66fc99e Initial load
duke
parents:
diff changeset
890 else {
a61af66fc99e Initial load
duke
parents:
diff changeset
891 n = __ieee754_rem_pio2(x,y);
a61af66fc99e Initial load
duke
parents:
diff changeset
892 switch(n&3) {
a61af66fc99e Initial load
duke
parents:
diff changeset
893 case 0: return __kernel_cos(y[0],y[1]);
a61af66fc99e Initial load
duke
parents:
diff changeset
894 case 1: return -__kernel_sin(y[0],y[1],1);
a61af66fc99e Initial load
duke
parents:
diff changeset
895 case 2: return -__kernel_cos(y[0],y[1]);
a61af66fc99e Initial load
duke
parents:
diff changeset
896 default:
a61af66fc99e Initial load
duke
parents:
diff changeset
897 return __kernel_sin(y[0],y[1],1);
a61af66fc99e Initial load
duke
parents:
diff changeset
898 }
a61af66fc99e Initial load
duke
parents:
diff changeset
899 }
a61af66fc99e Initial load
duke
parents:
diff changeset
900 JRT_END
a61af66fc99e Initial load
duke
parents:
diff changeset
901
a61af66fc99e Initial load
duke
parents:
diff changeset
902 /* tan(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
903 * Return tangent function of x.
a61af66fc99e Initial load
duke
parents:
diff changeset
904 *
a61af66fc99e Initial load
duke
parents:
diff changeset
905 * kernel function:
a61af66fc99e Initial load
duke
parents:
diff changeset
906 * __kernel_tan ... tangent function on [-pi/4,pi/4]
a61af66fc99e Initial load
duke
parents:
diff changeset
907 * __ieee754_rem_pio2 ... argument reduction routine
a61af66fc99e Initial load
duke
parents:
diff changeset
908 *
a61af66fc99e Initial load
duke
parents:
diff changeset
909 * Method.
a61af66fc99e Initial load
duke
parents:
diff changeset
910 * Let S,C and T denote the sin, cos and tan respectively on
a61af66fc99e Initial load
duke
parents:
diff changeset
911 * [-PI/4, +PI/4]. Reduce the argument x to y1+y2 = x-k*pi/2
a61af66fc99e Initial load
duke
parents:
diff changeset
912 * in [-pi/4 , +pi/4], and let n = k mod 4.
a61af66fc99e Initial load
duke
parents:
diff changeset
913 * We have
a61af66fc99e Initial load
duke
parents:
diff changeset
914 *
a61af66fc99e Initial load
duke
parents:
diff changeset
915 * n sin(x) cos(x) tan(x)
a61af66fc99e Initial load
duke
parents:
diff changeset
916 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
917 * 0 S C T
a61af66fc99e Initial load
duke
parents:
diff changeset
918 * 1 C -S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
919 * 2 -S -C T
a61af66fc99e Initial load
duke
parents:
diff changeset
920 * 3 -C S -1/T
a61af66fc99e Initial load
duke
parents:
diff changeset
921 * ----------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
922 *
a61af66fc99e Initial load
duke
parents:
diff changeset
923 * Special cases:
a61af66fc99e Initial load
duke
parents:
diff changeset
924 * Let trig be any of sin, cos, or tan.
a61af66fc99e Initial load
duke
parents:
diff changeset
925 * trig(+-INF) is NaN, with signals;
a61af66fc99e Initial load
duke
parents:
diff changeset
926 * trig(NaN) is that NaN;
a61af66fc99e Initial load
duke
parents:
diff changeset
927 *
a61af66fc99e Initial load
duke
parents:
diff changeset
928 * Accuracy:
a61af66fc99e Initial load
duke
parents:
diff changeset
929 * TRIG(x) returns trig(x) nearly rounded
a61af66fc99e Initial load
duke
parents:
diff changeset
930 */
a61af66fc99e Initial load
duke
parents:
diff changeset
931
a61af66fc99e Initial load
duke
parents:
diff changeset
932 JRT_LEAF(jdouble, SharedRuntime::dtan(jdouble x))
a61af66fc99e Initial load
duke
parents:
diff changeset
933 double y[2],z=0.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
934 int n, ix;
a61af66fc99e Initial load
duke
parents:
diff changeset
935
a61af66fc99e Initial load
duke
parents:
diff changeset
936 /* High word of x. */
a61af66fc99e Initial load
duke
parents:
diff changeset
937 ix = __HI(x);
a61af66fc99e Initial load
duke
parents:
diff changeset
938
a61af66fc99e Initial load
duke
parents:
diff changeset
939 /* |x| ~< pi/4 */
a61af66fc99e Initial load
duke
parents:
diff changeset
940 ix &= 0x7fffffff;
a61af66fc99e Initial load
duke
parents:
diff changeset
941 if(ix <= 0x3fe921fb) return __kernel_tan(x,z,1);
a61af66fc99e Initial load
duke
parents:
diff changeset
942
a61af66fc99e Initial load
duke
parents:
diff changeset
943 /* tan(Inf or NaN) is NaN */
a61af66fc99e Initial load
duke
parents:
diff changeset
944 else if (ix>=0x7ff00000) return x-x; /* NaN */
a61af66fc99e Initial load
duke
parents:
diff changeset
945
a61af66fc99e Initial load
duke
parents:
diff changeset
946 /* argument reduction needed */
a61af66fc99e Initial load
duke
parents:
diff changeset
947 else {
a61af66fc99e Initial load
duke
parents:
diff changeset
948 n = __ieee754_rem_pio2(x,y);
a61af66fc99e Initial load
duke
parents:
diff changeset
949 return __kernel_tan(y[0],y[1],1-((n&1)<<1)); /* 1 -- n even
a61af66fc99e Initial load
duke
parents:
diff changeset
950 -1 -- n odd */
a61af66fc99e Initial load
duke
parents:
diff changeset
951 }
a61af66fc99e Initial load
duke
parents:
diff changeset
952 JRT_END
a61af66fc99e Initial load
duke
parents:
diff changeset
953
a61af66fc99e Initial load
duke
parents:
diff changeset
954
a61af66fc99e Initial load
duke
parents:
diff changeset
955 #ifdef WIN32
a61af66fc99e Initial load
duke
parents:
diff changeset
956 # pragma optimize ( "", on )
a61af66fc99e Initial load
duke
parents:
diff changeset
957 #endif