/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
 */
/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

/*
 * Select the spelling of the `restrict' qualifier used below: when the
 * build defines __RESTRICT it is mapped to `_Restrict', otherwise it is
 * defined away so the qualifier disappears from the declarations.
 */
#ifdef __RESTRICT
#define restrict _Restrict
#else
#define restrict
#endif

/*
 * __vatanf - arctangent of a strided vector of floats.
 *
 *	n	 number of elements to process; nothing is done if n <= 0
 *	x	 first input element
 *	stridex	 distance, in floats, between consecutive inputs
 *	y	 first output element
 *	stridey	 distance, in floats, between consecutive outputs
 *
 * Every input is split into a sign and a magnitude and then classified
 * by the bit pattern of the magnitude:
 *
 *	NaN			x - x is stored
 *	|x| < 2**-28		x itself is stored
 *	|x| > 2**55, Inf	+-__vlibm_TBL_atan1[2] is stored
 *	64 < |x| <= 2**55	t = -1/|x|, table index 2
 *	1/64 <= |x| <= 64	z = |x| rounded to 4 fraction bits,
 *				t = (|x| - z)/(1 + |x|*z),
 *				table index derived from z
 *	2**-28 <= |x| < 1/64	t = |x|, table index 0
 *
 * Results of the first three classes are stored as soon as the input
 * has been read.  The remaining ("good") arguments are collected in
 * groups of up to NLANES and finished together as
 *
 *	sign * (float)(__vlibm_TBL_atan1[index] + (t + p1*t**3))
 *
 * The code assumes that int and float are both 32 bits wide.
 */
void
__vatanf(int n, float * restrict x, int stridex, float * restrict y,
    int stridey)
{
	/* Table of double constants defined elsewhere in the library. */
	extern const double __vlibm_TBL_atan1[];

	/* Number of good arguments that are evaluated as one group. */
#ifdef UNROLL4
	enum { NLANES = 4 };
#else
	enum { NLANES = 3 };
#endif

	/*
	 * Coefficient of the cubic term; only this term of the series
	 * is used.  The value is kept exactly as in the original source.
	 */
	static const float p1 = -0.33329644f;
	static const float pone = 1.0f;

	/* float <-> bit pattern conversion without pointer casts */
	union {
		float	f;
		int	i;
	} bits;

	float	f[NLANES];	/* reduced arguments			*/
	float	sign[NLANES];	/* +1.0 or -1.0 for each argument	*/
	int	tblidx[NLANES];	/* index into __vlibm_TBL_atan1		*/
	float	*yaddr[NLANES];	/* where each result has to be stored	*/
	float	dummy;
	int	argcount, lane;

	while (n > 0) {
		/*
		 * Gather phase: consume inputs until NLANES good
		 * arguments are pending or the input is exhausted.
		 */
		argcount = 0;
		do {
			float	arg, sgn, ansf, z;
			int	intf, intz, idx;

			bits.f = *x;
			intf = bits.i;		/* bit pattern of the input */
			arg = bits.f;
			sgn = pone;
			if (intf < 0) {		/* sign bit set */
				intf &= 0x7fffffff;
				arg = -arg;
				sgn = -sgn;
			}

			if (intf > 0x5B000000 || intf < 0x31800000) {
				/* special cases: stored immediately */
				if (intf > 0x7f800000) {
					/* NaN in, NaN out */
					ansf = arg - arg;
				} else if (intf < 0x31800000) {
					/*
					 * |x| < 2**-28: the result is x.
					 * The sum below is discarded; it is
					 * inexact for nonzero x, presumably
					 * to signal an inexact result.
					 */
					dummy = 1.0e37 + arg;
					(void) dummy;
					ansf = arg;
				} else {
					/*
					 * |x| > 2**55 or infinite: use the
					 * table entry that the original
					 * comments describe as pi/2.
					 */
					ansf = __vlibm_TBL_atan1[2];
				}
				*y = sgn * ansf;
			} else {
				if (intf > 0x42800000) {
					/* |x| > 64 */
					arg = -pone / arg;
					idx = 2;
				} else if (intf >= 0x3C800000) {
					/*
					 * 1/64 <= |x| <= 64: round the
					 * magnitude to 4 fraction bits (z)
					 * and reduce around it.
					 */
					intz = (intf + 0x00040000) &
					    0x7ff80000;
					bits.i = intz;
					z = bits.f;
					arg = (arg - z) / (pone + arg * z);
					/*
					 * Two table slots per step of z;
					 * the first four slots belong to
					 * the other two cases.
					 */
					idx = ((intz - 0x3C800000) >> 18) + 4;
				} else {
					/* |x| < 1/64: no reduction */
					idx = 0;
				}
				f[argcount] = arg;
				sign[argcount] = sgn;
				tblidx[argcount] = idx;
				yaddr[argcount] = y;
				argcount++;
			}

			x += stridex;
			y += stridey;
		} while (--n > 0 && argcount < NLANES);

		/*
		 * Evaluation phase: finish the pending good arguments,
		 * oldest first.  There may be fewer than NLANES of them
		 * (or none) when the input ran out.
		 */
		for (lane = 0; lane < argcount; lane++) {
			double	conup = __vlibm_TBL_atan1[tblidx[lane]];
			float	t = f[lane];
			float	poly = p1 * t * t * t + t;

			*yaddr[lane] = sign[lane] * (float)(conup + poly);
		}
	}
}