125c28e83SPiotr Jasiukajtis /*
225c28e83SPiotr Jasiukajtis  * CDDL HEADER START
325c28e83SPiotr Jasiukajtis  *
425c28e83SPiotr Jasiukajtis  * The contents of this file are subject to the terms of the
525c28e83SPiotr Jasiukajtis  * Common Development and Distribution License (the "License").
625c28e83SPiotr Jasiukajtis  * You may not use this file except in compliance with the License.
725c28e83SPiotr Jasiukajtis  *
825c28e83SPiotr Jasiukajtis  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
925c28e83SPiotr Jasiukajtis  * or http://www.opensolaris.org/os/licensing.
1025c28e83SPiotr Jasiukajtis  * See the License for the specific language governing permissions
1125c28e83SPiotr Jasiukajtis  * and limitations under the License.
1225c28e83SPiotr Jasiukajtis  *
1325c28e83SPiotr Jasiukajtis  * When distributing Covered Code, include this CDDL HEADER in each
1425c28e83SPiotr Jasiukajtis  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
1525c28e83SPiotr Jasiukajtis  * If applicable, add the following below this CDDL HEADER, with the
1625c28e83SPiotr Jasiukajtis  * fields enclosed by brackets "[]" replaced with your own identifying
1725c28e83SPiotr Jasiukajtis  * information: Portions Copyright [yyyy] [name of copyright owner]
1825c28e83SPiotr Jasiukajtis  *
1925c28e83SPiotr Jasiukajtis  * CDDL HEADER END
2025c28e83SPiotr Jasiukajtis  */
2125c28e83SPiotr Jasiukajtis 
2225c28e83SPiotr Jasiukajtis /*
2325c28e83SPiotr Jasiukajtis  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
2425c28e83SPiotr Jasiukajtis  * Use is subject to license terms.
2525c28e83SPiotr Jasiukajtis  */
2625c28e83SPiotr Jasiukajtis 
2725c28e83SPiotr Jasiukajtis /*
2825c28e83SPiotr Jasiukajtis  * Copyright 2011, Richard Lowe.
2925c28e83SPiotr Jasiukajtis  */
3025c28e83SPiotr Jasiukajtis 
3125c28e83SPiotr Jasiukajtis /* Functions in this file are duplicated in locallibm.il.  Keep them in sync */
3225c28e83SPiotr Jasiukajtis 
3325c28e83SPiotr Jasiukajtis #ifndef _LIBM_INLINES_H
3425c28e83SPiotr Jasiukajtis #define	_LIBM_INLINES_H
3525c28e83SPiotr Jasiukajtis 
3625c28e83SPiotr Jasiukajtis #ifdef __GNUC__
3725c28e83SPiotr Jasiukajtis 
3825c28e83SPiotr Jasiukajtis #include <sys/types.h>
3925c28e83SPiotr Jasiukajtis #include <sys/ieeefp.h>
4025c28e83SPiotr Jasiukajtis 
4125c28e83SPiotr Jasiukajtis #ifdef __cplusplus
4225c28e83SPiotr Jasiukajtis extern "C" {
4325c28e83SPiotr Jasiukajtis #endif
4425c28e83SPiotr Jasiukajtis 
45*7f11fd00SRichard Lowe extern __GNU_INLINE double
4625c28e83SPiotr Jasiukajtis __inline_sqrt(double d)
4725c28e83SPiotr Jasiukajtis {
4825c28e83SPiotr Jasiukajtis 	double ret;
4925c28e83SPiotr Jasiukajtis 
5025c28e83SPiotr Jasiukajtis 	__asm__ __volatile__("fsqrtd %1,%0\n\t" : "=e" (ret) : "e" (d));
5125c28e83SPiotr Jasiukajtis 	return (ret);
5225c28e83SPiotr Jasiukajtis }
5325c28e83SPiotr Jasiukajtis 
54*7f11fd00SRichard Lowe extern __GNU_INLINE float
5525c28e83SPiotr Jasiukajtis __inline_sqrtf(float f)
5625c28e83SPiotr Jasiukajtis {
5725c28e83SPiotr Jasiukajtis 	float ret;
5825c28e83SPiotr Jasiukajtis 
5925c28e83SPiotr Jasiukajtis 	__asm__ __volatile__("fsqrts %1,%0\n\t" : "=f" (ret) : "f" (f));
6025c28e83SPiotr Jasiukajtis 	return (ret);
6125c28e83SPiotr Jasiukajtis }
6225c28e83SPiotr Jasiukajtis 
63*7f11fd00SRichard Lowe extern __GNU_INLINE enum fp_class_type
6425c28e83SPiotr Jasiukajtis fp_classf(float f)
6525c28e83SPiotr Jasiukajtis {
6625c28e83SPiotr Jasiukajtis 	enum fp_class_type ret;
6725c28e83SPiotr Jasiukajtis 	uint32_t tmp;
6825c28e83SPiotr Jasiukajtis 
6925c28e83SPiotr Jasiukajtis 	/* XXX: Separate input and output */
7025c28e83SPiotr Jasiukajtis 	__asm__ __volatile__(
7125c28e83SPiotr Jasiukajtis 	    "sethi  %%hi(0x80000000),%1\n\t"
7225c28e83SPiotr Jasiukajtis 	    "andncc %2,%1,%0\n\t"
7325c28e83SPiotr Jasiukajtis 	    "bne    1f\n\t"
7425c28e83SPiotr Jasiukajtis 	    "nop\n\t"
7525c28e83SPiotr Jasiukajtis 	    "mov    0,%0\n\t"
7625c28e83SPiotr Jasiukajtis 	    "ba	2f\n\t"		/* x is 0 */
7725c28e83SPiotr Jasiukajtis 	    "nop\n\t"
7825c28e83SPiotr Jasiukajtis 	    "1:\n\t"
7925c28e83SPiotr Jasiukajtis 	    "sethi  %%hi(0x7f800000),%1\n\t"
8025c28e83SPiotr Jasiukajtis 	    "andcc  %0,%1,%%g0\n\t"
8125c28e83SPiotr Jasiukajtis 	    "bne    1f\n\t"
8225c28e83SPiotr Jasiukajtis 	    "nop\n\t"
8325c28e83SPiotr Jasiukajtis 	    "mov    1,%0\n\t"
8425c28e83SPiotr Jasiukajtis 	    "ba	    2f\n\t"	/* x is subnormal */
8525c28e83SPiotr Jasiukajtis 	    "nop\n\t"
8625c28e83SPiotr Jasiukajtis 	    "1:\n\t"
8725c28e83SPiotr Jasiukajtis 	    "cmp    %0,%1\n\t"
8825c28e83SPiotr Jasiukajtis 	    "bge    1f\n\t"
8925c28e83SPiotr Jasiukajtis 	    "nop\n\t"
9025c28e83SPiotr Jasiukajtis 	    "mov    2,%0\n\t"
9125c28e83SPiotr Jasiukajtis 	    "ba	    2f\n\t"	/* x is normal */
9225c28e83SPiotr Jasiukajtis 	    "nop\n\t"
9325c28e83SPiotr Jasiukajtis 	    "1:\n\t"
9425c28e83SPiotr Jasiukajtis 	    "bg	    1f\n\t"
9525c28e83SPiotr Jasiukajtis 	    "nop\n\t"
9625c28e83SPiotr Jasiukajtis 	    "mov    3,%0\n\t"
9725c28e83SPiotr Jasiukajtis 	    "ba	    2f\n\t"	/* x is __infinity */
9825c28e83SPiotr Jasiukajtis 	    "nop\n\t"
9925c28e83SPiotr Jasiukajtis 	    "1:\n\t"
10025c28e83SPiotr Jasiukajtis 	    "sethi  %%hi(0x00400000),%1\n\t"
10125c28e83SPiotr Jasiukajtis 	    "andcc  %0,%1,%%g0\n\t"
10225c28e83SPiotr Jasiukajtis 	    "mov    4,%0\n\t"	/* x is quiet NaN */
10325c28e83SPiotr Jasiukajtis 	    "bne    2f\n\t"
10425c28e83SPiotr Jasiukajtis 	    "nop\n\t"
10525c28e83SPiotr Jasiukajtis 	    "mov    5,%0\n\t"	/* x is signaling NaN */
10625c28e83SPiotr Jasiukajtis 	    "2:\n\t"
10725c28e83SPiotr Jasiukajtis 	    : "=r" (ret), "=&r" (tmp)
10825c28e83SPiotr Jasiukajtis 	    : "r" (f)
10925c28e83SPiotr Jasiukajtis 	    : "cc");
11025c28e83SPiotr Jasiukajtis 	return (ret);
11125c28e83SPiotr Jasiukajtis }
11225c28e83SPiotr Jasiukajtis 
11325c28e83SPiotr Jasiukajtis #define	_HI_WORD(x)	((uint32_t *)&x)[0]
11425c28e83SPiotr Jasiukajtis #define	_LO_WORD(x)	((uint32_t *)&x)[1]
11525c28e83SPiotr Jasiukajtis 
116*7f11fd00SRichard Lowe extern __GNU_INLINE enum fp_class_type
11725c28e83SPiotr Jasiukajtis fp_class(double d)
11825c28e83SPiotr Jasiukajtis {
11925c28e83SPiotr Jasiukajtis 	enum fp_class_type ret;
12025c28e83SPiotr Jasiukajtis 	uint32_t tmp;
12125c28e83SPiotr Jasiukajtis 
12225c28e83SPiotr Jasiukajtis 	__asm__ __volatile__(
12325c28e83SPiotr Jasiukajtis 	    "sethi %%hi(0x80000000),%1\n\t"	/* %1 gets 80000000 */
12425c28e83SPiotr Jasiukajtis 	    "andn  %2,%1,%0\n\t"		/* %2-%0 gets abs(x) */
12525c28e83SPiotr Jasiukajtis 	    "orcc  %0,%3,%%g0\n\t"		/* set cc as x is zero/nonzero */
12625c28e83SPiotr Jasiukajtis 	    "bne   1f\n\t"			/* branch if x is nonzero */
12725c28e83SPiotr Jasiukajtis 	    "nop\n\t"
12825c28e83SPiotr Jasiukajtis 	    "mov   0,%0\n\t"
12925c28e83SPiotr Jasiukajtis 	    "ba	   2f\n\t"			/* x is 0 */
13025c28e83SPiotr Jasiukajtis 	    "nop\n\t"
13125c28e83SPiotr Jasiukajtis 	    "1:\n\t"
13225c28e83SPiotr Jasiukajtis 	    "sethi %%hi(0x7ff00000),%1\n\t"	/* %1 gets 7ff00000 */
13325c28e83SPiotr Jasiukajtis 	    "andcc %0,%1,%%g0\n\t"		/* cc set by __exp field of x */
13425c28e83SPiotr Jasiukajtis 	    "bne   1f\n\t"			/* branch if normal or max __exp */
13525c28e83SPiotr Jasiukajtis 	    "nop\n\t"
13625c28e83SPiotr Jasiukajtis 	    "mov   1,%0\n\t"
13725c28e83SPiotr Jasiukajtis 	    "ba	   2f\n\t"			/* x is subnormal */
13825c28e83SPiotr Jasiukajtis 	    "nop\n\t"
13925c28e83SPiotr Jasiukajtis 	    "1:\n\t"
14025c28e83SPiotr Jasiukajtis 	    "cmp   %0,%1\n\t"
14125c28e83SPiotr Jasiukajtis 	    "bge   1f\n\t"			/* branch if x is max __exp */
14225c28e83SPiotr Jasiukajtis 	    "nop\n\t"
14325c28e83SPiotr Jasiukajtis 	    "mov   2,%0\n\t"
14425c28e83SPiotr Jasiukajtis 	    "ba	   2f\n\t"			/* x is normal */
14525c28e83SPiotr Jasiukajtis 	    "nop\n\t"
14625c28e83SPiotr Jasiukajtis 	    "1:\n\t"
14725c28e83SPiotr Jasiukajtis 	    "andn  %0,%1,%0\n\t"		/* o0 gets msw __significand field */
14825c28e83SPiotr Jasiukajtis 	    "orcc  %0,%3,%%g0\n\t"		/* set cc by OR __significand */
14925c28e83SPiotr Jasiukajtis 	    "bne   1f\n\t"			/* Branch if __nan */
15025c28e83SPiotr Jasiukajtis 	    "nop\n\t"
15125c28e83SPiotr Jasiukajtis 	    "mov   3,%0\n\t"
15225c28e83SPiotr Jasiukajtis 	    "ba	   2f\n\t"			/* x is __infinity */
15325c28e83SPiotr Jasiukajtis 	    "nop\n\t"
15425c28e83SPiotr Jasiukajtis 	    "1:\n\t"
15525c28e83SPiotr Jasiukajtis 	    "sethi %%hi(0x00080000),%1\n\t"
15625c28e83SPiotr Jasiukajtis 	    "andcc %0,%1,%%g0\n\t"		/* set cc by quiet/sig bit */
15725c28e83SPiotr Jasiukajtis 	    "be	   1f\n\t"			/* Branch if signaling */
15825c28e83SPiotr Jasiukajtis 	    "nop\n\t"
15925c28e83SPiotr Jasiukajtis 	    "mov   4,%0\n\t"			/* x is quiet NaN */
16025c28e83SPiotr Jasiukajtis 	    "ba	   2f\n\t"
16125c28e83SPiotr Jasiukajtis 	    "nop\n\t"
16225c28e83SPiotr Jasiukajtis 	    "1:\n\t"
16325c28e83SPiotr Jasiukajtis 	    "mov   5,%0\n\t"			/* x is signaling NaN */
16425c28e83SPiotr Jasiukajtis 	    "2:\n\t"
16525c28e83SPiotr Jasiukajtis 	    : "=&r" (ret), "=&r" (tmp)
16625c28e83SPiotr Jasiukajtis 	    : "r" (_HI_WORD(d)), "r" (_LO_WORD(d))
16725c28e83SPiotr Jasiukajtis 	    : "cc");
16825c28e83SPiotr Jasiukajtis 
16925c28e83SPiotr Jasiukajtis 	return (ret);
17025c28e83SPiotr Jasiukajtis }
17125c28e83SPiotr Jasiukajtis 
172*7f11fd00SRichard Lowe extern __GNU_INLINE int
17325c28e83SPiotr Jasiukajtis __swapEX(int i)
17425c28e83SPiotr Jasiukajtis {
17525c28e83SPiotr Jasiukajtis 	int ret;
17625c28e83SPiotr Jasiukajtis 	uint32_t fsr;
17725c28e83SPiotr Jasiukajtis 	uint32_t tmp1, tmp2;
17825c28e83SPiotr Jasiukajtis 
17925c28e83SPiotr Jasiukajtis 	__asm__ __volatile__(
18025c28e83SPiotr Jasiukajtis 	    "and  %4,0x1f,%2\n\t" /* tmp1 = %2 = %o1 */
18125c28e83SPiotr Jasiukajtis 	    "sll  %2,5,%2\n\t"	/* shift input to aexc bit location */
18225c28e83SPiotr Jasiukajtis 	    ".volatile\n\t"
18325c28e83SPiotr Jasiukajtis 	    "st   %%fsr,%1\n\t"
18425c28e83SPiotr Jasiukajtis 	    "ld   %1,%0\n\t"	/* %0 = fsr */
18525c28e83SPiotr Jasiukajtis 	    "andn %0,0x3e0,%3\n\t" /* tmp2 = %3 = %o2 */
18625c28e83SPiotr Jasiukajtis 	    "or   %2,%3,%2\n\t"	/* %2 = new fsr */
18725c28e83SPiotr Jasiukajtis 	    "st	  %2,%1\n\t"
18825c28e83SPiotr Jasiukajtis 	    "ld	  %1,%%fsr\n\t"
18925c28e83SPiotr Jasiukajtis 	    "srl  %0,5,%0\n\t"
19025c28e83SPiotr Jasiukajtis 	    "and  %0,0x1f,%0\n\t" /* %0 = ret = %o0 */
19125c28e83SPiotr Jasiukajtis 	    ".nonvolatile\n\t"
19225c28e83SPiotr Jasiukajtis 	    : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2)
19325c28e83SPiotr Jasiukajtis 	    : "r" (i)
19425c28e83SPiotr Jasiukajtis 	    : "cc");
19525c28e83SPiotr Jasiukajtis 
19625c28e83SPiotr Jasiukajtis 	return (ret);
19725c28e83SPiotr Jasiukajtis }
19825c28e83SPiotr Jasiukajtis 
19925c28e83SPiotr Jasiukajtis /*
20025c28e83SPiotr Jasiukajtis  * On the SPARC, __swapRP is a no-op; always return 0 for backward
20125c28e83SPiotr Jasiukajtis  * compatibility
20225c28e83SPiotr Jasiukajtis  */
20325c28e83SPiotr Jasiukajtis /* ARGSUSED */
204*7f11fd00SRichard Lowe extern __GNU_INLINE enum fp_precision_type
20525c28e83SPiotr Jasiukajtis __swapRP(enum fp_precision_type i)
20625c28e83SPiotr Jasiukajtis {
20725c28e83SPiotr Jasiukajtis 	return (0);
20825c28e83SPiotr Jasiukajtis }
20925c28e83SPiotr Jasiukajtis 
210*7f11fd00SRichard Lowe extern __GNU_INLINE enum fp_direction_type
21125c28e83SPiotr Jasiukajtis __swapRD(enum fp_direction_type d)
21225c28e83SPiotr Jasiukajtis {
21325c28e83SPiotr Jasiukajtis 	enum fp_direction_type ret;
21425c28e83SPiotr Jasiukajtis 	uint32_t fsr;
21525c28e83SPiotr Jasiukajtis 	uint32_t tmp1, tmp2, tmp3;
21625c28e83SPiotr Jasiukajtis 
21725c28e83SPiotr Jasiukajtis 	__asm__ __volatile__(
21825c28e83SPiotr Jasiukajtis 	    "and  %5,0x3,%0\n\t"
21925c28e83SPiotr Jasiukajtis 	    "sll  %0,30,%2\n\t"		/* shift input to RD bit location */
22025c28e83SPiotr Jasiukajtis 	    ".volatile\n\t"
22125c28e83SPiotr Jasiukajtis 	    "st   %%fsr,%1\n\t"
22225c28e83SPiotr Jasiukajtis 	    "ld	  %1,%0\n\t"		/* %0 = fsr */
22325c28e83SPiotr Jasiukajtis 	    "set  0xc0000000,%4\n\t"	/* mask of rounding direction bits */
22425c28e83SPiotr Jasiukajtis 	    "andn %0,%4,%3\n\t"
22525c28e83SPiotr Jasiukajtis 	    "or   %2,%3,%2\n\t"		/* %2 = new fsr */
22625c28e83SPiotr Jasiukajtis 	    "st	  %2,%1\n\t"
22725c28e83SPiotr Jasiukajtis 	    "ld	  %1,%%fsr\n\t"
22825c28e83SPiotr Jasiukajtis 	    "srl  %0,30,%0\n\t"
22925c28e83SPiotr Jasiukajtis 	    "and  %0,0x3,%0\n\t"
23025c28e83SPiotr Jasiukajtis 	    ".nonvolatile\n\t"
23125c28e83SPiotr Jasiukajtis 	    : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2), "=r" (tmp3)
23225c28e83SPiotr Jasiukajtis 	    : "r" (d)
23325c28e83SPiotr Jasiukajtis 	    : "cc");
23425c28e83SPiotr Jasiukajtis 
23525c28e83SPiotr Jasiukajtis 	return (ret);
23625c28e83SPiotr Jasiukajtis }
23725c28e83SPiotr Jasiukajtis 
238*7f11fd00SRichard Lowe extern __GNU_INLINE int
23925c28e83SPiotr Jasiukajtis __swapTE(int i)
24025c28e83SPiotr Jasiukajtis {
24125c28e83SPiotr Jasiukajtis 	int ret;
24225c28e83SPiotr Jasiukajtis 	uint32_t fsr, tmp1, tmp2;
24325c28e83SPiotr Jasiukajtis 
24425c28e83SPiotr Jasiukajtis 	__asm__ __volatile__(
24525c28e83SPiotr Jasiukajtis 	    "and  %4,0x1f,%0\n\t"
24625c28e83SPiotr Jasiukajtis 	    "sll  %0,23,%2\n\t"		/* shift input to TEM bit location */
24725c28e83SPiotr Jasiukajtis 	    ".volatile\n\t"
24825c28e83SPiotr Jasiukajtis 	    "st   %%fsr,%1\n\t"
24925c28e83SPiotr Jasiukajtis 	    "ld	  %1,%0\n\t"		/* %0 = fsr */
25025c28e83SPiotr Jasiukajtis 	    "set  0x0f800000,%3\n\t"	/* mask of TEM (Trap Enable Mode bits) */
25125c28e83SPiotr Jasiukajtis 	    "andn %0,%3,%3\n\t"
25225c28e83SPiotr Jasiukajtis 	    "or   %2,%3,%2\n\t"		/* %2 = new fsr */
25325c28e83SPiotr Jasiukajtis 	    "st	  %2,%1\n\t"
25425c28e83SPiotr Jasiukajtis 	    "ld	  %1,%%fsr\n\t"
25525c28e83SPiotr Jasiukajtis 	    "srl  %0,23,%0\n\t"
25625c28e83SPiotr Jasiukajtis 	    "and  %0,0x1f,%0\n\t"
25725c28e83SPiotr Jasiukajtis 	    ".nonvolatile\n\t"
25825c28e83SPiotr Jasiukajtis 	    : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2)
25925c28e83SPiotr Jasiukajtis 	    : "r" (i)
26025c28e83SPiotr Jasiukajtis 	    : "cc");
26125c28e83SPiotr Jasiukajtis 
26225c28e83SPiotr Jasiukajtis 	return (ret);
26325c28e83SPiotr Jasiukajtis }
26425c28e83SPiotr Jasiukajtis 
265*7f11fd00SRichard Lowe extern __GNU_INLINE double
26625c28e83SPiotr Jasiukajtis sqrt(double d)
26725c28e83SPiotr Jasiukajtis {
26825c28e83SPiotr Jasiukajtis 	return (__inline_sqrt(d));
26925c28e83SPiotr Jasiukajtis }
27025c28e83SPiotr Jasiukajtis 
271*7f11fd00SRichard Lowe extern __GNU_INLINE float
27225c28e83SPiotr Jasiukajtis sqrtf(float f)
27325c28e83SPiotr Jasiukajtis {
27425c28e83SPiotr Jasiukajtis 	return (__inline_sqrtf(f));
27525c28e83SPiotr Jasiukajtis }
27625c28e83SPiotr Jasiukajtis 
277*7f11fd00SRichard Lowe extern __GNU_INLINE double
27825c28e83SPiotr Jasiukajtis fabs(double d)
27925c28e83SPiotr Jasiukajtis {
28025c28e83SPiotr Jasiukajtis 	double ret;
28125c28e83SPiotr Jasiukajtis 
28225c28e83SPiotr Jasiukajtis 	__asm__ __volatile__("fabsd %1,%0\n\t" : "=e" (ret) : "e" (d));
28325c28e83SPiotr Jasiukajtis 	return (ret);
28425c28e83SPiotr Jasiukajtis }
28525c28e83SPiotr Jasiukajtis 
286*7f11fd00SRichard Lowe extern __GNU_INLINE float
28725c28e83SPiotr Jasiukajtis fabsf(float f)
28825c28e83SPiotr Jasiukajtis {
28925c28e83SPiotr Jasiukajtis 	float ret;
29025c28e83SPiotr Jasiukajtis 
29125c28e83SPiotr Jasiukajtis 	__asm__ __volatile__("fabss %1,%0\n\t" : "=f" (ret) : "f" (f));
29225c28e83SPiotr Jasiukajtis 	return (ret);
29325c28e83SPiotr Jasiukajtis }
29425c28e83SPiotr Jasiukajtis 
29525c28e83SPiotr Jasiukajtis #ifdef __cplusplus
29625c28e83SPiotr Jasiukajtis }
29725c28e83SPiotr Jasiukajtis #endif
29825c28e83SPiotr Jasiukajtis 
29925c28e83SPiotr Jasiukajtis #endif	/* __GNUC */
30025c28e83SPiotr Jasiukajtis 
30125c28e83SPiotr Jasiukajtis #endif /* _LIBM_INLINES_H */
302