/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
2125c28e83SPiotr Jasiukajtis
/*
 * Copyright 2006 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 */
2625c28e83SPiotr Jasiukajtis
/*
 * Copyright 2011, Richard Lowe.
 */
3025c28e83SPiotr Jasiukajtis
3125c28e83SPiotr Jasiukajtis #ifndef _LIBM_INLINES_H
3225c28e83SPiotr Jasiukajtis #define _LIBM_INLINES_H
3325c28e83SPiotr Jasiukajtis
3425c28e83SPiotr Jasiukajtis #ifdef __GNUC__
3525c28e83SPiotr Jasiukajtis
3625c28e83SPiotr Jasiukajtis #include <sys/types.h>
3725c28e83SPiotr Jasiukajtis #include <sys/ieeefp.h>
3825c28e83SPiotr Jasiukajtis
3925c28e83SPiotr Jasiukajtis #ifdef __cplusplus
4025c28e83SPiotr Jasiukajtis extern "C" {
4125c28e83SPiotr Jasiukajtis #endif
4225c28e83SPiotr Jasiukajtis
437f11fd00SRichard Lowe extern __GNU_INLINE double
__inline_sqrt(double d)4425c28e83SPiotr Jasiukajtis __inline_sqrt(double d)
4525c28e83SPiotr Jasiukajtis {
4625c28e83SPiotr Jasiukajtis double ret;
4725c28e83SPiotr Jasiukajtis
4825c28e83SPiotr Jasiukajtis __asm__ __volatile__("fsqrtd %1,%0\n\t" : "=e" (ret) : "e" (d));
4925c28e83SPiotr Jasiukajtis return (ret);
5025c28e83SPiotr Jasiukajtis }
5125c28e83SPiotr Jasiukajtis
527f11fd00SRichard Lowe extern __GNU_INLINE float
__inline_sqrtf(float f)5325c28e83SPiotr Jasiukajtis __inline_sqrtf(float f)
5425c28e83SPiotr Jasiukajtis {
5525c28e83SPiotr Jasiukajtis float ret;
5625c28e83SPiotr Jasiukajtis
5725c28e83SPiotr Jasiukajtis __asm__ __volatile__("fsqrts %1,%0\n\t" : "=f" (ret) : "f" (f));
5825c28e83SPiotr Jasiukajtis return (ret);
5925c28e83SPiotr Jasiukajtis }
6025c28e83SPiotr Jasiukajtis
617f11fd00SRichard Lowe extern __GNU_INLINE enum fp_class_type
fp_classf(float f)6225c28e83SPiotr Jasiukajtis fp_classf(float f)
6325c28e83SPiotr Jasiukajtis {
6425c28e83SPiotr Jasiukajtis enum fp_class_type ret;
6525c28e83SPiotr Jasiukajtis uint32_t tmp;
6625c28e83SPiotr Jasiukajtis
6725c28e83SPiotr Jasiukajtis /* XXX: Separate input and output */
6825c28e83SPiotr Jasiukajtis __asm__ __volatile__(
6925c28e83SPiotr Jasiukajtis "sethi %%hi(0x80000000),%1\n\t"
7025c28e83SPiotr Jasiukajtis "andncc %2,%1,%0\n\t"
7125c28e83SPiotr Jasiukajtis "bne 1f\n\t"
7225c28e83SPiotr Jasiukajtis "nop\n\t"
7325c28e83SPiotr Jasiukajtis "mov 0,%0\n\t"
7425c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is 0 */
7525c28e83SPiotr Jasiukajtis "nop\n\t"
7625c28e83SPiotr Jasiukajtis "1:\n\t"
7725c28e83SPiotr Jasiukajtis "sethi %%hi(0x7f800000),%1\n\t"
7825c28e83SPiotr Jasiukajtis "andcc %0,%1,%%g0\n\t"
7925c28e83SPiotr Jasiukajtis "bne 1f\n\t"
8025c28e83SPiotr Jasiukajtis "nop\n\t"
8125c28e83SPiotr Jasiukajtis "mov 1,%0\n\t"
8225c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is subnormal */
8325c28e83SPiotr Jasiukajtis "nop\n\t"
8425c28e83SPiotr Jasiukajtis "1:\n\t"
8525c28e83SPiotr Jasiukajtis "cmp %0,%1\n\t"
8625c28e83SPiotr Jasiukajtis "bge 1f\n\t"
8725c28e83SPiotr Jasiukajtis "nop\n\t"
8825c28e83SPiotr Jasiukajtis "mov 2,%0\n\t"
8925c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is normal */
9025c28e83SPiotr Jasiukajtis "nop\n\t"
9125c28e83SPiotr Jasiukajtis "1:\n\t"
9225c28e83SPiotr Jasiukajtis "bg 1f\n\t"
9325c28e83SPiotr Jasiukajtis "nop\n\t"
9425c28e83SPiotr Jasiukajtis "mov 3,%0\n\t"
9525c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is __infinity */
9625c28e83SPiotr Jasiukajtis "nop\n\t"
9725c28e83SPiotr Jasiukajtis "1:\n\t"
9825c28e83SPiotr Jasiukajtis "sethi %%hi(0x00400000),%1\n\t"
9925c28e83SPiotr Jasiukajtis "andcc %0,%1,%%g0\n\t"
10025c28e83SPiotr Jasiukajtis "mov 4,%0\n\t" /* x is quiet NaN */
10125c28e83SPiotr Jasiukajtis "bne 2f\n\t"
10225c28e83SPiotr Jasiukajtis "nop\n\t"
10325c28e83SPiotr Jasiukajtis "mov 5,%0\n\t" /* x is signaling NaN */
10425c28e83SPiotr Jasiukajtis "2:\n\t"
10525c28e83SPiotr Jasiukajtis : "=r" (ret), "=&r" (tmp)
10625c28e83SPiotr Jasiukajtis : "r" (f)
10725c28e83SPiotr Jasiukajtis : "cc");
10825c28e83SPiotr Jasiukajtis return (ret);
10925c28e83SPiotr Jasiukajtis }
11025c28e83SPiotr Jasiukajtis
11125c28e83SPiotr Jasiukajtis #define _HI_WORD(x) ((uint32_t *)&x)[0]
11225c28e83SPiotr Jasiukajtis #define _LO_WORD(x) ((uint32_t *)&x)[1]
11325c28e83SPiotr Jasiukajtis
1147f11fd00SRichard Lowe extern __GNU_INLINE enum fp_class_type
fp_class(double d)11525c28e83SPiotr Jasiukajtis fp_class(double d)
11625c28e83SPiotr Jasiukajtis {
11725c28e83SPiotr Jasiukajtis enum fp_class_type ret;
11825c28e83SPiotr Jasiukajtis uint32_t tmp;
11925c28e83SPiotr Jasiukajtis
120*564d5236SRichard Lowe /* BEGIN CSTYLED */
12125c28e83SPiotr Jasiukajtis __asm__ __volatile__(
12225c28e83SPiotr Jasiukajtis "sethi %%hi(0x80000000),%1\n\t" /* %1 gets 80000000 */
12325c28e83SPiotr Jasiukajtis "andn %2,%1,%0\n\t" /* %2-%0 gets abs(x) */
12425c28e83SPiotr Jasiukajtis "orcc %0,%3,%%g0\n\t" /* set cc as x is zero/nonzero */
12525c28e83SPiotr Jasiukajtis "bne 1f\n\t" /* branch if x is nonzero */
12625c28e83SPiotr Jasiukajtis "nop\n\t"
12725c28e83SPiotr Jasiukajtis "mov 0,%0\n\t"
12825c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is 0 */
12925c28e83SPiotr Jasiukajtis "nop\n\t"
13025c28e83SPiotr Jasiukajtis "1:\n\t"
13125c28e83SPiotr Jasiukajtis "sethi %%hi(0x7ff00000),%1\n\t" /* %1 gets 7ff00000 */
13225c28e83SPiotr Jasiukajtis "andcc %0,%1,%%g0\n\t" /* cc set by __exp field of x */
13325c28e83SPiotr Jasiukajtis "bne 1f\n\t" /* branch if normal or max __exp */
13425c28e83SPiotr Jasiukajtis "nop\n\t"
13525c28e83SPiotr Jasiukajtis "mov 1,%0\n\t"
13625c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is subnormal */
13725c28e83SPiotr Jasiukajtis "nop\n\t"
13825c28e83SPiotr Jasiukajtis "1:\n\t"
13925c28e83SPiotr Jasiukajtis "cmp %0,%1\n\t"
14025c28e83SPiotr Jasiukajtis "bge 1f\n\t" /* branch if x is max __exp */
14125c28e83SPiotr Jasiukajtis "nop\n\t"
14225c28e83SPiotr Jasiukajtis "mov 2,%0\n\t"
14325c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is normal */
14425c28e83SPiotr Jasiukajtis "nop\n\t"
14525c28e83SPiotr Jasiukajtis "1:\n\t"
14625c28e83SPiotr Jasiukajtis "andn %0,%1,%0\n\t" /* o0 gets msw __significand field */
14725c28e83SPiotr Jasiukajtis "orcc %0,%3,%%g0\n\t" /* set cc by OR __significand */
14825c28e83SPiotr Jasiukajtis "bne 1f\n\t" /* Branch if __nan */
14925c28e83SPiotr Jasiukajtis "nop\n\t"
15025c28e83SPiotr Jasiukajtis "mov 3,%0\n\t"
15125c28e83SPiotr Jasiukajtis "ba 2f\n\t" /* x is __infinity */
15225c28e83SPiotr Jasiukajtis "nop\n\t"
15325c28e83SPiotr Jasiukajtis "1:\n\t"
15425c28e83SPiotr Jasiukajtis "sethi %%hi(0x00080000),%1\n\t"
15525c28e83SPiotr Jasiukajtis "andcc %0,%1,%%g0\n\t" /* set cc by quiet/sig bit */
15625c28e83SPiotr Jasiukajtis "be 1f\n\t" /* Branch if signaling */
15725c28e83SPiotr Jasiukajtis "nop\n\t"
15825c28e83SPiotr Jasiukajtis "mov 4,%0\n\t" /* x is quiet NaN */
15925c28e83SPiotr Jasiukajtis "ba 2f\n\t"
16025c28e83SPiotr Jasiukajtis "nop\n\t"
16125c28e83SPiotr Jasiukajtis "1:\n\t"
16225c28e83SPiotr Jasiukajtis "mov 5,%0\n\t" /* x is signaling NaN */
16325c28e83SPiotr Jasiukajtis "2:\n\t"
16425c28e83SPiotr Jasiukajtis : "=&r" (ret), "=&r" (tmp)
16525c28e83SPiotr Jasiukajtis : "r" (_HI_WORD(d)), "r" (_LO_WORD(d))
16625c28e83SPiotr Jasiukajtis : "cc");
167*564d5236SRichard Lowe /* END CSTYLED */
16825c28e83SPiotr Jasiukajtis
16925c28e83SPiotr Jasiukajtis return (ret);
17025c28e83SPiotr Jasiukajtis }
17125c28e83SPiotr Jasiukajtis
1727f11fd00SRichard Lowe extern __GNU_INLINE int
__swapEX(int i)17325c28e83SPiotr Jasiukajtis __swapEX(int i)
17425c28e83SPiotr Jasiukajtis {
17525c28e83SPiotr Jasiukajtis int ret;
17625c28e83SPiotr Jasiukajtis uint32_t fsr;
17725c28e83SPiotr Jasiukajtis uint32_t tmp1, tmp2;
17825c28e83SPiotr Jasiukajtis
17925c28e83SPiotr Jasiukajtis __asm__ __volatile__(
18025c28e83SPiotr Jasiukajtis "and %4,0x1f,%2\n\t" /* tmp1 = %2 = %o1 */
18125c28e83SPiotr Jasiukajtis "sll %2,5,%2\n\t" /* shift input to aexc bit location */
18225c28e83SPiotr Jasiukajtis ".volatile\n\t"
18325c28e83SPiotr Jasiukajtis "st %%fsr,%1\n\t"
18425c28e83SPiotr Jasiukajtis "ld %1,%0\n\t" /* %0 = fsr */
18525c28e83SPiotr Jasiukajtis "andn %0,0x3e0,%3\n\t" /* tmp2 = %3 = %o2 */
18625c28e83SPiotr Jasiukajtis "or %2,%3,%2\n\t" /* %2 = new fsr */
18725c28e83SPiotr Jasiukajtis "st %2,%1\n\t"
18825c28e83SPiotr Jasiukajtis "ld %1,%%fsr\n\t"
18925c28e83SPiotr Jasiukajtis "srl %0,5,%0\n\t"
19025c28e83SPiotr Jasiukajtis "and %0,0x1f,%0\n\t" /* %0 = ret = %o0 */
19125c28e83SPiotr Jasiukajtis ".nonvolatile\n\t"
19225c28e83SPiotr Jasiukajtis : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2)
19325c28e83SPiotr Jasiukajtis : "r" (i)
19425c28e83SPiotr Jasiukajtis : "cc");
19525c28e83SPiotr Jasiukajtis
19625c28e83SPiotr Jasiukajtis return (ret);
19725c28e83SPiotr Jasiukajtis }
19825c28e83SPiotr Jasiukajtis
19925c28e83SPiotr Jasiukajtis /*
20025c28e83SPiotr Jasiukajtis * On the SPARC, __swapRP is a no-op; always return 0 for backward
20125c28e83SPiotr Jasiukajtis * compatibility
20225c28e83SPiotr Jasiukajtis */
20325c28e83SPiotr Jasiukajtis /* ARGSUSED */
2047f11fd00SRichard Lowe extern __GNU_INLINE enum fp_precision_type
__swapRP(enum fp_precision_type i)20525c28e83SPiotr Jasiukajtis __swapRP(enum fp_precision_type i)
20625c28e83SPiotr Jasiukajtis {
20725c28e83SPiotr Jasiukajtis return (0);
20825c28e83SPiotr Jasiukajtis }
20925c28e83SPiotr Jasiukajtis
2107f11fd00SRichard Lowe extern __GNU_INLINE enum fp_direction_type
__swapRD(enum fp_direction_type d)21125c28e83SPiotr Jasiukajtis __swapRD(enum fp_direction_type d)
21225c28e83SPiotr Jasiukajtis {
21325c28e83SPiotr Jasiukajtis enum fp_direction_type ret;
21425c28e83SPiotr Jasiukajtis uint32_t fsr;
21525c28e83SPiotr Jasiukajtis uint32_t tmp1, tmp2, tmp3;
21625c28e83SPiotr Jasiukajtis
21725c28e83SPiotr Jasiukajtis __asm__ __volatile__(
21825c28e83SPiotr Jasiukajtis "and %5,0x3,%0\n\t"
21925c28e83SPiotr Jasiukajtis "sll %0,30,%2\n\t" /* shift input to RD bit location */
22025c28e83SPiotr Jasiukajtis ".volatile\n\t"
22125c28e83SPiotr Jasiukajtis "st %%fsr,%1\n\t"
22225c28e83SPiotr Jasiukajtis "ld %1,%0\n\t" /* %0 = fsr */
22325c28e83SPiotr Jasiukajtis "set 0xc0000000,%4\n\t" /* mask of rounding direction bits */
22425c28e83SPiotr Jasiukajtis "andn %0,%4,%3\n\t"
22525c28e83SPiotr Jasiukajtis "or %2,%3,%2\n\t" /* %2 = new fsr */
22625c28e83SPiotr Jasiukajtis "st %2,%1\n\t"
22725c28e83SPiotr Jasiukajtis "ld %1,%%fsr\n\t"
22825c28e83SPiotr Jasiukajtis "srl %0,30,%0\n\t"
22925c28e83SPiotr Jasiukajtis "and %0,0x3,%0\n\t"
23025c28e83SPiotr Jasiukajtis ".nonvolatile\n\t"
23125c28e83SPiotr Jasiukajtis : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2), "=r" (tmp3)
23225c28e83SPiotr Jasiukajtis : "r" (d)
23325c28e83SPiotr Jasiukajtis : "cc");
23425c28e83SPiotr Jasiukajtis
23525c28e83SPiotr Jasiukajtis return (ret);
23625c28e83SPiotr Jasiukajtis }
23725c28e83SPiotr Jasiukajtis
2387f11fd00SRichard Lowe extern __GNU_INLINE int
__swapTE(int i)23925c28e83SPiotr Jasiukajtis __swapTE(int i)
24025c28e83SPiotr Jasiukajtis {
24125c28e83SPiotr Jasiukajtis int ret;
24225c28e83SPiotr Jasiukajtis uint32_t fsr, tmp1, tmp2;
24325c28e83SPiotr Jasiukajtis
244*564d5236SRichard Lowe /* BEGIN CSTYLED */
24525c28e83SPiotr Jasiukajtis __asm__ __volatile__(
24625c28e83SPiotr Jasiukajtis "and %4,0x1f,%0\n\t"
24725c28e83SPiotr Jasiukajtis "sll %0,23,%2\n\t" /* shift input to TEM bit location */
24825c28e83SPiotr Jasiukajtis ".volatile\n\t"
24925c28e83SPiotr Jasiukajtis "st %%fsr,%1\n\t"
25025c28e83SPiotr Jasiukajtis "ld %1,%0\n\t" /* %0 = fsr */
25125c28e83SPiotr Jasiukajtis "set 0x0f800000,%3\n\t" /* mask of TEM (Trap Enable Mode bits) */
25225c28e83SPiotr Jasiukajtis "andn %0,%3,%3\n\t"
25325c28e83SPiotr Jasiukajtis "or %2,%3,%2\n\t" /* %2 = new fsr */
25425c28e83SPiotr Jasiukajtis "st %2,%1\n\t"
25525c28e83SPiotr Jasiukajtis "ld %1,%%fsr\n\t"
25625c28e83SPiotr Jasiukajtis "srl %0,23,%0\n\t"
25725c28e83SPiotr Jasiukajtis "and %0,0x1f,%0\n\t"
25825c28e83SPiotr Jasiukajtis ".nonvolatile\n\t"
25925c28e83SPiotr Jasiukajtis : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2)
26025c28e83SPiotr Jasiukajtis : "r" (i)
26125c28e83SPiotr Jasiukajtis : "cc");
262*564d5236SRichard Lowe /* END CSTYLED */
26325c28e83SPiotr Jasiukajtis
26425c28e83SPiotr Jasiukajtis return (ret);
26525c28e83SPiotr Jasiukajtis }
26625c28e83SPiotr Jasiukajtis
2677f11fd00SRichard Lowe extern __GNU_INLINE double
sqrt(double d)26825c28e83SPiotr Jasiukajtis sqrt(double d)
26925c28e83SPiotr Jasiukajtis {
27025c28e83SPiotr Jasiukajtis return (__inline_sqrt(d));
27125c28e83SPiotr Jasiukajtis }
27225c28e83SPiotr Jasiukajtis
2737f11fd00SRichard Lowe extern __GNU_INLINE float
sqrtf(float f)27425c28e83SPiotr Jasiukajtis sqrtf(float f)
27525c28e83SPiotr Jasiukajtis {
27625c28e83SPiotr Jasiukajtis return (__inline_sqrtf(f));
27725c28e83SPiotr Jasiukajtis }
27825c28e83SPiotr Jasiukajtis
2797f11fd00SRichard Lowe extern __GNU_INLINE double
fabs(double d)28025c28e83SPiotr Jasiukajtis fabs(double d)
28125c28e83SPiotr Jasiukajtis {
28225c28e83SPiotr Jasiukajtis double ret;
28325c28e83SPiotr Jasiukajtis
28425c28e83SPiotr Jasiukajtis __asm__ __volatile__("fabsd %1,%0\n\t" : "=e" (ret) : "e" (d));
28525c28e83SPiotr Jasiukajtis return (ret);
28625c28e83SPiotr Jasiukajtis }
28725c28e83SPiotr Jasiukajtis
2887f11fd00SRichard Lowe extern __GNU_INLINE float
fabsf(float f)28925c28e83SPiotr Jasiukajtis fabsf(float f)
29025c28e83SPiotr Jasiukajtis {
29125c28e83SPiotr Jasiukajtis float ret;
29225c28e83SPiotr Jasiukajtis
29325c28e83SPiotr Jasiukajtis __asm__ __volatile__("fabss %1,%0\n\t" : "=f" (ret) : "f" (f));
29425c28e83SPiotr Jasiukajtis return (ret);
29525c28e83SPiotr Jasiukajtis }
29625c28e83SPiotr Jasiukajtis
29725c28e83SPiotr Jasiukajtis #ifdef __cplusplus
29825c28e83SPiotr Jasiukajtis }
29925c28e83SPiotr Jasiukajtis #endif
30025c28e83SPiotr Jasiukajtis
#endif	/* __GNUC__ */
30225c28e83SPiotr Jasiukajtis
30325c28e83SPiotr Jasiukajtis #endif /* _LIBM_INLINES_H */
304