xref: /illumos-gate/usr/src/lib/libm/amd64/src/rndintl.S (revision 55fea89d)
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
 */
/*
 * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */
2825c28e83SPiotr Jasiukajtis
2925c28e83SPiotr Jasiukajtis        .file "rndintl.s"
3025c28e83SPiotr Jasiukajtis
3125c28e83SPiotr Jasiukajtis#include "libm.h"
3225c28e83SPiotr Jasiukajtis
/*
 * aintl: round an 80-bit extended value to an integral value, rounding
 * toward zero.
 *
 * In:    the 80-bit operand is read from 8 bytes above the entry %rsp
 *        (i.e. just above the return address).
 * Out:   the rounded value is left in %st(0).
 * Clobb: %cx, %dx, flags.
 *
 * Frame after the 16-byte adjustment:
 *	 8(%rsp)  x87 control word as found on entry
 *	12(%rsp)  working copy of the control word
 *	24(%rsp)  the operand x
 */
	ENTRY(aintl)
	subq	$16,%rsp
	fstcw	8(%rsp)			/* remember the incoming control word */
	fldt	24(%rsp)		/* st0 = x */
	movw	8(%rsp),%dx
	orw	$0x0c00,%dx		/* force both rounding-control bits on */
	movw	%dx,12(%rsp)
	fldcw	12(%rsp)		/* rounding direction = toward zero */
	frndint				/* st0 = x with its fraction chopped */
	/*
	 * Build the control word to reinstate: everything except the
	 * rounding-control field comes from the control word as it is
	 * now, and the rounding-control field comes from the entry value.
	 */
	fstcw	12(%rsp)
	movw	12(%rsp),%dx
	andw	$0xf3ff,%dx		/* current word, rounding field cleared */
	movw	8(%rsp),%cx
	andw	$0x0c00,%cx		/* entry rounding field only */
	orw	%dx,%cx
	movw	%cx,8(%rsp)
	fldcw	8(%rsp)			/* put the original rounding mode back */
	addq	$16,%rsp
	ret
	.align	16
	SET_SIZE(aintl)
5525c28e83SPiotr Jasiukajtis
/*
 * irintl: convert an 80-bit extended value to a 32-bit integer and
 * return it sign-extended to 64 bits.
 *
 * In:    the 80-bit operand is read from 8 bytes above the entry %rsp.
 * Out:   %rax = converted value, sign-extended from 32 bits.
 * Clobb: the x87 stack is left as it was on entry (one load, one pop).
 *
 * The control word is not modified here, so the conversion is done
 * with whatever rounding mode is already in effect.
 */
	ENTRY(irintl)
	subq	$16,%rsp		/* 8(%rsp) is the integer scratch slot */
	fldt	24(%rsp)		/* st0 = x */
	fistpl	8(%rsp)			/* store as 32-bit integer and pop */
	fwait				/* make sure the store has completed */
	movslq	8(%rsp),%rax
	addq	$16,%rsp
	ret
	.align	16
	SET_SIZE(irintl)
6725c28e83SPiotr Jasiukajtis
/*
 * Single-precision 0.5, used by anintl to recognise exact halfway cases.
 */
	.data
	.align	16
half:	.float	0.5

/*
 * anintl: round an 80-bit extended value to the nearest integral value,
 * with exact halfway cases (x = n + 0.5) rounded away from zero.
 *
 * In:    the 80-bit operand is read from 8 bytes above the entry %rsp.
 * Out:   the rounded value is left in %st(0).
 * Clobb: %ax, %dx, flags.
 *
 * .Lanintl is a file-local alias for the entry point; nintl calls it.
 *
 * Frame after the 16-byte adjustment:
 *	 8(%rsp)  x87 control word as found on entry
 *	12(%rsp)  working copy of the control word
 *	24(%rsp)  the operand x (significand)
 *	32(%rsp)  sign and exponent word of x
 *
 * Stack annotations below list %st(0) first.
 */
	ENTRY(anintl)
.Lanintl:
	subq	$16,%rsp
	fstcw	8(%rsp)			/* remember the incoming control word */
	fldt	24(%rsp)		/* x */
	movw	8(%rsp),%ax
	andw	$0xf3ff,%ax		/* clear the rounding-control field */
	movw	%ax,12(%rsp)
	fldcw	12(%rsp)		/* rounding direction = to nearest */
	fld	%st(0)			/* x, x */
	frndint				/* [x], x */
	/*
	 * Reinstate the entry rounding mode: keep every other field of
	 * the control word as it is now, and take the rounding-control
	 * field from the entry value.
	 */
	fstcw	12(%rsp)
	movw	12(%rsp),%ax
	andw	$0xf3ff,%ax		/* current word, rounding field cleared */
	movw	8(%rsp),%dx
	andw	$0x0c00,%dx		/* entry rounding field only */
	orw	%ax,%dx
	movw	%dx,8(%rsp)
	fldcw	8(%rsp)
	fucomi	%st(1),%st		/* is [x] equal to x? */
	jp	.Lanintl_done		/* unordered (NaN): hand x back */
	je	.Lanintl_done		/* x is already integral */
	fxch				/* x, [x] */
	fsub	%st(1),%st		/* x-[x], [x] */
	fabs				/* |x-[x]|, [x] */
	PIC_SETUP(1)
	flds	PIC_L(half)		/* 0.5, |x-[x]|, [x] */
	fcomip	%st(1),%st		/* compare 0.5 with |x-[x]|, pop 0.5 */
	PIC_WRAPUP
	je	.Lanintl_half		/* exactly halfway; the rare case */
.Lanintl_done:
	/* Drop %st(0); what was in %st(1) becomes the result. */
	addq	$16,%rsp
	fstp	%st(0)
	ret
.Lanintl_half:
	/* x = n+0.5: recompute the result as x + sign(x)*0.5 */
	fldt	24(%rsp)		/* x, 0.5, [x] */
	testw	$0x8000,32(%rsp)	/* sign bit of x */
	jnz	.Lanintl_neg
	faddp				/* x+0.5, [x] */
	addq	$16,%rsp
	fstp	%st(1)			/* discard [x], keep x+0.5 */
	ret
.Lanintl_neg:
	/*
	 * x is negative, so the result is x-0.5.
	 * NOTE(review): the operand order here relies on the assembler's
	 * AT&T-syntax convention for fsubp/fsubrp; do not change the
	 * mnemonic without checking the generated encoding.
	 */
	fsubp	%st,%st(1)		/* x-0.5, [x] */
	addq	$16,%rsp
	fstp	%st(1)			/* discard [x], keep x-0.5 */
	ret
	.align	16
	SET_SIZE(anintl)
12625c28e83SPiotr Jasiukajtis
/*
 * nintl: round an 80-bit extended value to the nearest integer (halfway
 * cases away from zero, via anintl) and return it as an integer.
 *
 * In:    the 80-bit operand is read from 8 bytes above the entry %rsp
 *        (16(%rbp) once the frame pointer is set up).
 * Out:   %rax = result, sign-extended from 32 bits.
 *
 * Frame, relative to %rbp:
 *	-32 .. -17	copy of the 16-byte argument slot, passed to anintl
 *	-8		32-bit integer scratch slot
 */
	ENTRY(nintl)
	pushq	%rbp
	movq	%rsp,%rbp
	subq	$32,%rsp		/* scratch area plus outgoing argument */
	movq	16(%rbp),%rax
	movq	%rax,(%rsp)		/* low 8 bytes of the argument slot */
	movq	24(%rbp),%rax
	movq	%rax,8(%rsp)		/* high 8 bytes of the argument slot */
	call	.Lanintl		/* file-local entry; st0 = anintl(x) */
	fistpl	-8(%rbp)		/* store as 32-bit integer and pop */
	fwait				/* make sure the store has completed */
	movslq	-8(%rbp),%rax
	movq	%rbp,%rsp		/* tear down the frame */
	popq	%rbp
	ret
	.align	16
	SET_SIZE(nintl)
141