xref: /illumos-gate/usr/src/lib/libm/i386/src/lround.S (revision 55fea89d)
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
 */
/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

2925c28e83SPiotr Jasiukajtis	.file	"lround.s"
3025c28e83SPiotr Jasiukajtis
3125c28e83SPiotr Jasiukajtis#include "libm.h"
3225c28e83SPiotr JasiukajtisLIBM_ANSI_PRAGMA_WEAK(lround,function)
3325c28e83SPiotr Jasiukajtis
3425c28e83SPiotr Jasiukajtis	.section .rodata
3525c28e83SPiotr Jasiukajtis	.align	4
3625c28e83SPiotr Jasiukajtis.Lhalf:	.float	0.5
3725c28e83SPiotr Jasiukajtis
/*
 * long lround(double x)
 *
 * Rounds x to the nearest integer, with halfway cases rounded away from
 * zero, and returns the converted value in %eax.
 *
 * In:   4(%esp) = low word of x, 8(%esp) = high word of x (at entry)
 * Out:  %eax = 32-bit integer stored by fistpl
 * Uses: %eax, %ecx, %dx, the x87 register stack, and 8 bytes of stack
 *       scratch addressed as -8(%ecx) and -4(%ecx), plus whatever the
 *       PIC_SETUP/PIC_WRAPUP macros from libm.h touch.
 *
 * Method:
 *   1. Compute [x] = frndint(x) with the rounding-control field of the
 *      x87 control word forced to round-to-nearest, then put the rounding
 *      control that was in effect at entry back.
 *   2. If x is a NaN (unordered compare) or x = [x], convert x itself.
 *   3. Otherwise, if |x-[x]| < 0.5, convert [x].
 *   4. Otherwise x = n+0.5: convert x+0.5 when the sign bit of x is
 *      clear, or x-0.5 when it is set.  Either value is integral, so the
 *      final fistpl does not depend on the restored rounding mode.
 *
 * Stack-state comments list the x87 stack from %st(0) outwards.
 */
	ENTRY(lround)
	movl	%esp,%ecx		/ ecx = entry esp, base for all accesses
	subl	$8,%esp			/ scratch words at -8(%ecx) and -4(%ecx)
	fstcw	-8(%ecx)		/ -8(%ecx) = control word at entry
	fldl	4(%ecx)			/ x
	movw	-8(%ecx),%dx
	andw	$0xf3ff,%dx		/ clear rounding control, bits 10-11
	movw	%dx,-4(%ecx)
	fldcw	-4(%ecx)		/ set RD = to_nearest
	fld	%st(0)			/ x,x
	frndint				/ [x],x
	fstcw	-4(%ecx)		/ re-read the current control word
	movw	-4(%ecx),%dx
	andw	$0xf3ff,%dx		/ dx = current word minus rounding control
	movw	-8(%ecx),%ax
	andw	$0x0c00,%ax		/ ax = rounding control bits at entry
	orw	%dx,%ax
	movw	%ax,-8(%ecx)
	fldcw	-8(%ecx)		/ restore RD
	fucom				/ check if x is already an integer
	fstsw	%ax
	sahf
	jp	0f			/ unordered, x is a NaN
	je	0f			/ [x] = x, nothing to round
	fxch				/ x,[x]
	fsub	%st(1),%st		/ x-[x],[x]
	fabs				/ |x-[x]|,[x]
	PIC_SETUP(1)
	fcoms	PIC_L(.Lhalf)
	PIC_WRAPUP
	fnstsw	%ax
	sahf
	jae	2f			/ if |x-[x]| = 0.5 goto halfway,
					/ most cases will not take branch.
0:
	fstp	%st(0)			/ drop top, leaving the value to convert
1:
	fistpl	-8(%ecx)		/ convert and pop, x87 stack now empty
	fwait
	movl	-8(%ecx),%eax		/ return value
	addl	$8,%esp			/ release the scratch words
	ret
2:
    / x = n+0.5, recompute lround(x) as x+sign(x)*0.5
	fldl	4(%ecx)			/ x, 0.5, [x]
	movl	8(%ecx),%eax		/ high part of x
	andl	$0x80000000,%eax	/ isolate the sign bit
	jnz	3f
	faddp				/ x+0.5,[x]
	fstp	%st(1)			/ x+0.5
	jmp	1b
3:
	/ here, x is negative, so return x-0.5
	fsubp	%st,%st(1)		/ x-0.5,[x]
	fstp	%st(1)			/ x-0.5
	jmp	1b
	.align	4
	SET_SIZE(lround)