Blame sysdeps/powerpc/powerpc32/fpu/s_lround.S

/* lround function.  PowerPC32 version.
   Copyright (C) 2004-2018 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */

/* NOTE(review): sysdep.h is expected to supply ENTRY/END, the cfi_*
   macros and SETUP_GOT_ACCESS, and the libm-alias headers the
   libm_alias_* macros used in this file -- confirm against the tree.  */
#include <sysdep.h>
#include <math_ldbl_opt.h>
#include <libm-alias-float.h>
#include <libm-alias-double.h>

	.section	.rodata.cst4,"aM",@progbits,4
Packit 6c4009
	.align	2
Packit 6c4009
.LC0:	/* 0.5 */
Packit 6c4009
	.long 0x3f000000
Packit 6c4009
.LC1:	/* 2^52.  */
Packit 6c4009
	.long 0x59800000
Packit 6c4009
	.section	.rodata.cst8,"aM",@progbits,8
Packit 6c4009
	.align	3
Packit 6c4009
.LC2:	/* 0x7fffffff.8p0.  */
Packit 6c4009
	.long 0x41dfffff
Packit 6c4009
	.long 0xffe00000
Packit 6c4009
.LC3:	/* -0x80000000.8p0.  */
Packit 6c4009
	.long 0xc1e00000
Packit 6c4009
	.long 0x00100000
Packit 6c4009
	.section	".text"
Packit 6c4009
Packit 6c4009
/* long [r3] lround (double x [fp1])
   IEEE 1003.1 lround function.  The same entry point is also exported
   as lroundf (see the aliases following END); in both cases the
   argument is read from fp1.  IEEE specifies "round to the nearest
   integer value, rounding halfway cases away from zero, regardless of
   the current rounding mode."  However PowerPC Architecture defines
   "round to Nearest" as "Choose the best approximation. In case of a
   tie, choose the one that is even (least significant bit 0).".
   So we can't use the PowerPC "round to Nearest" mode.  Instead we
   round by adding +-0.5 and then converting with fctiwz, which rounds
   toward zero.  It is necessary to detect when x is
   (+-)0x1.fffffffffffffp-2 because adding +-0.5 in this case will
   cause an erroneous shift, carry and round.  We simply return 0 if
   0.5 > x > -0.5.

   Paths through the code:
     |x| < 0.5			return 0 without converting.
     x >= 0x7fffffff.8p0 or
     x <= -0x80000000.8p0	convert +-2^52 instead of x, so the
				conversion is handed a value that is
				certainly out of range.
     x is an integer		convert x itself; no bias is added, to
				avoid a spurious "inexact".
     otherwise			convert |x| + 0.5 with the sign of x.

   Registers: fp2 = |x|, fp3 = value handed to fctiwz, fp4 = raw
   conversion result, fp8-fp12 = constants; r9-r11 are scratch;
   cr1, cr5, cr6 and cr7 hold the comparison results.  A 16-byte stack
   frame is used to move the result from fp4 to r3.  */

ENTRY (__lround)
	stwu    r1,-16(r1)	/* Allocate the 16-byte frame.  */
	cfi_adjust_cfa_offset (16)
#ifdef SHARED
	/* PIC: address the constants relative to got_label.  LR is parked
	   in r11 around SETUP_GOT_ACCESS and restored afterwards.
	   NOTE(review): SETUP_GOT_ACCESS is defined outside this file;
	   presumably it clobbers LR to obtain the current address.  */
	mflr	r11
	cfi_register(lr,r11)
	SETUP_GOT_ACCESS(r9,got_label)
	addis	r10,r9,.LC0-got_label@ha
	lfs	fp10,.LC0-got_label@l(r10)	/* fp10 = 0.5  */
	addis	r10,r9,.LC1-got_label@ha
	lfs	fp11,.LC1-got_label@l(r10)	/* fp11 = 2^52  */
	addis	r10,r9,.LC2-got_label@ha
	lfd	fp9,.LC2-got_label@l(r10)	/* fp9 = 0x7fffffff.8p0  */
	addis	r10,r9,.LC3-got_label@ha
	lfd	fp8,.LC3-got_label@l(r10)	/* fp8 = -0x80000000.8p0  */
	mtlr	r11
	cfi_same_value (lr)
#else
	/* Non-PIC: absolute addressing of the constants.  */
	lis	r9,.LC0@ha
	lfs	fp10,.LC0@l(r9)	/* fp10 = 0.5  */
	lis	r9,.LC1@ha
	lfs	fp11,.LC1@l(r9)	/* fp11 = 2^52  */
	lis	r9,.LC2@ha
	lfd	fp9,.LC2@l(r9)	/* fp9 = 0x7fffffff.8p0  */
	lis	r9,.LC3@ha
	lfd	fp8,.LC3@l(r9)	/* fp8 = -0x80000000.8p0  */
#endif
	fabs	fp2, fp1	/* Get the absolute value of x.  */
	fsub	fp12,fp10,fp10	/* Compute 0.0.  */
	/* Issue all four comparisons up front; the branches below only
	   read the CR fields.  */
	fcmpu	cr6, fp2, fp10	/* if |x| < 0.5  */
	fcmpu	cr5, fp1, fp9	/* if x >= 0x7fffffff.8p0  */
	fcmpu	cr1, fp1, fp8	/* if x <= -0x80000000.8p0  */
	fcmpu	cr7, fp1, fp12	/* x is negative? x < 0.0  */
	blt-	cr6,.Lretzero
	bge-	cr5,.Loflow
	ble-	cr1,.Loflow
	/* Test whether an integer to avoid spurious "inexact".
	   (|x| + 2^52) - 2^52 equals |x| only when |x| has no
	   fractional part.  */
	fadd	fp3,fp2,fp11
	fsub	fp3,fp3,fp11
	fcmpu	cr5, fp2, fp3
	beq	cr5,.Lnobias
	fadd	fp3,fp2,fp10	/* |x|+=0.5 bias to prepare to round.  */
	bge	cr7,.Lconvert	/* x is positive so don't negate x.  */
	fnabs	fp3,fp3		/* -(|x|+=0.5)  */
.Lconvert:
	fctiwz	fp4,fp3		/* Convert to Integer word lround toward 0.  */
	stfd	fp4,8(r1)	/* Spill so the result can be read as an integer.  */
	nop	/* Ensure the following load is in a different dispatch  */
	nop	/* group to avoid pipe stall on POWER4&5.  */
	nop
	/* NOTE(review): LOWORD is defined outside this file; presumably
	   it is the offset of the low-order word of the 8-byte slot.  */
	lwz	r3,8+LOWORD(r1)	/* Load return as integer.  */
.Lout:
	addi	r1,r1,16	/* Release the frame.  */
	cfi_adjust_cfa_offset (-16)
	blr
	/* The out-of-line paths below are entered by branches taken while
	   the frame is still allocated, so restore the CFA offset.  */
	cfi_adjust_cfa_offset (16)
.Lretzero:			/* when 0.5 > x > -0.5  */
	li	r3,0		/* return 0.  */
	b	.Lout
.Lnobias:			/* x is already an integer.  */
	fmr	fp3,fp1		/* Convert x itself, sign included.  */
	b	.Lconvert
.Loflow:
	/* x is outside the range of a 32-bit long: convert +-2^52 so the
	   conversion instruction produces the out-of-range result.
	   NOTE(review): per the Power ISA, fctiwz is expected to saturate
	   and signal "invalid" here, and a NaN (unordered compare) is
	   presumably routed here by the bge above -- confirm.  */
	fmr	fp3,fp11
	bge	cr7,.Lconvert	/* Keep +2^52 unless x < 0.0.  */
	fnabs	fp3,fp3
	b	.Lconvert
	END (__lround)

/* Publish __lround under the double-precision lround name(s).
   NOTE(review): the exact set of symbols comes from libm-alias-double.h,
   which is not visible here.  */
libm_alias_double (__lround, lround)

/* The float entry point is the same code: __lround reads its argument
   from fp1 in both cases, so __lroundf is simply another name for it,
   and is then published under the lroundf name(s).  */
strong_alias (__lround, __lroundf)
libm_alias_float (__lround, lround)