Blame sysdeps/powerpc/powerpc64/lshift.S

Packit 6c4009
/* PowerPC64 mpn_lshift -- rp[] = up[] << cnt
Packit 6c4009
   Copyright (C) 2003-2018 Free Software Foundation, Inc.
Packit 6c4009
   This file is part of the GNU C Library.
Packit 6c4009
Packit 6c4009
   The GNU C Library is free software; you can redistribute it and/or
Packit 6c4009
   modify it under the terms of the GNU Lesser General Public
Packit 6c4009
   License as published by the Free Software Foundation; either
Packit 6c4009
   version 2.1 of the License, or (at your option) any later version.
Packit 6c4009
Packit 6c4009
   The GNU C Library is distributed in the hope that it will be useful,
Packit 6c4009
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 6c4009
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 6c4009
   Lesser General Public License for more details.
Packit 6c4009
Packit 6c4009
   You should have received a copy of the GNU Lesser General Public
Packit 6c4009
   License along with the GNU C Library; if not, see
Packit 6c4009
   <http://www.gnu.org/licenses/>.  */
Packit 6c4009
Packit 6c4009
#include <sysdep.h>
Packit 6c4009
Packit 6c4009
/* Register roles.  RP, UP, N and CNT name the registers the routine reads
   as its inputs; the remaining names are scratch registers.  */
#define RP       r3	/* destination limb pointer */
#define UP       r4	/* source limb pointer */
#define N        r5	/* number of 64-bit limbs to shift */
#define CNT      r6	/* left-shift count, in bits */

#define TNC      r0	/* 64 - CNT: right-shift count for the carried-in bits */
#define U0      r30	/* source limb scratch; saved on entry, restored on exit */
#define U1      r31	/* source limb scratch / loop count; saved and restored */
#define U0SAVE  (-16)	/* save slot for U0, as an offset from r1 */
#define U1SAVE  (-8)	/* save slot for U1, as an offset from r1 */
#define RETVAL   r5	/* result; aliases N and is written only after N's last use */

/* __mpn_lshift: rp[] = up[] << cnt, returning the bits shifted out.

   Every result limb is (up[i] << CNT) | (up[i-1] >> TNC); the lowest
   result limb is just up[0] << CNT.  The value returned in r3 is the top
   source limb shifted right by TNC, i.e. the bits pushed out of the most
   significant end.

   Both pointers are first advanced by N * 8 bytes so that they address
   one past the last limb; all loads and stores then use negative offsets
   and the operands are walked from the most significant limb downwards.

   The main loop at L(top) is unrolled four limbs per pass and software
   pipelined.  N mod 4 selects one of four prologues (L(b00), L(b01),
   L(b10), L(b11)); each primes the pipeline registers and biases RP/UP so
   that it can jump into the matching loop entry point (L(L00), L(L11),
   L(L10)) or fall into L(top).  CTR holds (N + 3) / 4.  The L(cjN) labels
   are entry points into the store-only tail for inputs too short to
   reach the loop.

   The top limb is loaded unconditionally, so N is presumably required to
   be at least 1, and CNT is presumably in 1..63 -- confirm against the
   callers.  U0/U1 are saved at negative offsets from r1 without moving
   r1; this relies on the ABI leaving that area usable by a function that
   makes no calls (NOTE(review): confirm for the target ABI).  */

ENTRY_TOCLESS (__mpn_lshift, 5)
	std	U1, U1SAVE(r1)
	std	U0, U0SAVE(r1)
	cfi_offset(U1, U1SAVE)
	cfi_offset(U0, U0SAVE)
	subfic	TNC, CNT, 64		/* TNC = 64 - CNT */
	sldi	r7, N, 3		/* r7 = N * 8 = operand size in bytes */
	add	UP, UP, r7		/* UP -> one past the last source limb */
	add	RP, RP, r7		/* RP -> one past the last result limb */
	rldicl.	U0, N, 0, 62		/* U0 = N mod 4; cr0 reflects U0 == 0 */
	cmpdi	cr6, U0, 2		/* cr6 orders N mod 4 against 2 */
	addi	U1, N, 3
	ld	r10, -8(UP)		/* r10 = most significant source limb */
	srd	RETVAL, r10, TNC	/* bits shifted out; N (same reg) is dead now */

	srdi	U1, U1, 2		/* U1 = (N + 3) / 4 */
	mtctr	U1
	beq	cr0, L(b00)		/* N mod 4 == 0 */
	blt	cr6, L(b01)		/* N mod 4 == 1 */
	ld	r11, -16(UP)
	beq	cr6, L(b10)		/* N mod 4 == 2 */

	/* N mod 4 == 3.  */
	.align	4
L(b11):	sld	r8, r10, CNT
	srd	r9, r11, TNC
	ld	U1, -24(UP)
	addi	UP, UP, -24
	sld	r12, r11, CNT
	srd	r7, U1, TNC
	addi	RP, RP, 16
	bdnz	L(gt3)			/* more than 3 limbs: join the loop */

	/* Exactly 3 limbs: finish in the tail.  */
	or	r11, r8, r9
	sld	r8, U1, CNT
	b	L(cj3)

	.align	4
L(gt3):	ld	U0, -8(UP)
	or	r11, r8, r9
	sld	r8, U1, CNT
	srd	r9, U0, TNC
	ld	U1, -16(UP)
	or	r10, r12, r7
	b	L(L11)

	/* N mod 4 == 2.  */
	.align	5
L(b10):	sld	r12, r10, CNT
	addi	RP, RP, 24
	srd	r7, r11, TNC
	bdnz	L(gt2)			/* more than 2 limbs: join the loop */

	/* Exactly 2 limbs: finish in the tail.  */
	sld	r8, r11, CNT
	or	r10, r12, r7
	b	L(cj2)

L(gt2):	ld	U0, -24(UP)
	sld	r8, r11, CNT
	srd	r9, U0, TNC
	ld	U1, -32(UP)
	or	r10, r12, r7
	sld	r12, U0, CNT
	srd	r7, U1, TNC
	ld	U0, -40(UP)
	or	r11, r8, r9
	addi	UP, UP, -16
	b	L(L10)

	/* N mod 4 == 0.  */
	.align	4
L(b00):	ld	U1, -16(UP)
	sld	r12, r10, CNT
	srd	r7, U1, TNC
	ld	U0, -24(UP)
	sld	r8, U1, CNT
	srd	r9, U0, TNC
	ld	U1, -32(UP)
	or	r10, r12, r7
	sld	r12, U0, CNT
	srd	r7, U1, TNC
	addi	RP, RP, 8
	bdz	L(cj4)			/* exactly 4 limbs: finish in the tail */

L(gt4):	addi	UP, UP, -32
	ld	U0, -8(UP)
	or	r11, r8, r9
	b	L(L00)

	/* N mod 4 == 1.  */
	.align	4
L(b01):	bdnz	L(gt1)			/* more than 1 limb: prime the loop */
	/* Single limb: the result is just that limb shifted left.  */
	sld	r8, r10, CNT
	std	r8, -8(RP)
	b	L(ret)

L(gt1):	ld	U0, -16(UP)
	sld	r8, r10, CNT
	srd	r9, U0, TNC
	ld	U1, -24(UP)
	sld	r12, U0, CNT
	srd	r7, U1, TNC
	ld	U0, -32(UP)
	or	r11, r8, r9
	sld	r8, U1, CNT
	srd	r9, U0, TNC
	ld	U1, -40(UP)
	addi	UP, UP, -40
	or	r10, r12, r7
	bdz	L(end)

	/* Main loop: each pass loads four source limbs and stores four
	   result limbs, then steps UP and RP down by 32 bytes.  r8/r9 and
	   r12/r7 carry the two halves of the limbs still being combined;
	   r10/r11 hold combined limbs waiting to be stored.  */
	.align	5
L(top):	sld	r12, U0, CNT
	srd	r7, U1, TNC
	ld	U0, -8(UP)
	std	r11, -8(RP)
	or	r11, r8, r9
L(L00):	sld	r8, U1, CNT
	srd	r9, U0, TNC
	ld	U1, -16(UP)
	std	r10, -16(RP)
	or	r10, r12, r7
L(L11):	sld	r12, U0, CNT
	srd	r7, U1, TNC
	ld	U0, -24(UP)
	std	r11, -24(RP)
	or	r11, r8, r9
L(L10):	sld	r8, U1, CNT
	srd	r9, U0, TNC
	ld	U1, -32(UP)
	addi	UP, UP, -32
	std	r10, -32(RP)
	addi	RP, RP, -32
	or	r10, r12, r7
	bdnz	L(top)

	/* Tail: no further loads; combine and store what is still held in
	   registers.  The final store writes the least significant result
	   limb, which has no lower neighbour to take bits from.  */
	.align	5
L(end):	sld	r12, U0, CNT
	srd	r7, U1, TNC
	std	r11, -8(RP)
L(cj4):	or	r11, r8, r9
	sld	r8, U1, CNT
	std	r10, -16(RP)
L(cj3):	or	r10, r12, r7
	std	r11, -24(RP)
L(cj2):	std	r10, -32(RP)
	std	r8, -40(RP)

L(ret):	ld	U1, U1SAVE(r1)
	ld	U0, U0SAVE(r1)
	mr	RP, RETVAL		/* r3 = bits shifted out of the top limb */
	blr
END(__mpn_lshift)