|
Packit |
5c3484 |
dnl Alpha mpn_sec_tabselect.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
dnl Contributed to the GNU project by Torbjörn Granlund.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
dnl Copyright 2011-2013 Free Software Foundation, Inc.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
dnl This file is part of the GNU MP Library.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl The GNU MP Library is free software; you can redistribute it and/or modify
|
|
Packit |
5c3484 |
dnl it under the terms of either:
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl * the GNU Lesser General Public License as published by the Free
|
|
Packit |
5c3484 |
dnl Software Foundation; either version 3 of the License, or (at your
|
|
Packit |
5c3484 |
dnl option) any later version.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl or
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl * the GNU General Public License as published by the Free Software
|
|
Packit |
5c3484 |
dnl Foundation; either version 2 of the License, or (at your option) any
|
|
Packit |
5c3484 |
dnl later version.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl or both in parallel, as here.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl The GNU MP Library is distributed in the hope that it will be useful, but
|
|
Packit |
5c3484 |
dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
|
|
Packit |
5c3484 |
dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
Packit |
5c3484 |
dnl for more details.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl You should have received copies of the GNU General Public License and the
|
|
Packit |
5c3484 |
dnl GNU Lesser General Public License along with the GNU MP Library. If not,
|
|
Packit |
5c3484 |
dnl see https://www.gnu.org/licenses/.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
include(`../config.m4')
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
C cycles/limb
|
|
Packit |
5c3484 |
C EV4: ?
|
|
Packit |
5c3484 |
C EV5: 2.25
|
|
Packit |
5c3484 |
C EV6: 1.64
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
define(`rp', `r16') C destination pointer: the selected limbs are stored through it
|
|
Packit |
5c3484 |
define(`tp', `r17') C table pointer: every entry is loaded through it
|
|
Packit |
5c3484 |
define(`n', `r18') C limbs per table entry: entries are 8*n bytes apart
|
|
Packit |
5c3484 |
define(`nents', `r19') C number of table entries visited by each inner loop
|
|
Packit |
5c3484 |
define(`which', `r20') C index of the entry to copy out, counted from 0
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
define(`i', `r21') C inner loop counter, runs from nents down to 1
|
|
Packit |
5c3484 |
define(`j', `r22') C outer loop counter, starts at n - 4 and drops by 4
|
|
Packit |
5c3484 |
define(`stride', `r23') C NOTE(review): not referenced by the code visible in this file
|
|
Packit |
5c3484 |
define(`mask', `r24') C all ones for the selected entry, zero for every other entry
|
|
Packit |
5c3484 |
define(`k', `r25') C nents - which: the value of i at the selected entry
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
ASM_START()
|
|
Packit |
5c3484 |
C mpn_sec_tabselect: copy entry number which of a table into rp.
C
C The table at tp holds nents entries of n 8-byte limbs each, and consecutive
C entries are 8*n bytes apart.  Every entry is loaded, ANDed with a mask that
C is all ones only for the selected entry, and ORed into accumulators, so the
C loads and branches executed depend on n and nents but not on which.
C
C Limbs are handled in columns: four at a time while at least four remain,
C then a two-limb step if bit 1 of n is set, then a one-limb step if bit 0 is.
C
C The inner loops decrement i before testing it, so nents must be nonzero.
C NOTE(review): which is presumably in the range 0..nents-1.  Outside that
C range the mask is never set and zeros are stored - confirm against callers.
C
C Registers written: r0-r8 plus i, j, mask and k, and rp and tp are advanced.
PROLOGUE(mpn_sec_tabselect)
|
|
Packit |
5c3484 |
subq n, 4, j C j = n - 4, the outer loop induction variable
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
blt j, L(outer_end) C fewer than 4 limbs per entry: skip the 4-limb loop
|
|
Packit |
5c3484 |
L(outer_top):
|
|
Packit |
5c3484 |
mov tp, r8 C remember the column start, tp is advanced by the inner loop
|
|
Packit |
5c3484 |
lda r0, 0(r31) C clear the four accumulators r0-r3 (r31 reads as zero)
|
|
Packit |
5c3484 |
lda r1, 0(r31)
|
|
Packit |
5c3484 |
lda r2, 0(r31)
|
|
Packit |
5c3484 |
lda r3, 0(r31)
|
|
Packit |
5c3484 |
subq j, 4, j C outer loop induction variable, still >= 0 if another 4-limb column remains
|
|
Packit |
5c3484 |
subq nents, which, k C k = nents - which, the value i has at the selected entry
|
|
Packit |
5c3484 |
mov nents, i C i counts down from nents to 1 over the entries
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
ALIGN(16)
|
|
Packit |
5c3484 |
L(top): ldq r4, 0(tp) C load limbs 0 and 1 of this entry
|
|
Packit |
5c3484 |
ldq r5, 8(tp)
|
|
Packit |
5c3484 |
cmpeq k, i, mask C mask = 1 if this is the selected entry, else 0
|
|
Packit |
5c3484 |
subq i, 1, i C one entry fewer to visit
|
|
Packit |
5c3484 |
subq r31, mask, mask C mask = 0 - mask: all ones if selected, else zero
|
|
Packit |
5c3484 |
ldq r6, 16(tp) C load limbs 2 and 3 of this entry
|
|
Packit |
5c3484 |
ldq r7, 24(tp)
|
|
Packit |
5c3484 |
and r4, mask, r4 C keep the limb only when this is the selected entry
|
|
Packit |
5c3484 |
and r5, mask, r5
|
|
Packit |
5c3484 |
or r0, r4, r0 C merge into the accumulator
|
|
Packit |
5c3484 |
or r1, r5, r1
|
|
Packit |
5c3484 |
and r6, mask, r6
|
|
Packit |
5c3484 |
and r7, mask, r7
|
|
Packit |
5c3484 |
or r2, r6, r2
|
|
Packit |
5c3484 |
or r3, r7, r3
|
|
Packit |
5c3484 |
s8addq n, tp, tp C tp += 8*n: the same column of the next entry
|
|
Packit |
5c3484 |
bne i, L(top) C loop until all nents entries have been visited
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
stq r0, 0(rp) C store the four selected limbs
|
|
Packit |
5c3484 |
stq r1, 8(rp)
|
|
Packit |
5c3484 |
stq r2, 16(rp)
|
|
Packit |
5c3484 |
stq r3, 24(rp)
|
|
Packit |
5c3484 |
addq r8, 32, tp C tp = saved column start + 32: next 4-limb column of the first entry
|
|
Packit |
5c3484 |
addq rp, 32, rp C advance the destination by 4 limbs
|
|
Packit |
5c3484 |
bge j, L(outer_top) C another full 4-limb column remains
|
|
Packit |
5c3484 |
L(outer_end):
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
and n, 2, r0 C test bit 1 of n: is a 2-limb step needed?
|
|
Packit |
5c3484 |
beq r0, L(b0x)
|
|
Packit |
5c3484 |
L(b1x): mov tp, r8 C 2-limb step: remember the column start
|
|
Packit |
5c3484 |
lda r0, 0(r31) C clear the two accumulators r0 and r1
|
|
Packit |
5c3484 |
lda r1, 0(r31)
|
|
Packit |
5c3484 |
subq nents, which, k C k = nents - which, as in the 4-limb loop
|
|
Packit |
5c3484 |
mov nents, i C i counts down from nents to 1
|
|
Packit |
5c3484 |
ALIGN(16)
|
|
Packit |
5c3484 |
L(tp2): ldq r4, 0(tp) C load the two limbs of this entry
|
|
Packit |
5c3484 |
ldq r5, 8(tp)
|
|
Packit |
5c3484 |
cmpeq k, i, mask C mask = 1 if this is the selected entry, else 0
|
|
Packit |
5c3484 |
subq i, 1, i
|
|
Packit |
5c3484 |
subq r31, mask, mask C widen to all ones or zero
|
|
Packit |
5c3484 |
and r4, mask, r4
|
|
Packit |
5c3484 |
and r5, mask, r5
|
|
Packit |
5c3484 |
or r0, r4, r0
|
|
Packit |
5c3484 |
or r1, r5, r1
|
|
Packit |
5c3484 |
s8addq n, tp, tp C tp += 8*n: the same column of the next entry
|
|
Packit |
5c3484 |
bne i, L(tp2)
|
|
Packit |
5c3484 |
stq r0, 0(rp) C store the two selected limbs
|
|
Packit |
5c3484 |
stq r1, 8(rp)
|
|
Packit |
5c3484 |
addq r8, 16, tp C tp = saved column start + 16: back to the first entry, 2 limbs on
|
|
Packit |
5c3484 |
addq rp, 16, rp C advance the destination by 2 limbs
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
L(b0x): and n, 1, r0 C test bit 0 of n: is a final single limb needed?
|
|
Packit |
5c3484 |
beq r0, L(b00)
|
|
Packit |
5c3484 |
L(b01): lda r0, 0(r31) C 1-limb step: clear the single accumulator
|
|
Packit |
5c3484 |
subq nents, which, k C k = nents - which, as in the loops above
|
|
Packit |
5c3484 |
mov nents, i C i counts down from nents to 1
|
|
Packit |
5c3484 |
ALIGN(16)
|
|
Packit |
5c3484 |
L(tp1): ldq r4, 0(tp) C load the last limb of this entry
|
|
Packit |
5c3484 |
cmpeq k, i, mask C mask = 1 if this is the selected entry, else 0
|
|
Packit |
5c3484 |
subq i, 1, i
|
|
Packit |
5c3484 |
subq r31, mask, mask C widen to all ones or zero
|
|
Packit |
5c3484 |
and r4, mask, r4
|
|
Packit |
5c3484 |
or r0, r4, r0
|
|
Packit |
5c3484 |
s8addq n, tp, tp C tp is not saved here: nothing is loaded after this loop
|
|
Packit |
5c3484 |
bne i, L(tp1)
|
|
Packit |
5c3484 |
stq r0, 0(rp) C store the final selected limb
|
|
Packit |
5c3484 |

|
Packit |
5c3484 |
L(b00): ret r31, (r26), 1 C return through the address held in r26
|
|
Packit |
5c3484 |
EPILOGUE()
|