|
Packit |
5c3484 |
dnl PowerPC-32 mpn_mul_1 -- Multiply a limb vector with a limb and store the
|
|
Packit |
5c3484 |
dnl result in a second limb vector.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
dnl Copyright 1995, 1997, 2000, 2002, 2003, 2005 Free Software Foundation,
|
|
Packit |
5c3484 |
dnl Inc.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
dnl This file is part of the GNU MP Library.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl The GNU MP Library is free software; you can redistribute it and/or modify
|
|
Packit |
5c3484 |
dnl it under the terms of either:
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl * the GNU Lesser General Public License as published by the Free
|
|
Packit |
5c3484 |
dnl Software Foundation; either version 3 of the License, or (at your
|
|
Packit |
5c3484 |
dnl option) any later version.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl or
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl * the GNU General Public License as published by the Free Software
|
|
Packit |
5c3484 |
dnl Foundation; either version 2 of the License, or (at your option) any
|
|
Packit |
5c3484 |
dnl later version.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl or both in parallel, as here.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl The GNU MP Library is distributed in the hope that it will be useful, but
|
|
Packit |
5c3484 |
dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
|
|
Packit |
5c3484 |
dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
Packit |
5c3484 |
dnl for more details.
|
|
Packit |
5c3484 |
dnl
|
|
Packit |
5c3484 |
dnl You should have received copies of the GNU General Public License and the
|
|
Packit |
5c3484 |
dnl GNU Lesser General Public License along with the GNU MP Library. If not,
|
|
Packit |
5c3484 |
dnl see https://www.gnu.org/licenses/.
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
include(`../config.m4')
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
C cycles/limb
|
|
Packit |
5c3484 |
C 603e: ?
|
|
Packit |
5c3484 |
C 604e: 4.0
|
|
Packit |
5c3484 |
C 75x (G3): 4.5-11
|
|
Packit |
5c3484 |
C 7400,7410 (G4): 4.5-11
|
|
Packit |
5c3484 |
C 744x,745x (G4+): 6.0
|
|
Packit |
5c3484 |
C power4/ppc970: 6.0
|
|
Packit |
5c3484 |
C power5: 5.63
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
C INPUT PARAMETERS
|
|
Packit |
5c3484 |
C rp r3
|
|
Packit |
5c3484 |
C up r4
|
|
Packit |
5c3484 |
C n r5
|
|
Packit |
5c3484 |
C vl r6
|
|
Packit |
5c3484 |
|
|
Packit |
5c3484 |
ASM_START()
|
|
Packit |
5c3484 |
C mpn_mul_1: multiply the n-limb vector at up (r4) by the single limb vl (r6)
C and store the n low result limbs at rp (r3). The most significant limb of
C the product is left in r3 on return.
C
C Register use, as visible in the code below:
C   ctr      limbs not yet loaded (set from n, decremented after each load)
C   r8, r9   source limbs, loaded alternately
C   r11, r0  low and high word of r8 * vl
C   r10, r12 low and high word of r9 * vl
C   r5, r7   sums on their way to memory (r5 is reused once n is in ctr)
C   carry    chained from one adde to the next, folded in by the final addze
C
C Each stored limb is: low word of this product + high word of the previous
C product + carry from the previous addition.
C
C NOTE(review): n = 0 does not look supported. up[0] is loaded before any
C count check and the first bdz would decrement a zero ctr. Confirm that
C callers guarantee n >= 1.
PROLOGUE(mpn_mul_1)
|
|
Packit |
5c3484 |
mtctr r5 C ctr = n
|
|
Packit |
5c3484 |
addi r3,r3,-4 C bias rp by one limb so the stores below can use offsets 4 and 8
|
|
Packit |
5c3484 |
li r12,0 C clear upper product reg: nothing precedes the first limb
|
|
Packit |
5c3484 |
addic r0,r0,0 C clear cy: adding 0 leaves r0 unchanged and cannot carry out
|
|
Packit |
5c3484 |
C Start software pipeline
|
|
Packit |
5c3484 |
lwz r8,0(r4) C r8 = up[0]
|
|
Packit |
5c3484 |
bdz L(end3) C n = 1: single product, no pipeline needed
|
|
Packit |
5c3484 |
lwzu r9,4(r4) C r9 = up[1], up advanced by one limb
|
|
Packit |
5c3484 |
mullw r11,r8,r6 C r11 = low word of r8 * vl
|
|
Packit |
5c3484 |
mulhwu r0,r8,r6 C r0 = high word of r8 * vl
|
|
Packit |
5c3484 |
bdz L(end1) C n = 2: go straight to the drain code
|
|
Packit |
5c3484 |
C Software pipelined main loop
C Two limbs per pass. Each half loads one limb, multiplies the limb loaded
C one step earlier, and stores the result limb for the one before that.
|
|
Packit |
5c3484 |
L(loop):
|
|
Packit |
5c3484 |
lwz r8,4(r4) C next limb; up is not advanced here
|
|
Packit |
5c3484 |
mullw r10,r9,r6 C r10 = low word of r9 * vl
|
|
Packit |
5c3484 |
adde r5,r11,r12 C low word of older r8 product + high word of r9 product before it + carry
|
|
Packit |
5c3484 |
mulhwu r12,r9,r6 C r12 = high word of r9 * vl; the old r12 was consumed just above
|
|
Packit |
5c3484 |
stw r5,4(r3) C store without moving rp
|
|
Packit |
5c3484 |
bdz L(end2) C nothing left to load: drain with r8 still unmultiplied
|
|
Packit |
5c3484 |
lwzu r9,8(r4) C next limb; up advanced by two limbs
|
|
Packit |
5c3484 |
mullw r11,r8,r6 C r11 = low word of r8 * vl
|
|
Packit |
5c3484 |
adde r7,r10,r0 C low word of r9 product + high word of r8 product before it + carry
|
|
Packit |
5c3484 |
mulhwu r0,r8,r6 C r0 = high word of r8 * vl; the old r0 was consumed just above
|
|
Packit |
5c3484 |
stwu r7,8(r3) C store and advance rp by two limbs
|
|
Packit |
5c3484 |
bdnz L(loop) C fall through to end1 when no limbs remain
|
|
Packit |
5c3484 |
C Finish software pipeline
C end1 is reached with r9 loaded but not yet multiplied; r11 and r0 hold the
C product of the last r8 and r12 holds the high word of the product before it.
|
|
Packit |
5c3484 |
L(end1):
|
|
Packit |
5c3484 |
mullw r10,r9,r6 C low word of the final product
|
|
Packit |
5c3484 |
adde r5,r11,r12 C finish the limb for the pending r8 product
|
|
Packit |
5c3484 |
mulhwu r12,r9,r6 C high word of the final product
|
|
Packit |
5c3484 |
stw r5,4(r3)
|
|
Packit |
5c3484 |
adde r7,r10,r0 C last stored limb: final low word + previous high word + carry
|
|
Packit |
5c3484 |
stwu r7,8(r3)
|
|
Packit |
5c3484 |
addze r3,r12 C return value: final high word + carry
|
|
Packit |
5c3484 |
blr
|
|
Packit |
5c3484 |
C end2 is reached with r8 loaded but not yet multiplied; r10 and r12 hold the
C product of the last r9 and r0 holds the high word of the product before it.
L(end2):
|
|
Packit |
5c3484 |
mullw r11,r8,r6 C low word of the final product
|
|
Packit |
5c3484 |
adde r7,r10,r0 C finish the limb for the pending r9 product
|
|
Packit |
5c3484 |
mulhwu r0,r8,r6 C high word of the final product
|
|
Packit |
5c3484 |
stwu r7,8(r3) C store and advance rp by two limbs
|
|
Packit |
5c3484 |
adde r5,r11,r12 C last stored limb: final low word + previous high word + carry
|
|
Packit |
5c3484 |
stw r5,4(r3)
|
|
Packit |
5c3484 |
addze r3,r0 C return value: final high word + carry
|
|
Packit |
5c3484 |
blr
|
|
Packit |
5c3484 |
C end3 handles n = 1: one product, no carry to propagate.
L(end3):
|
|
Packit |
5c3484 |
mullw r11,r8,r6 C low word of up[0] * vl
|
|
Packit |
5c3484 |
stw r11,4(r3) C lands on the original rp because r3 was biased by -4 above
|
|
Packit |
5c3484 |
mulhwu r3,r8,r6 C return value: high word of up[0] * vl
|
|
Packit |
5c3484 |
blr
|
|
Packit |
5c3484 |
EPILOGUE(mpn_mul_1)
|