Blame sysdeps/x86_64/addmul_1.S

Packit 6c4009
/* x86-64 __mpn_addmul_1 -- Multiply a limb vector with a limb and add
Packit 6c4009
   the result to a second limb vector.
Packit 6c4009
   Copyright (C) 2003-2018 Free Software Foundation, Inc.
Packit 6c4009
   This file is part of the GNU MP Library.
Packit 6c4009
Packit 6c4009
   The GNU MP Library is free software; you can redistribute it and/or modify
Packit 6c4009
   it under the terms of the GNU Lesser General Public License as published by
Packit 6c4009
   the Free Software Foundation; either version 2.1 of the License, or (at your
Packit 6c4009
   option) any later version.
Packit 6c4009
Packit 6c4009
   The GNU MP Library is distributed in the hope that it will be useful, but
Packit 6c4009
   WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
Packit 6c4009
   or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
Packit 6c4009
   License for more details.
Packit 6c4009
Packit 6c4009
   You should have received a copy of the GNU Lesser General Public License
Packit 6c4009
   along with the GNU MP Library; see the file COPYING.LIB.  If not,
Packit 6c4009
   see <http://www.gnu.org/licenses/>.  */
Packit 6c4009
Packit 6c4009
#include "sysdep.h"
Packit 6c4009
#include "asm-syntax.h"
Packit 6c4009
Packit 6c4009
/* Symbolic names for the argument registers.  In the routine below, limbs
   are loaded from (up) and multiplied by %rcx, and limbs at (rp) are
   loaded, combined with the product via ADDSUB, and stored back.  */
#define rp	%rdi
Packit 6c4009
#define up	%rsi
Packit 6c4009
/* n and v0 name %rdx and %rcx; the routine body below spells those two
   registers out directly instead of using these names.  */
#define n	%rdx
Packit 6c4009
#define v0	%rcx
Packit 6c4009
Packit 6c4009
/* Defaults used when `func' has not been defined before this point: the
   entry point is __mpn_addmul_1 and ADDSUB expands to `add'.
   NOTE(review): presumably another file defines func/ADDSUB first and
   then includes this one to build a subtracting variant -- confirm.  */
#ifndef func
Packit 6c4009
# define func __mpn_addmul_1
Packit 6c4009
# define ADDSUB add
Packit 6c4009
#endif
Packit 6c4009
Packit 6c4009
	.text
Packit 6c4009
/* func (rp, up, n, v0)

   For each of the n limbs: multiply the limb read through `up' by %rcx
   (v0), combine the 128-bit product into the limb read through `rp' with
   ADSUB-style carry propagation (ADDSUB followed by adc), and store the
   result back through `rp'.

   In:   rp = %rdi, up = %rsi, n = %rdx, v0 = %rcx.
   Out:  %rax = high limb of the last product plus the carry flag left by
         the last ADDSUB.
   Uses: %rax, %rdx, %r8-%r11 as scratch; %rbx and %rbp are saved on the
         stack and restored.  %rdi and %rsi are modified.

   Assumes n >= 1: up[0] and rp[0] are loaded unconditionally, and the
   final `mov %ebx, %eax' relies on %rbx having reached exactly 0.

   `lea (%reg), %dst' is used throughout as a plain register copy; like
   mov it leaves the flags alone, so the carry produced by ADDSUB/adc
   survives until the next adc.  */
ENTRY (func)
Packit 6c4009
	/* NOTE(review): no CFI annotations accompany these pushes in the
	   visible source -- confirm whether unwind info is wanted.  */
	push	%rbx
Packit 6c4009
	push	%rbp
Packit 6c4009
	/* rbx = -n: a negative limb index that counts up towards 0.  */
	lea	(%rdx), %rbx
Packit 6c4009
	neg	%rbx
Packit 6c4009
Packit 6c4009
	/* Preload the first source limb and the first destination limb.  */
	mov	(up), %rax
Packit 6c4009
	mov	(rp), %r10
Packit 6c4009
Packit 6c4009
	/* Bias the pointers so they can be indexed with the negative rbx:
	   rp -> second-to-last destination limb, up -> one past the last
	   source limb.  This must happen before mul overwrites %rdx.  */
	lea	-16(rp,%rdx,8), rp
Packit 6c4009
	lea	(up,%rdx,8), up
Packit 6c4009
	/* rdx:rax = up[0] * v0.  */
	mul	%rcx
Packit 6c4009
Packit 6c4009
	/* Dispatch on the low bit of -n (same parity as n).  */
	bt	$0, %ebx
Packit 6c4009
	jc	L(odd)
Packit 6c4009
Packit 6c4009
	/* Even n: park product 0 in r11 (low) / rbp (high) and start
	   product 1.  */
	lea	(%rax), %r11
Packit 6c4009
	mov	8(up,%rbx,8), %rax
Packit 6c4009
	lea	(%rdx), %rbp
Packit 6c4009
	mul	%rcx
Packit 6c4009
	add	$2, %rbx
Packit 6c4009
	/* rbx reached 0 => n == 2: only the two-limb tail is left.  */
	jns	L(n2)
Packit 6c4009
Packit 6c4009
	/* Park product 1 in r8 (low) / r9 (high), load the next source
	   limb, and enter the loop at its second half.  */
	lea	(%rax), %r8
Packit 6c4009
	mov	(up,%rbx,8), %rax
Packit 6c4009
	lea	(%rdx), %r9
Packit 6c4009
	jmp	L(mid)
Packit 6c4009
Packit 6c4009
	/* Odd n.  rbx reached 0 => n == 1: only the one-limb tail is left.  */
L(odd):	add	$1, %rbx
Packit 6c4009
	jns	L(n1)
Packit 6c4009
Packit 6c4009
	/* Park product 0 in r8/r9, compute product 1 into r11/rbp, load
	   the next source limb, and enter the loop at the index update.  */
	lea	(%rax), %r8
Packit 6c4009
	mov	(up,%rbx,8), %rax
Packit 6c4009
	lea	(%rdx), %r9
Packit 6c4009
	mul	%rcx
Packit 6c4009
	lea	(%rax), %r11
Packit 6c4009
	mov	8(up,%rbx,8), %rax
Packit 6c4009
	lea	(%rdx), %rbp
Packit 6c4009
	jmp	L(e)
Packit 6c4009
Packit 6c4009
	/* Main loop, two limbs per iteration.  Two products are kept in
	   flight: r8 (low) / r9 (high) and r11 (low) / rbp (high).  r10
	   holds the destination limb currently being updated, rax the
	   source limb about to be multiplied.  */
	.p2align 4
Packit 6c4009
	/* First half: retire the r8 low limb into r10, fold the r9 high
	   limb plus carry into r11, then refill r8/r9 from the new
	   product.  */
L(top):	mul	%rcx
Packit 6c4009
	ADDSUB	%r8, %r10
Packit 6c4009
	lea	(%rax), %r8
Packit 6c4009
	mov	(up,%rbx,8), %rax
Packit 6c4009
	adc	%r9, %r11
Packit 6c4009
	mov	%r10, -8(rp,%rbx,8)
Packit 6c4009
	mov	(rp,%rbx,8), %r10
Packit 6c4009
	lea	(%rdx), %r9
Packit 6c4009
	/* Carry out of the r11 update goes into its high limb.  */
	adc	$0, %rbp
Packit 6c4009
	/* Second half: same steps with the register pairs swapped.  */
L(mid):	mul	%rcx
Packit 6c4009
	ADDSUB	%r11, %r10
Packit 6c4009
	lea	(%rax), %r11
Packit 6c4009
	mov	8(up,%rbx,8), %rax
Packit 6c4009
	adc	%rbp, %r8
Packit 6c4009
	mov	%r10, (rp,%rbx,8)
Packit 6c4009
	mov	8(rp,%rbx,8), %r10
Packit 6c4009
	lea	(%rdx), %rbp
Packit 6c4009
	adc	$0, %r9
Packit 6c4009
	/* Advance two limbs; keep looping while the index is negative.  */
L(e):	add	$2, %rbx
Packit 6c4009
	js	L(top)
Packit 6c4009
Packit 6c4009
	/* Loop exit: compute the last product and retire the r8/r9 pair
	   into the third-from-last destination limb.  */
	mul	%rcx
Packit 6c4009
	ADDSUB	%r8, %r10
Packit 6c4009
	adc	%r9, %r11
Packit 6c4009
	mov	%r10, -8(rp)
Packit 6c4009
	adc	$0, %rbp
Packit 6c4009
	/* Second-to-last destination limb: retire r11, fold rbp plus carry
	   into the low limb of the last product (rax) and the resulting
	   carry into its high limb (rdx).  */
L(n2):	mov	(rp), %r10
Packit 6c4009
	ADDSUB	%r11, %r10
Packit 6c4009
	adc	%rbp, %rax
Packit 6c4009
	mov	%r10, (rp)
Packit 6c4009
	adc	$0, %rdx
Packit 6c4009
	/* Last destination limb: retire rax.  */
L(n1):	mov	8(rp), %r10
Packit 6c4009
	ADDSUB	%rax, %r10
Packit 6c4009
	mov	%r10, 8(rp)
Packit 6c4009
	/* rbx is 0 on every path reaching here (given n >= 1), so this
	   clears rax without touching the carry flag from ADDSUB.  */
	mov	%ebx, %eax	/* zero rax */
Packit 6c4009
	/* Return value: final high limb plus the outstanding carry.  */
	adc	%rdx, %rax
Packit 6c4009
	pop	%rbp
Packit 6c4009
	pop	%rbx
Packit 6c4009
	ret
Packit 6c4009
END (func)