Blame nss/lib/freebl/mpi/mpi_x86_asm.c

Packit 40b132
/*
Packit 40b132
 *  mpi_x86_asm.c - MSVC inline assembly implementation of s_mpv_ functions.
Packit 40b132
 * 
Packit 40b132
 * This Source Code Form is subject to the terms of the Mozilla Public
Packit 40b132
 * License, v. 2.0. If a copy of the MPL was not distributed with this
Packit 40b132
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
Packit 40b132
Packit 40b132
#include "mpi-priv.h"
Packit 40b132
Packit 40b132
static int is_sse = -1;
Packit 40b132
extern unsigned long s_mpi_is_sse2();
Packit 40b132
Packit 40b132
/*
Packit 40b132
 *   ebp - 36:	caller's esi
Packit 40b132
 *   ebp - 32:	caller's edi
Packit 40b132
 *   ebp - 28:	
Packit 40b132
 *   ebp - 24:	
Packit 40b132
 *   ebp - 20:	
Packit 40b132
 *   ebp - 16:	
Packit 40b132
 *   ebp - 12:	
Packit 40b132
 *   ebp - 8:	
Packit 40b132
 *   ebp - 4:	
Packit 40b132
 *   ebp + 0:	caller's ebp
Packit 40b132
 *   ebp + 4:	return address
Packit 40b132
 *   ebp + 8:	a	argument
Packit 40b132
 *   ebp + 12:	a_len	argument
Packit 40b132
 *   ebp + 16:	b	argument
Packit 40b132
 *   ebp + 20:	c	argument
Packit 40b132
 *   registers:
Packit 40b132
 *  	eax:
Packit 40b132
 * 	ebx:	carry
Packit 40b132
 * 	ecx:	a_len
Packit 40b132
 * 	edx:
Packit 40b132
 * 	esi:	a ptr
Packit 40b132
 * 	edi:	c ptr
Packit 40b132
 */
Packit 40b132
__declspec(naked) void
Packit 40b132
s_mpv_mul_d(const mp_digit *a, mp_size a_len, mp_digit b, mp_digit *c)
Packit 40b132
{
Packit 40b132
  __asm {
Packit 40b132
    mov    eax, is_sse
Packit 40b132
    cmp    eax, 0
Packit 40b132
    je     s_mpv_mul_d_x86
Packit 40b132
    jg     s_mpv_mul_d_sse2
Packit 40b132
    call   s_mpi_is_sse2
Packit 40b132
    mov    is_sse, eax
Packit 40b132
    cmp    eax, 0
Packit 40b132
    jg     s_mpv_mul_d_sse2
Packit 40b132
s_mpv_mul_d_x86:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp,esp
Packit 40b132
    sub    esp,28
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    push   ebx
Packit 40b132
    mov    ebx,0		; carry = 0
Packit 40b132
    mov    ecx,[ebp+12]		; ecx = a_len
Packit 40b132
    mov    edi,[ebp+20]
Packit 40b132
    cmp    ecx,0
Packit 40b132
    je     L_2			; jmp if a_len == 0
Packit 40b132
    mov    esi,[ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_1:
Packit 40b132
    lodsd			; eax = [ds:esi]; esi += 4
Packit 40b132
    mov    edx,[ebp+16]		; edx = b
Packit 40b132
    mul    edx			; edx:eax = Phi:Plo = a_i * b
Packit 40b132
Packit 40b132
    add    eax,ebx		; add carry (ebx) to edx:eax
Packit 40b132
    adc    edx,0
Packit 40b132
    mov    ebx,edx		; high half of product becomes next carry
Packit 40b132
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_1			; jmp if a_len != 0
Packit 40b132
L_2:
Packit 40b132
    mov    [edi],ebx		; *c = carry
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
s_mpv_mul_d_sse2:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp, esp
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    psubq  mm2, mm2		; carry = 0
Packit 40b132
    mov    ecx, [ebp+12]	; ecx = a_len
Packit 40b132
    movd   mm1, [ebp+16]	; mm1 = b
Packit 40b132
    mov    edi, [ebp+20]
Packit 40b132
    cmp    ecx, 0
Packit 40b132
    je     L_6			; jmp if a_len == 0
Packit 40b132
    mov    esi, [ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_5:
Packit 40b132
    movd   mm0, [esi]		; mm0 = *a++
Packit 40b132
    add    esi, 4
Packit 40b132
    pmuludq mm0, mm1		; mm0 = b * *a++
Packit 40b132
    paddq  mm2, mm0		; add the carry
Packit 40b132
    movd   [edi], mm2		; store the 32bit result
Packit 40b132
    add    edi, 4
Packit 40b132
    psrlq  mm2, 32		; save the carry
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_5			; jmp if a_len != 0
Packit 40b132
L_6:
Packit 40b132
    movd   [edi], mm2		; *c = carry
Packit 40b132
    emms
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
  }
Packit 40b132
}
Packit 40b132
Packit 40b132
/*
Packit 40b132
 *   ebp - 36:	caller's esi
Packit 40b132
 *   ebp - 32:	caller's edi
Packit 40b132
 *   ebp - 28:	
Packit 40b132
 *   ebp - 24:	
Packit 40b132
 *   ebp - 20:	
Packit 40b132
 *   ebp - 16:	
Packit 40b132
 *   ebp - 12:	
Packit 40b132
 *   ebp - 8:	
Packit 40b132
 *   ebp - 4:	
Packit 40b132
 *   ebp + 0:	caller's ebp
Packit 40b132
 *   ebp + 4:	return address
Packit 40b132
 *   ebp + 8:	a	argument
Packit 40b132
 *   ebp + 12:	a_len	argument
Packit 40b132
 *   ebp + 16:	b	argument
Packit 40b132
 *   ebp + 20:	c	argument
Packit 40b132
 *   registers:
Packit 40b132
 *  	eax:
Packit 40b132
 * 	ebx:	carry
Packit 40b132
 * 	ecx:	a_len
Packit 40b132
 * 	edx:
Packit 40b132
 * 	esi:	a ptr
Packit 40b132
 * 	edi:	c ptr
Packit 40b132
 */
Packit 40b132
__declspec(naked) void
Packit 40b132
s_mpv_mul_d_add(const mp_digit *a, mp_size a_len, mp_digit b, mp_digit *c)
Packit 40b132
{
Packit 40b132
  __asm {
Packit 40b132
    mov    eax, is_sse
Packit 40b132
    cmp    eax, 0
Packit 40b132
    je     s_mpv_mul_d_add_x86
Packit 40b132
    jg     s_mpv_mul_d_add_sse2
Packit 40b132
    call   s_mpi_is_sse2
Packit 40b132
    mov    is_sse, eax
Packit 40b132
    cmp    eax, 0
Packit 40b132
    jg     s_mpv_mul_d_add_sse2
Packit 40b132
s_mpv_mul_d_add_x86:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp,esp
Packit 40b132
    sub    esp,28
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    push   ebx
Packit 40b132
    mov    ebx,0		; carry = 0
Packit 40b132
    mov    ecx,[ebp+12]		; ecx = a_len
Packit 40b132
    mov    edi,[ebp+20]
Packit 40b132
    cmp    ecx,0
Packit 40b132
    je     L_11			; jmp if a_len == 0
Packit 40b132
    mov    esi,[ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_10:
Packit 40b132
    lodsd			; eax = [ds:esi]; esi += 4
Packit 40b132
    mov    edx,[ebp+16]		; edx = b
Packit 40b132
    mul    edx			; edx:eax = Phi:Plo = a_i * b
Packit 40b132
Packit 40b132
    add    eax,ebx		; add carry (ebx) to edx:eax
Packit 40b132
    adc    edx,0
Packit 40b132
    mov    ebx,[edi]		; add in current word from *c
Packit 40b132
    add    eax,ebx		
Packit 40b132
    adc    edx,0
Packit 40b132
    mov    ebx,edx		; high half of product becomes next carry
Packit 40b132
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_10			; jmp if a_len != 0
Packit 40b132
L_11:
Packit 40b132
    mov    [edi],ebx		; *c = carry
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
s_mpv_mul_d_add_sse2:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp, esp
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    psubq  mm2, mm2		; carry = 0
Packit 40b132
    mov    ecx, [ebp+12]	; ecx = a_len
Packit 40b132
    movd   mm1, [ebp+16]	; mm1 = b
Packit 40b132
    mov    edi, [ebp+20]
Packit 40b132
    cmp    ecx, 0
Packit 40b132
    je     L_16			; jmp if a_len == 0
Packit 40b132
    mov    esi, [ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_15:
Packit 40b132
    movd   mm0, [esi]		; mm0 = *a++
Packit 40b132
    add    esi, 4
Packit 40b132
    pmuludq mm0, mm1		; mm0 = b * *a++
Packit 40b132
    paddq  mm2, mm0		; add the carry
Packit 40b132
    movd   mm0, [edi]
Packit 40b132
    paddq  mm2, mm0		; add the carry
Packit 40b132
    movd   [edi], mm2		; store the 32bit result
Packit 40b132
    add    edi, 4
Packit 40b132
    psrlq  mm2, 32		; save the carry
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_15			; jmp if a_len != 0
Packit 40b132
L_16:
Packit 40b132
    movd   [edi], mm2		; *c = carry
Packit 40b132
    emms
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
  }
Packit 40b132
}
Packit 40b132
Packit 40b132
/*
Packit 40b132
 *   ebp - 36:	caller's esi
Packit 40b132
 *   ebp - 32:	caller's edi
Packit 40b132
 *   ebp - 28:	
Packit 40b132
 *   ebp - 24:	
Packit 40b132
 *   ebp - 20:	
Packit 40b132
 *   ebp - 16:	
Packit 40b132
 *   ebp - 12:	
Packit 40b132
 *   ebp - 8:	
Packit 40b132
 *   ebp - 4:	
Packit 40b132
 *   ebp + 0:	caller's ebp
Packit 40b132
 *   ebp + 4:	return address
Packit 40b132
 *   ebp + 8:	a	argument
Packit 40b132
 *   ebp + 12:	a_len	argument
Packit 40b132
 *   ebp + 16:	b	argument
Packit 40b132
 *   ebp + 20:	c	argument
Packit 40b132
 *   registers:
Packit 40b132
 *  	eax:
Packit 40b132
 * 	ebx:	carry
Packit 40b132
 * 	ecx:	a_len
Packit 40b132
 * 	edx:
Packit 40b132
 * 	esi:	a ptr
Packit 40b132
 * 	edi:	c ptr
Packit 40b132
 */
Packit 40b132
__declspec(naked) void
Packit 40b132
s_mpv_mul_d_add_prop(const mp_digit *a, mp_size a_len, mp_digit b, mp_digit *c)
Packit 40b132
{
Packit 40b132
  __asm {
Packit 40b132
    mov    eax, is_sse
Packit 40b132
    cmp    eax, 0
Packit 40b132
    je     s_mpv_mul_d_add_prop_x86
Packit 40b132
    jg     s_mpv_mul_d_add_prop_sse2
Packit 40b132
    call   s_mpi_is_sse2
Packit 40b132
    mov    is_sse, eax
Packit 40b132
    cmp    eax, 0
Packit 40b132
    jg     s_mpv_mul_d_add_prop_sse2
Packit 40b132
s_mpv_mul_d_add_prop_x86:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp,esp
Packit 40b132
    sub    esp,28
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    push   ebx
Packit 40b132
    mov    ebx,0		; carry = 0
Packit 40b132
    mov    ecx,[ebp+12]		; ecx = a_len
Packit 40b132
    mov    edi,[ebp+20]
Packit 40b132
    cmp    ecx,0
Packit 40b132
    je     L_21			; jmp if a_len == 0
Packit 40b132
    cld
Packit 40b132
    mov    esi,[ebp+8]		; esi = a
Packit 40b132
L_20:
Packit 40b132
    lodsd			; eax = [ds:esi]; esi += 4
Packit 40b132
    mov    edx,[ebp+16]		; edx = b
Packit 40b132
    mul    edx			; edx:eax = Phi:Plo = a_i * b
Packit 40b132
Packit 40b132
    add    eax,ebx		; add carry (ebx) to edx:eax
Packit 40b132
    adc    edx,0
Packit 40b132
    mov    ebx,[edi]		; add in current word from *c
Packit 40b132
    add    eax,ebx		
Packit 40b132
    adc    edx,0
Packit 40b132
    mov    ebx,edx		; high half of product becomes next carry
Packit 40b132
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_20			; jmp if a_len != 0
Packit 40b132
L_21:
Packit 40b132
    cmp    ebx,0		; is carry zero?
Packit 40b132
    jz     L_23
Packit 40b132
    mov    eax,[edi]		; add in current word from *c
Packit 40b132
    add    eax,ebx
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jnc    L_23
Packit 40b132
L_22:
Packit 40b132
    mov    eax,[edi]		; add in current word from *c
Packit 40b132
    adc    eax,0
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jc     L_22
Packit 40b132
L_23:
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
s_mpv_mul_d_add_prop_sse2:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp, esp
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    push   ebx
Packit 40b132
    psubq  mm2, mm2		; carry = 0
Packit 40b132
    mov    ecx, [ebp+12]	; ecx = a_len
Packit 40b132
    movd   mm1, [ebp+16]	; mm1 = b
Packit 40b132
    mov    edi, [ebp+20]
Packit 40b132
    cmp    ecx, 0
Packit 40b132
    je     L_26			; jmp if a_len == 0
Packit 40b132
    mov    esi, [ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_25:
Packit 40b132
    movd   mm0, [esi]		; mm0 = *a++
Packit 40b132
    movd   mm3, [edi]		; fetch the sum
Packit 40b132
    add    esi, 4
Packit 40b132
    pmuludq mm0, mm1		; mm0 = b * *a++
Packit 40b132
    paddq  mm2, mm0		; add the carry
Packit 40b132
    paddq  mm2, mm3		; add *c++
Packit 40b132
    movd   [edi], mm2		; store the 32bit result
Packit 40b132
    add    edi, 4
Packit 40b132
    psrlq  mm2, 32		; save the carry
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_25			; jmp if a_len != 0
Packit 40b132
L_26:
Packit 40b132
    movd   ebx, mm2
Packit 40b132
    cmp    ebx, 0		; is carry zero?
Packit 40b132
    jz     L_28
Packit 40b132
    mov    eax, [edi]
Packit 40b132
    add    eax, ebx
Packit 40b132
    stosd
Packit 40b132
    jnc    L_28
Packit 40b132
L_27:
Packit 40b132
    mov    eax, [edi]		; add in current word from *c
Packit 40b132
    adc	   eax, 0
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jc     L_27
Packit 40b132
L_28:
Packit 40b132
    emms
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
  }
Packit 40b132
}
Packit 40b132
Packit 40b132
/*
Packit 40b132
 *   ebp - 20:	caller's esi
Packit 40b132
 *   ebp - 16:	caller's edi
Packit 40b132
 *   ebp - 12:	
Packit 40b132
 *   ebp - 8:	carry
Packit 40b132
 *   ebp - 4:	a_len	local
Packit 40b132
 *   ebp + 0:	caller's ebp
Packit 40b132
 *   ebp + 4:	return address
Packit 40b132
 *   ebp + 8:	pa	argument
Packit 40b132
 *   ebp + 12:	a_len	argument
Packit 40b132
 *   ebp + 16:	ps	argument
Packit 40b132
 *   ebp + 20:	
Packit 40b132
 *   registers:
Packit 40b132
 *  	eax:
Packit 40b132
 * 	ebx:	carry
Packit 40b132
 * 	ecx:	a_len
Packit 40b132
 * 	edx:
Packit 40b132
 * 	esi:	a ptr
Packit 40b132
 * 	edi:	c ptr
Packit 40b132
 */
Packit 40b132
__declspec(naked) void
Packit 40b132
s_mpv_sqr_add_prop(const mp_digit *a, mp_size a_len, mp_digit *sqrs)
Packit 40b132
{
Packit 40b132
  __asm {
Packit 40b132
     mov    eax, is_sse
Packit 40b132
     cmp    eax, 0
Packit 40b132
     je     s_mpv_sqr_add_prop_x86
Packit 40b132
     jg     s_mpv_sqr_add_prop_sse2
Packit 40b132
     call   s_mpi_is_sse2
Packit 40b132
     mov    is_sse, eax
Packit 40b132
     cmp    eax, 0
Packit 40b132
     jg     s_mpv_sqr_add_prop_sse2
Packit 40b132
s_mpv_sqr_add_prop_x86:
Packit 40b132
     push   ebp
Packit 40b132
     mov    ebp,esp
Packit 40b132
     sub    esp,12
Packit 40b132
     push   edi
Packit 40b132
     push   esi
Packit 40b132
     push   ebx
Packit 40b132
     mov    ebx,0		; carry = 0
Packit 40b132
     mov    ecx,[ebp+12]	; a_len
Packit 40b132
     mov    edi,[ebp+16]	; edi = ps
Packit 40b132
     cmp    ecx,0
Packit 40b132
     je     L_31		; jump if a_len == 0
Packit 40b132
     cld
Packit 40b132
     mov    esi,[ebp+8]		; esi = pa
Packit 40b132
L_30:
Packit 40b132
     lodsd			; eax = [ds:si]; si += 4;
Packit 40b132
     mul    eax
Packit 40b132
Packit 40b132
     add    eax,ebx		; add "carry"
Packit 40b132
     adc    edx,0
Packit 40b132
     mov    ebx,[edi]
Packit 40b132
     add    eax,ebx		; add low word from result
Packit 40b132
     mov    ebx,[edi+4]
Packit 40b132
     stosd			; [es:di] = eax; di += 4;
Packit 40b132
     adc    edx,ebx		; add high word from result
Packit 40b132
     mov    ebx,0
Packit 40b132
     mov    eax,edx
Packit 40b132
     adc    ebx,0
Packit 40b132
     stosd			; [es:di] = eax; di += 4;
Packit 40b132
     dec    ecx			; --a_len
Packit 40b132
     jnz    L_30		; jmp if a_len != 0
Packit 40b132
L_31:
Packit 40b132
    cmp    ebx,0		; is carry zero?
Packit 40b132
    jz     L_34
Packit 40b132
    mov    eax,[edi]		; add in current word from *c
Packit 40b132
    add    eax,ebx
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jnc    L_34
Packit 40b132
L_32:
Packit 40b132
    mov    eax,[edi]		; add in current word from *c
Packit 40b132
    adc    eax,0
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jc     L_32
Packit 40b132
L_34:
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
s_mpv_sqr_add_prop_sse2:
Packit 40b132
    push   ebp
Packit 40b132
    mov    ebp, esp
Packit 40b132
    push   edi
Packit 40b132
    push   esi
Packit 40b132
    push   ebx
Packit 40b132
    psubq  mm2, mm2		; carry = 0
Packit 40b132
    mov    ecx, [ebp+12]	; ecx = a_len
Packit 40b132
    mov    edi, [ebp+16]
Packit 40b132
    cmp    ecx, 0
Packit 40b132
    je     L_36		; jmp if a_len == 0
Packit 40b132
    mov    esi, [ebp+8]		; esi = a
Packit 40b132
    cld
Packit 40b132
L_35:
Packit 40b132
    movd   mm0, [esi]		; mm0 = *a
Packit 40b132
    movd   mm3, [edi]		; fetch the sum
Packit 40b132
    add	   esi, 4
Packit 40b132
    pmuludq mm0, mm0		; mm0 = sqr(a)
Packit 40b132
    paddq  mm2, mm0		; add the carry
Packit 40b132
    paddq  mm2, mm3		; add the low word
Packit 40b132
    movd   mm3, [edi+4]
Packit 40b132
    movd   [edi], mm2		; store the 32bit result
Packit 40b132
    psrlq  mm2, 32	
Packit 40b132
    paddq  mm2, mm3		; add the high word
Packit 40b132
    movd   [edi+4], mm2		; store the 32bit result
Packit 40b132
    psrlq  mm2, 32		; save the carry.
Packit 40b132
    add    edi, 8
Packit 40b132
    dec    ecx			; --a_len
Packit 40b132
    jnz    L_35			; jmp if a_len != 0
Packit 40b132
L_36:
Packit 40b132
    movd   ebx, mm2
Packit 40b132
    cmp    ebx, 0		; is carry zero?
Packit 40b132
    jz     L_38
Packit 40b132
    mov    eax, [edi]
Packit 40b132
    add    eax, ebx
Packit 40b132
    stosd
Packit 40b132
    jnc    L_38
Packit 40b132
L_37:
Packit 40b132
    mov    eax, [edi]		; add in current word from *c
Packit 40b132
    adc	   eax, 0
Packit 40b132
    stosd			; [es:edi] = ax; edi += 4;
Packit 40b132
    jc     L_37
Packit 40b132
L_38:
Packit 40b132
    emms
Packit 40b132
    pop    ebx
Packit 40b132
    pop    esi
Packit 40b132
    pop    edi
Packit 40b132
    leave  
Packit 40b132
    ret    
Packit 40b132
    nop
Packit 40b132
  }
Packit 40b132
}
Packit 40b132
Packit 40b132
/* 
Packit 40b132
 *  Divide 64-bit (Nhi,Nlo) by 32-bit divisor, which must be normalized
Packit 40b132
 *  so its high bit is 1.   This code is from NSPR.
Packit 40b132
 *
Packit 40b132
 *  Dump of assembler code for function s_mpv_div_2dx1d:
Packit 40b132
 *  
Packit 40b132
 *   esp +  0:   Caller's ebx
Packit 40b132
 *   esp +  4:	return address
Packit 40b132
 *   esp +  8:	Nhi	argument
Packit 40b132
 *   esp + 12:	Nlo	argument
Packit 40b132
 *   esp + 16:	divisor	argument
Packit 40b132
 *   esp + 20:	qp	argument
Packit 40b132
 *   esp + 24:   rp	argument
Packit 40b132
 *   registers:
Packit 40b132
 *  	eax:
Packit 40b132
 * 	ebx:	carry
Packit 40b132
 * 	ecx:	a_len
Packit 40b132
 * 	edx:
Packit 40b132
 * 	esi:	a ptr
Packit 40b132
 * 	edi:	c ptr
Packit 40b132
 */  
Packit 40b132
__declspec(naked) mp_err
Packit 40b132
s_mpv_div_2dx1d(mp_digit Nhi, mp_digit Nlo, mp_digit divisor,
Packit 40b132
		mp_digit *qp, mp_digit *rp)
Packit 40b132
{
Packit 40b132
  __asm {
Packit 40b132
       push   ebx
Packit 40b132
       mov    edx,[esp+8]
Packit 40b132
       mov    eax,[esp+12]
Packit 40b132
       mov    ebx,[esp+16]
Packit 40b132
       div    ebx
Packit 40b132
       mov    ebx,[esp+20]
Packit 40b132
       mov    [ebx],eax
Packit 40b132
       mov    ebx,[esp+24]
Packit 40b132
       mov    [ebx],edx
Packit 40b132
       xor    eax,eax		; return zero
Packit 40b132
       pop    ebx
Packit 40b132
       ret    
Packit 40b132
       nop
Packit 40b132
  }
Packit 40b132
}