; mpir/mpn/x86w/mul_1.asm  (NASM syntax)

; Copyright 1992, 1994, 1997, 1998, 1999, 2000, 2001, 2002 Free Software
; Foundation, Inc.
;
; This file is part of the GNU MP Library.
;
; The GNU MP Library is free software; you can redistribute it and/or
; modify it under the terms of the GNU Lesser General Public License as
; published by the Free Software Foundation; either version 2.1 of the
; License, or (at your option) any later version.
;
; The GNU MP Library is distributed in the hope that it will be useful,
; but WITHOUT ANY WARRANTY; without even the implied warranty of
; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
; Lesser General Public License for more details.
;
; You should have received a copy of the GNU Lesser General Public
; License along with the GNU MP Library; see the file COPYING.LIB. If
; not, write to the Free Software Foundation, Inc., 59 Temple Place -
; Suite 330, Boston, MA 02111-1307, USA.
;
; Translation of AT&T syntax code by Brian Gladman
%include "x86i.inc"

; `frame` counts the bytes pushed onto the stack since function entry.
; The PARAM_* macros below are plain %define's, so `frame` is looked up at
; each point of use; it has to be bumped with %assign after every group of
; pushes for the offsets to stay correct.
%assign frame 0

; Stack arguments, addressed relative to the current esp.
; At entry (frame = 0) [esp] holds the return address and the four dword
; arguments follow it in ascending order.
%define PARAM_DST        esp+frame+4
%define PARAM_SRC        esp+frame+8
%define PARAM_SIZE       esp+frame+12
%define PARAM_MULTIPLIER esp+frame+16

        section .text

        global  ___gmpn_mul_1
%ifdef DLL
        export  ___gmpn_mul_1
%endif

        align   8
;-----------------------------------------------------------------------
; ___gmpn_mul_1
;
; Multiplies a vector of 32-bit limbs by a single 32-bit multiplier.
; Equivalent pseudo-C:
;
;     cy = 0;
;     for (i = 0; i < size; i++) {
;         p      = (uint64)src[i] * multiplier + cy;
;         dst[i] = low32(p);
;         cy     = high32(p);
;     }
;     return cy;
;
; In:    four dword stack arguments (see PARAM_DST, PARAM_SRC, PARAM_SIZE,
;        PARAM_MULTIPLIER); the plain `ret` leaves them for the caller
;        to remove.
; Out:   eax = carry limb left over after the last multiplication
; Saved: edi, esi, ebx, ebp (pushed on entry, popped on exit)
; Clobb: eax, ecx, edx, flags
;
; Register roles:
;   esi      read pointer into the source limbs
;   edi      write pointer into the destination limbs
;   ecx      loop counter
;   edx:eax  64-bit product delivered by `mul`
;   ebx/ebp  carry limb; the unrolled loop alternates between the two
;
; The first (size mod 4) limbs are handled one at a time, the remaining
; size/4 groups by a loop unrolled four times.
;
; Wherever a register is cleared between an `add` and the following
; `adc`, `mov reg,0` is used on purpose: unlike `xor reg,reg` it leaves
; the carry flag intact.
;-----------------------------------------------------------------------
___gmpn_mul_1:
        push    edi
        push    esi
        push    ebx
        push    ebp
; Four registers saved: keep the PARAM_* offsets in step with esp.
%assign frame frame+16

        mov     edi, [PARAM_DST]
        mov     esi, [PARAM_SRC]
        mov     ecx, [PARAM_SIZE]
        xor     ebx, ebx                ; carry limb starts at zero
        and     ecx, 3                  ; ecx = size mod 4
        jz      .head_done              ; size is a multiple of 4

; ---- one limb per iteration, ecx = limbs left in this phase (> 0) ----
.head:
        mov     eax, [esi]
        mul     dword [PARAM_MULTIPLIER] ; edx:eax = src limb * multiplier
        lea     esi, [esi+4]
        add     eax, ebx                ; low word + incoming carry limb
        mov     ebx, 0                  ; zero without disturbing CF
        adc     edx, ebx                ; fold CF into the high word
        mov     [edi], eax
        mov     ebx, edx                ; high word is the next carry limb
        lea     edi, [edi+4]
        dec     ecx
        jnz     .head

.head_done:
        mov     ecx, [PARAM_SIZE]
        shr     ecx, 2                  ; ecx = number of 4-limb groups
        jz      .done

; ---- four limbs per iteration, ecx = groups left (> 0) ----
; Each result word is stored only after the next `mul` has been issued,
; and the carry limb ping-pongs ebx -> ebp -> ebx -> ebp -> ebx.
        align   8
.unrolled:
        mov     eax, [esi]
        mul     dword [PARAM_MULTIPLIER]
        add     ebx, eax                ; limb 0: low word + carry limb
        mov     ebp, 0
        adc     ebp, edx                ; ebp = carry limb out of limb 0

        mov     eax, [esi+4]
        mul     dword [PARAM_MULTIPLIER]
        mov     [edi], ebx              ; store limb 0
        add     ebp, eax                ; limb 1: low word + carry limb
        mov     ebx, 0
        adc     ebx, edx                ; ebx = carry limb out of limb 1

        mov     eax, [esi+8]
        mul     dword [PARAM_MULTIPLIER]
        mov     [edi+4], ebp            ; store limb 1
        add     ebx, eax                ; limb 2: low word + carry limb
        mov     ebp, 0
        adc     ebp, edx                ; ebp = carry limb out of limb 2

        mov     eax, [esi+12]
        mul     dword [PARAM_MULTIPLIER]
        mov     [edi+8], ebx            ; store limb 2
        add     ebp, eax                ; limb 3: low word + carry limb
        mov     ebx, 0
        adc     ebx, edx                ; ebx = carry limb out of limb 3

        mov     [edi+12], ebp           ; store limb 3
        lea     esi, [esi+16]
        lea     edi, [edi+16]
        dec     ecx
        jnz     .unrolled

.done:
        mov     eax, ebx                ; return the final carry limb
        pop     ebp
        pop     ebx
        pop     esi
        pop     edi
        ret

; NOTE(review): `end` is not a NASM directive; unless x86i.inc gives it a
; meaning it assembles as a bare label - confirm before removing.
end