mpir/mpn/x86i/mul_1.asm
brgladman 48248cda46 1. longlong.h change to add MSVC intrinsics
2. longlong.h rearrangement for Intel compiler
3. MSVC additions in test code
4. GMP 4.2.1 bug fixes
5. Intel format assembly code
2008-05-18 22:20:43 +00:00

108 lines
2.7 KiB
NASM

; Copyright 1992, 1994, 1997, 1998, 1999, 2000, 2001, 2002 Free Software
; Foundation, Inc.
;
; This file is part of the GNU MP Library.
;
; The GNU MP Library is free software; you can redistribute it and/or
; modify it under the terms of the GNU Lesser General Public License as
; published by the Free Software Foundation; either version 2.1 of the
; License, or (at your option) any later version.
;
; The GNU MP Library is distributed in the hope that it will be useful,
; but WITHOUT ANY WARRANTY; without even the implied warranty of
; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
; Lesser General Public License for more details.
;
; You should have received a copy of the GNU Lesser General Public
; License along with the GNU MP Library; see the file COPYING.LIB. If
; not, write to the Free Software Foundation, Inc., 59 Temple Place -
; Suite 330, Boston, MA 02111-1307, USA.
;
; Translation of AT&T syntax code by Brian Gladman
; Assembler preamble: shared include, stack-argument macros, and the
; section / symbol declarations for ___gmpn_mul_1.
%include "x86i.inc"
; Addresses of the four stack arguments, relative to esp.  `frame` is the
; number of bytes pushed since function entry; it is 0 here and is bumped
; with %assign after the register pushes in the function body.  Because a
; %define body is expanded where the macro is used, each PARAM_* reference
; picks up the value `frame` has at that point in the file.
; With frame = 0 the arguments sit at esp+4 (first) through esp+16
; (fourth), i.e. directly above the dword at [esp].
%define PARAM_MULTIPLIER esp+frame+16
%define PARAM_SIZE esp+frame+12
%define PARAM_SRC esp+frame+8
%define PARAM_DST esp+frame+4
%assign frame 0
section .text
global ___gmpn_mul_1
; The export directive is only emitted when DLL is defined.
%ifdef DLL
export ___gmpn_mul_1
%endif
; Start the code that follows on an 8-byte boundary.
align 8
;-----------------------------------------------------------------------
; ___gmpn_mul_1 -- multiply a vector of 32-bit limbs by one 32-bit limb.
;
; Stack arguments (addressed through the PARAM_* macros):
;   PARAM_DST         pointer to the destination limbs
;   PARAM_SRC         pointer to the source limbs
;   PARAM_SIZE        number of limbs to process
;   PARAM_MULTIPLIER  the 32-bit multiplier
;
; For each limb, lowest address first, forms the 64-bit value
;   src[i] * multiplier + carry
; stores its low 32 bits to dst[i] and keeps its high 32 bits as the
; carry for the next limb.  The carry starts at 0.
;
; Returns: eax = carry out of the last limb (0 if PARAM_SIZE is 0, in
;          which case nothing is stored).
; Saved and restored: edi, esi, ebx, ebp.
; Clobbered: eax, ecx, edx, flags.
; Returns with a plain `ret`; the arguments are left on the stack.
;
; Register roles:
;   esi = source pointer        edi = destination pointer
;   ecx = loop counter          edx:eax = product from `mul`
;   ebx = carry limb (ebx and ebp alternate in the unrolled loop)
;
; Structure: the first (size mod 4) limbs are handled one per iteration
; in Loop0, the remaining (size / 4) groups of four limbs in Lop.
;
; Carry handling: registers are zeroed with `mov reg,0` between an `add`
; and the following `adc` because `mov` leaves the carry flag untouched.
;-----------------------------------------------------------------------
___gmpn_mul_1:
push edi
push esi
push ebx
push ebp
; Four dwords were pushed, so the PARAM_* offsets move up by 16 bytes.
%assign frame frame+16
mov edi,[PARAM_DST]
mov esi,[PARAM_SRC]
mov ecx,[PARAM_SIZE]
xor ebx,ebx ; carry limb = 0
and ecx,3 ; ecx = size mod 4 = limbs to do singly
jz Lend0 ; size is a multiple of 4: skip the single-limb loop
; --- one limb per iteration; ebx = carry in / carry out ---
Loop0:
mov eax,[esi]
mul dword [PARAM_MULTIPLIER] ; edx:eax = src limb * multiplier
lea esi,[4+esi] ; advance source pointer (lea leaves flags alone)
add eax,ebx ; low word + carry in, sets CF on overflow
mov ebx,0 ; zero ebx without disturbing CF
adc edx,ebx ; high word += CF
mov [edi],eax
mov ebx,edx ; propagate carry into cylimb
lea edi,[4+edi] ; advance destination pointer
dec ecx
jnz Loop0
Lend0:
mov ecx,[PARAM_SIZE]
shr ecx,2 ; ecx = size / 4 = number of 4-limb groups
jz Lend ; fewer than 4 limbs in total: nothing left to do
align 8
; --- four limbs per iteration ---
; On entry to each iteration ebx holds the carry.  The carry alternates
; between ebx and ebp from limb to limb and is back in ebx at the end.
; Each result limb is stored after the `mul` for the next limb has been
; issued; `mul` only writes eax, edx and flags, so ebx/ebp are intact.
Lop:
; limb 0: result low word in ebx, new carry in ebp
mov eax,[esi]
mul dword [PARAM_MULTIPLIER]
add ebx,eax ; new lo + cylimb
mov ebp,0 ; zero ebp, CF preserved
adc ebp,edx ; ebp = high word + CF
; limb 1: result low word in ebp, new carry in ebx
mov eax,[4+esi]
mul dword [PARAM_MULTIPLIER]
mov [edi],ebx ; store limb 0 result
add ebp,eax ; new lo + cylimb
mov ebx,0 ; zero ebx, CF preserved
adc ebx,edx ; ebx = high word + CF
; limb 2: result low word in ebx, new carry in ebp
mov eax,[8+esi]
mul dword [PARAM_MULTIPLIER]
mov [4+edi],ebp ; store limb 1 result
add ebx,eax ; new lo + cylimb
mov ebp,0 ; zero ebp, CF preserved
adc ebp,edx ; ebp = high word + CF
; limb 3: result low word in ebp, new carry in ebx
mov eax,[12+esi]
mul dword [PARAM_MULTIPLIER]
mov [8+edi],ebx ; store limb 2 result
add ebp,eax ; new lo + cylimb
mov ebx,0 ; zero ebx, CF preserved
adc ebx,edx ; ebx = high word + CF = carry for the next group
mov [12+edi],ebp ; store limb 3 result
lea esi,[16+esi] ; advance both pointers by four limbs
lea edi,[16+edi]
dec ecx
jnz Lop
Lend:
mov eax,ebx ; return the final carry limb
; Restore the saved registers in reverse push order.
pop ebp
pop ebx
pop esi
pop edi
ret
; NOTE(review): NASM has no built-in `end` directive; presumably this is
; either defined by x86i.inc or assembled as a bare label -- confirm.
end