177 lines
4.3 KiB
NASM
177 lines
4.3 KiB
NASM
|
|
; Copyright 1996, 1997, 1998, 1999, 2000, 2001, 2002 Free Software
|
|
; Foundation, Inc.
|
|
;
|
|
; This file is part of the GNU MP Library.
|
|
;
|
|
; The GNU MP Library is free software; you can redistribute it and/or
|
|
; modify it under the terms of the GNU Lesser General Public License as
|
|
; published by the Free Software Foundation; either version 2.1 of the
|
|
; License, or (at your option) any later version.
|
|
;
|
|
; The GNU MP Library is distributed in the hope that it will be useful,
|
|
; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
; Lesser General Public License for more details.
|
|
;
|
|
; You should have received a copy of the GNU Lesser General Public
|
|
; License along with the GNU MP Library; see the file COPYING.LIB. If
|
|
; not, write to the Free Software Foundation, Inc., 59 Temple Place -
|
|
; Suite 330, Boston, MA 02111-1307, USA.
|
|
;
|
|
; Translation of AT&T syntax code by Brian Gladman
|
|
|
|
%include "x86i.inc"
|
|
|
|
|
|
%define VAR_STACK_SPACE 8
|
|
%define PARAM_YSIZE esp+frame+20
|
|
%define PARAM_YP esp+frame+16
|
|
%define PARAM_XSIZE esp+frame+12
|
|
%define PARAM_XP esp+frame+8
|
|
%define PARAM_WP esp+frame+4
|
|
%define VAR_MULTIPLIER esp+frame-4
|
|
%define VAR_COUNTER esp+frame-8
|
|
|
|
section .text
|
|
|
|
global ___gmpn_mul_basecase
|
|
%ifdef DLL
|
|
export ___gmpn_mul_basecase
|
|
%endif
|
|
|
|
align 8
|
|
___gmpn_mul_basecase:
|
|
sub esp,VAR_STACK_SPACE
|
|
push esi
|
|
push ebp
|
|
push edi
|
|
%assign frame VAR_STACK_SPACE+12
|
|
mov esi,[PARAM_XP]
|
|
mov edi,[PARAM_WP]
|
|
mov ebp,[PARAM_YP]
|
|
mov eax,[esi] ; load xp[0]
|
|
mul dword [ebp] ; multiply by yp[0]
|
|
mov [edi],eax ; store to wp[0]
|
|
mov ecx,[PARAM_XSIZE] ; xsize
|
|
dec ecx ; If xsize = 1,ysize = 1 too
|
|
jz Ldone
|
|
FR_push ebx
|
|
mov ebx,edx
|
|
lea esi,[4+esi]
|
|
lea edi,[4+edi]
|
|
LoopM:
|
|
mov eax,[esi] ; load next limb at xp[j]
|
|
lea esi,[4+esi]
|
|
mul dword [ebp]
|
|
add eax,ebx
|
|
mov ebx,edx
|
|
adc ebx,0
|
|
mov [edi],eax
|
|
lea edi,[4+edi]
|
|
dec ecx
|
|
jnz LoopM
|
|
mov [edi],ebx ; most significant limb of product
|
|
add edi,4 ; increment wp
|
|
mov eax,[PARAM_XSIZE]
|
|
shl eax,2
|
|
sub edi,eax
|
|
sub esi,eax
|
|
mov eax,[PARAM_YSIZE] ; ysize
|
|
dec eax
|
|
jz Lskip
|
|
mov [VAR_COUNTER],eax ; set index i to ysize
|
|
Louter:
|
|
mov ebp,[PARAM_YP] ; yp
|
|
add ebp,4 ; make ebp point to next v limb
|
|
mov [PARAM_YP],ebp
|
|
mov eax,[ebp] ; copy y limb ...
|
|
mov [VAR_MULTIPLIER],eax ; ... to stack slot
|
|
mov ecx,[PARAM_XSIZE]
|
|
xor ebx,ebx
|
|
and ecx,3
|
|
jz Lend0
|
|
Loop0:
|
|
mov eax,[esi]
|
|
mul dword [VAR_MULTIPLIER]
|
|
lea esi,[4+esi]
|
|
add eax,ebx
|
|
mov ebx,0
|
|
adc edx,ebx
|
|
add [edi],eax
|
|
adc ebx,edx ; propagate carry into cylimb
|
|
lea edi,[4+edi]
|
|
dec ecx
|
|
jnz Loop0
|
|
Lend0:
|
|
mov ecx,[PARAM_XSIZE]
|
|
shr ecx,2
|
|
jz LendX
|
|
|
|
align 8
|
|
LoopX:
|
|
mov eax,[esi]
|
|
mul dword [VAR_MULTIPLIER]
|
|
add ebx,eax
|
|
mov ebp,0
|
|
adc ebp,edx
|
|
|
|
mov eax,[4+esi]
|
|
mul dword [VAR_MULTIPLIER]
|
|
add [edi],ebx
|
|
adc ebp,eax ; new lo + cylimb
|
|
mov ebx,0
|
|
adc ebx,edx
|
|
|
|
mov eax,[8+esi]
|
|
mul dword [VAR_MULTIPLIER]
|
|
add [4+edi],ebp
|
|
adc ebx,eax ; new lo + cylimb
|
|
mov ebp,0
|
|
adc ebp,edx
|
|
|
|
mov eax,[12+esi]
|
|
mul dword [VAR_MULTIPLIER]
|
|
add [8+edi],ebx
|
|
adc ebp,eax ; new lo + cylimb
|
|
mov ebx,0
|
|
adc ebx,edx
|
|
|
|
add [12+edi],ebp
|
|
adc ebx,0 ; propagate carry into cylimb
|
|
|
|
lea esi,[16+esi]
|
|
lea edi,[16+edi]
|
|
dec ecx
|
|
jnz LoopX
|
|
LendX:
|
|
mov [edi],ebx
|
|
add edi,4
|
|
|
|
; we incremented wp and xp in the loop above; compensate
|
|
mov eax,[PARAM_XSIZE]
|
|
shl eax,2
|
|
sub edi,eax
|
|
sub esi,eax
|
|
|
|
mov eax,[VAR_COUNTER]
|
|
dec eax
|
|
mov [VAR_COUNTER],eax
|
|
jnz Louter
|
|
Lskip:
|
|
pop ebx
|
|
pop edi
|
|
pop ebp
|
|
pop esi
|
|
add esp,8
|
|
ret
|
|
Ldone:
|
|
mov [4+edi],edx ; store to wp[1]
|
|
pop edi
|
|
pop ebp
|
|
pop esi
|
|
add esp,8
|
|
ret
|
|
|
|
end
|