mpir/mpn/x86i/pentium4/sse2/sub_n.asm
brgladman 48248cda46 1. longlong.h change to add MSVC intrinsics
2. longlong.h rearrangement for Intel compiler
3. MSVC additions in test  code 
4. GMP 4.2.1 bug fixes
5. Intel format assembly code
2008-05-18 22:20:43 +00:00

83 lines
1.9 KiB
NASM

; Copyright 2001, 2002 Free Software Foundation, Inc.
;
; This file is part of the GNU MP Library.
;
; The GNU MP Library is free software; you can redistribute it and/or
; modify it under the terms of the GNU Lesser General Public License as
; published by the Free Software Foundation; either version 2.1 of the
; License, or (at your option) any later version.
;
; The GNU MP Library is distributed in the hope that it will be useful,
; but WITHOUT ANY WARRANTY; without even the implied warranty of
; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
; Lesser General Public License for more details.
;
; You should have received a copy of the GNU Lesser General Public
; License along with the GNU MP Library; see the file COPYING.LIB. If
; not, write to the Free Software Foundation, Inc., 59 Temple Place -
; Suite 330, Boston, MA 02111-1307, USA.
;
; Translation of AT&T syntax code by Brian Gladman
section .text
global ___gmpn_sub_nc
global ___gmpn_sub_n
%ifdef DLL
export ___gmpn_sub_nc
export ___gmpn_sub_n
%endif
align 8
___gmpn_sub_nc:
movd mm0,[20+esp]
jmp start_nc
align 8
___gmpn_sub_n:
pxor mm0,mm0
start_nc:
mov eax,[8+esp]
mov [8+esp],ebx
mov ebx,[12+esp]
mov edx,[4+esp]
mov ecx,[16+esp]
lea eax,[eax+ecx*4]
lea ebx,[ebx+ecx*4]
lea edx,[edx+ecx*4]
neg ecx
top:
movd mm1,[eax+ecx*4]
movd mm2,[ebx+ecx*4]
psubq mm1,mm2
psubq mm1,mm0
movd [edx+ecx*4],mm1
psrlq mm1,63
add ecx,1
jz done_mm1
movd mm0,[eax+ecx*4]
movd mm2,[ebx+ecx*4]
psubq mm0,mm2
psubq mm0,mm1
movd [edx+ecx*4],mm0
psrlq mm0,63
add ecx,1
jnz top
movd eax,mm0
mov ebx,[8+esp]
emms
ret
done_mm1:
movd eax,mm1
mov ebx,[8+esp]
emms
ret
end