mpir/mpn/x86w/divexact_by3c.asm
2010-08-13 13:18:45 +00:00

89 lines
2.3 KiB
NASM

; Copyright 2000, 2001, 2002 Free Software Foundation, Inc.
;
; This file is part of the GNU MP Library.
;
; The GNU MP Library is free software; you can redistribute it and/or
; modify it under the terms of the GNU Lesser General Public License as
; published by the Free Software Foundation; either version 2.1 of the
; License, or (at your option) any later version.
;
; The GNU MP Library is distributed in the hope that it will be useful,
; but WITHOUT ANY WARRANTY; without even the implied warranty of
; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
; Lesser General Public License for more details.
;
; You should have received a copy of the GNU Lesser General Public
; License along with the GNU MP Library; see the file COPYING.LIB. If
; not, write to the Free Software Foundation, Inc., 59 Temple Place -
; Suite 330, Boston, MA 02111-1307, USA.
;
; Translation of AT&T syntax code by Brian Gladman
%include "x86i.inc"
; Stack-argument addresses, expressed relative to the current esp.
; With frame = 0 (the state at function entry) the four arguments sit at
; esp+4 .. esp+16 in the order dst, src, size, carry.
;
; These are %define (not %xdefine) macros, so `frame` is substituted each
; time a PARAM_* name is used rather than when it is defined; that is why
; they can appear before `frame` is first assigned below.
; NOTE(review): FR_push is not defined in this file (presumably it comes
; from x86i.inc); it is presumably what adds 4 to `frame` for every
; register pushed, keeping these offsets valid after pushes -- confirm.
%define PARAM_CARRY esp+frame+16
%define PARAM_SIZE esp+frame+12
%define PARAM_SRC esp+frame+8
%define PARAM_DST esp+frame+4
%assign frame 0
; INVERSE_3: multiplicative inverse of 3 modulo 2^32
;   (3 * 0xAAAAAAAB = 0x200000001, which is 1 modulo 2^32).
; ONE_THIRD_CEIL, TWO_THIRDS_CEIL: ceil(b/3) and ceil(2*b/3) where b = 2^32.
;   TWO_THIRDS_CEIL has the same numeric value as INVERSE_3; the two names
;   are kept separate because they play different roles.
%define INVERSE_3 0xAAAAAAAB
%define ONE_THIRD_CEIL 0x55555556
%define TWO_THIRDS_CEIL 0xAAAAAAAB
section .text
        global  ___gmpn_divexact_by3c
%ifdef DLL
        export  ___gmpn_divexact_by3c
%endif

;-----------------------------------------------------------------------
; ___gmpn_divexact_by3c
;
; 32-bit x86, arguments on the stack (read through the PARAM_* macros):
;   dst, src, size, carry
;
; Walks `size` 32-bit limbs from the lowest address upwards.  For each
; limb:
;   t      = src[i] - carry            (borrow noted)
;   q      = low 32 bits of t * INVERSE_3
;   dst[i] = q
;   carry  = borrow + (q >= ONE_THIRD_CEIL) + (q >= TWO_THIRDS_CEIL)
;
; Out:    eax = carry left after the last limb
; Saved:  ebx, esi, edi, ebp (pushed on entry, popped before ret)
; Clobb:  ecx, edx, flags
;
; The loop is bottom-tested, so size = 0 is not handled; callers must
; pass size >= 1.
;
; Register roles inside the loop:
;   eax  scratch / low half of the product
;   ebx  running carry (small value; only bl is written by setc)
;   ecx  &src[size]
;   edx  high half of the product (unused)
;   esi  INVERSE_3
;   edi  &dst[size]
;   ebp  negative limb index, counts up to zero
;-----------------------------------------------------------------------
        align   8
___gmpn_divexact_by3c:
        ; Save the registers this routine must hand back unchanged.
        FR_push ebp
        FR_push edi
        FR_push esi
        FR_push ebx

        ; Fetch the arguments (offsets follow the current `frame`).
        mov     ebp, [PARAM_SIZE]
        mov     ecx, [PARAM_SRC]
        mov     edi, [PARAM_DST]
        mov     ebx, [PARAM_CARRY]
        mov     esi, INVERSE_3

        ; Point both bases one past the end and index with -size .. -1.
        lea     ecx, [ecx+ebp*4]
        lea     edi, [edi+ebp*4]
        neg     ebp

        align   8
.top:
        mov     eax, [ecx+ebp*4]        ; eax = src[i]
        sub     eax, ebx                ; subtract incoming carry
        setc    bl                      ; bl = borrow out of that subtract
        imul    esi                     ; edx:eax = eax * INVERSE_3
        mov     [edi+ebp*4], eax        ; dst[i] = low half (flags untouched)

        cmp     eax, ONE_THIRD_CEIL     ; CF set when eax is below ceil(b/3)
        sbb     ebx, -1                 ; ebx += 1 unless CF was set
        cmp     eax, TWO_THIRDS_CEIL    ; CF set when eax is below ceil(b*2/3)
        sbb     ebx, -1                 ; ebx += 1 unless CF was set

        inc     ebp                     ; next limb; ZF set after the last one
        jnz     .top

        mov     eax, ebx                ; return the final carry
        pop     ebx
        pop     esi
        pop     edi
        pop     ebp
        ret
end