283 lines
6.6 KiB
NASM
283 lines
6.6 KiB
NASM
dnl HP-PA __udiv_qrnnd division support, used from longlong.h.
|
|
dnl This version runs fast on pre-PA7000 CPUs.
|
|
|
|
dnl Copyright 1993, 1994, 2000, 2001, 2002 Free Software Foundation, Inc.
|
|
|
|
dnl This file is part of the GNU MP Library.
|
|
|
|
dnl The GNU MP Library is free software; you can redistribute it and/or modify
|
|
dnl it under the terms of the GNU Lesser General Public License as published
|
|
dnl by the Free Software Foundation; either version 2.1 of the License, or (at
|
|
dnl your option) any later version.
|
|
|
|
dnl The GNU MP Library is distributed in the hope that it will be useful, but
|
|
dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
|
|
dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
|
|
dnl License for more details.
|
|
|
|
dnl You should have received a copy of the GNU Lesser General Public License
|
|
dnl along with the GNU MP Library; see the file COPYING.LIB. If not, write
|
|
dnl to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
|
|
dnl Boston, MA 02110-1301, USA.
|
|
|
|
include(`../config.m4')
|
|
|
|
C INPUT PARAMETERS
|
|
C rem_ptr gr26
|
|
C n1 gr25
|
|
C n0 gr24
|
|
C d gr23
|
|
|
|
C The code size is a bit excessive. We could merge the last two ds;addc
|
|
C sequences by simply moving the "bb,< Odd" instruction down. The only
|
|
C trouble is the FFFFFFFF code that would need some hacking.
|
|
|
|
ASM_START()
|
|
PROLOGUE(mpn_udiv_qrnnd)
|
|
comb,< %r23,0,L(largedivisor)
|
|
sub %r0,%r23,%r1 C clear cy as side-effect
|
|
ds %r0,%r1,%r0
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r23,%r25
|
|
addc %r24,%r24,%r28
|
|
ds %r25,%r23,%r25
|
|
comclr,>= %r25,%r0,%r0
|
|
addl %r25,%r23,%r25
|
|
stws %r25,0(0,%r26)
|
|
bv 0(%r2)
|
|
addc %r28,%r28,%r28
|
|
|
|
LDEF(largedivisor)
|
|
extru %r24,31,1,%r19 C r19 = n0 & 1
|
|
bb,< %r23,31,L(odd)
|
|
extru %r23,30,31,%r22 C r22 = d >> 1
|
|
shd %r25,%r24,1,%r24 C r24 = new n0
|
|
extru %r25,30,31,%r25 C r25 = new n1
|
|
sub %r0,%r22,%r21
|
|
ds %r0,%r21,%r0
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
comclr,>= %r25,%r0,%r0
|
|
addl %r25,%r22,%r25
|
|
sh1addl %r25,%r19,%r25
|
|
stws %r25,0(0,%r26)
|
|
bv 0(%r2)
|
|
addc %r24,%r24,%r28
|
|
|
|
LDEF(odd)
|
|
addib,sv,n 1,%r22,L(FFFFFFFF) C r22 = (d / 2 + 1)
|
|
shd %r25,%r24,1,%r24 C r24 = new n0
|
|
extru %r25,30,31,%r25 C r25 = new n1
|
|
sub %r0,%r22,%r21
|
|
ds %r0,%r21,%r0
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r24
|
|
ds %r25,%r22,%r25
|
|
addc %r24,%r24,%r28
|
|
comclr,>= %r25,%r0,%r0
|
|
addl %r25,%r22,%r25
|
|
sh1addl %r25,%r19,%r25
|
|
C We have computed (n1,,n0) / (d + 1), q' = r28, r' = r25
|
|
add,nuv %r28,%r25,%r25
|
|
addl %r25,%r1,%r25
|
|
addc %r0,%r28,%r28
|
|
sub,<< %r25,%r23,%r0
|
|
addl %r25,%r1,%r25
|
|
stws %r25,0(0,%r26)
|
|
bv 0(%r2)
|
|
addc %r0,%r28,%r28
|
|
|
|
C This is just a special case of the code above.
|
|
C We come here when d == 0xFFFFFFFF
|
|
LDEF(FFFFFFFF)
|
|
add,uv %r25,%r24,%r24
|
|
sub,<< %r24,%r23,%r0
|
|
ldo 1(%r24),%r24
|
|
stws %r24,0(0,%r26)
|
|
bv 0(%r2)
|
|
addc %r0,%r25,%r28
|
|
EPILOGUE()
|