=================================================================== RCS file: /home/cvs/OpenXM_contrib/gmp/mpn/powerpc32/Attic/sub_n.asm,v retrieving revision 1.1 retrieving revision 1.1.1.2 diff -u -p -r1.1 -r1.1.1.2 --- OpenXM_contrib/gmp/mpn/powerpc32/Attic/sub_n.asm 2000/09/09 14:12:38 1.1 +++ OpenXM_contrib/gmp/mpn/powerpc32/Attic/sub_n.asm 2003/08/25 16:06:24 1.1.1.2 @@ -1,61 +1,83 @@ -dnl PowerPC-32 mpn_sub_n -- Subtract two limb vectors of the same length > 0 -dnl and store difference in a third limb vector. +dnl PowerPC 750 mpn_sub_n -- subtract limb vectors. -dnl Copyright (C) 1995, 1997, 2000 Free Software Foundation, Inc. +dnl Copyright 2002 Free Software Foundation, Inc. +dnl +dnl This file is part of the GNU MP Library. +dnl +dnl The GNU MP Library is free software; you can redistribute it and/or +dnl modify it under the terms of the GNU Lesser General Public License as +dnl published by the Free Software Foundation; either version 2.1 of the +dnl License, or (at your option) any later version. +dnl +dnl The GNU MP Library is distributed in the hope that it will be useful, +dnl but WITHOUT ANY WARRANTY; without even the implied warranty of +dnl MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +dnl Lesser General Public License for more details. +dnl +dnl You should have received a copy of the GNU Lesser General Public +dnl License along with the GNU MP Library; see the file COPYING.LIB. If +dnl not, write to the Free Software Foundation, Inc., 59 Temple Place - +dnl Suite 330, Boston, MA 02111-1307, USA. -dnl This file is part of the GNU MP Library. +include(`../config.m4') -dnl The GNU MP Library is free software; you can redistribute it and/or modify -dnl it under the terms of the GNU Lesser General Public License as published by -dnl the Free Software Foundation; either version 2.1 of the License, or (at your -dnl option) any later version. -dnl The GNU MP Library is distributed in the hope that it will be useful, but -dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY -dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public -dnl License for more details. +C cycles/limb +C 604e: 4.0 +C 750: 4.0 -dnl You should have received a copy of the GNU Lesser General Public License -dnl along with the GNU MP Library; see the file COPYING.LIB. If not, write to -dnl the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, -dnl MA 02111-1307, USA. +C mp_limb_t mpn_sub_n (mp_ptr dst, mp_srcptr src1, mp_srcptr src2, +C mp_size_t size); +C +C Same style as mpn_add_n. -dnl INPUT PARAMETERS -dnl res_ptr r3 -dnl s1_ptr r4 -dnl s2_ptr r5 -dnl size r6 - -include(`../config.m4') - ASM_START() PROLOGUE(mpn_sub_n) - mtctr r6 C copy size into CTR - addic r0,r6,-1 C set cy - lwz r8,0(r4) C load least significant s1 limb - lwz r0,0(r5) C load least significant s2 limb - addi r3,r3,-4 C offset res_ptr, it's updated before it's used - bdz .Lend C If done, skip loop -.Loop: lwz r9,4(r4) C load s1 limb - lwz r10,4(r5) C load s2 limb - subfe r7,r0,r8 C subtract limbs with cy, set cy - stw r7,4(r3) C store result limb - bdz .Lexit C decrement CTR and exit if done - lwzu r8,8(r4) C load s1 limb and update s1_ptr - lwzu r0,8(r5) C load s2 limb and update s2_ptr - subfe r7,r10,r9 C subtract limbs with cy, set cy - stwu r7,8(r3) C store result limb and update res_ptr - bdnz .Loop C decrement CTR and loop back -.Lend: subfe r7,r0,r8 - stw r7,4(r3) C store ultimate result limb - subfe r3,r0,r0 C load !cy into ... - subfic r3,r3,0 C ... return value register + C r3 wp + C r4 xp + C r5 yp + C r6 size + + mtctr r6 C size + lwz r6, 0(r4) C xp[0] + + lwz r7, 0(r5) C yp[0] + sub r4, r4, r3 C xp-wp + + sub r5, r5, r3 C yp-wp + addi r4, r4, 4 C xp-wp-4 + + addi r5, r5, 4 C yp-wp-4 + subfc r6, r7, r6 + + stw r6, 0(r3) C wp[0] + bdz L(done) + + +L(top): + C r3 wp, incrementing + C r4 xp-wp+4 + C r5 yp-wp+4 + C r6 scratch + C r7 scratch + + lwzx r6, r4,r3 C xp[i] + + lwzx r7, r5,r3 C yp[i] + + C serialize + subfe r6, r7, r6 + + stwu r6, 4(r3) C wp[i] + bdnz L(top) + + +L(done): + subfe r3, r0, r0 C 0 or -1 + + subfic r3, r3, 0 C 0 or 1 blr -.Lexit: subfe r7,r10,r9 - stw r7,8(r3) - subfe r3,r0,r0 C load !cy into ... - subfic r3,r3,0 C ... return value register - blr -EPILOGUE(mpn_sub_n) + +EPILOGUE()