[BACK]Return to add_n.asm CVS log [TXT][DIR] Up to [local] / OpenXM_contrib / gmp / mpn / pa32 / hppa2_0

Annotation of OpenXM_contrib/gmp/mpn/pa32/hppa2_0/add_n.asm, Revision 1.1.1.1

1.1       ohara       1: dnl  HP-PA 2.0 32-bit mpn_add_n -- Add two limb vectors of the same length > 0
                      2: dnl  and store sum in a third limb vector.
                      3:
                      4: dnl  Copyright 1997, 1998, 2000, 2001, 2002 Free Software Foundation, Inc.
                      5:
                      6: dnl  This file is part of the GNU MP Library.
                      7:
                      8: dnl  The GNU MP Library is free software; you can redistribute it and/or modify
                      9: dnl  it under the terms of the GNU Lesser General Public License as published
                     10: dnl  by the Free Software Foundation; either version 2.1 of the License, or (at
                     11: dnl  your option) any later version.
                     12:
                     13: dnl  The GNU MP Library is distributed in the hope that it will be useful, but
                     14: dnl  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
                     15: dnl  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
                     16: dnl  License for more details.
                     17:
                     18: dnl  You should have received a copy of the GNU Lesser General Public License
                     19: dnl  along with the GNU MP Library; see the file COPYING.LIB.  If not, write to
                     20: dnl  the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
                     21: dnl  MA 02111-1307, USA.
                     22:
                     23: include(`../config.m4')
                     24:
                     25: C INPUT PARAMETERS
                     26: C res_ptr      gr26
                     27: C s1_ptr       gr25
                     28: C s2_ptr       gr24
                     29: C size         gr23
                     30:
                     31: C This runs at 2 cycles/limb on PA8000.
                     32:
                     33: ASM_START()
                     34: PROLOGUE(mpn_add_n)
                     35:        sub             %r0,%r23,%r22           C r22 = -n
                     36:        zdep            %r22,30,3,%r28          C r28 = 2 * (-n & 7)
                     37:        zdep            %r22,29,3,%r22          C r22 = 4 * (-n & 7)
                     38:        sub             %r25,%r22,%r25          C offset s1_ptr
                     39:        sub             %r24,%r22,%r24          C offset s2_ptr
                     40:        sub             %r26,%r22,%r26          C offset res_ptr
                     41:        blr             %r28,%r0                C branch into loop
                     42:        add             %r0,%r0,%r0             C reset carry (blr delay slot)
                     43: C 8 limbs per pass, 4 instructions each; blr skips the first (-n & 7) limb slots
                     44:        .label  L(loop)                         C entry when n mod 8 == 0; loop top
                     45:        ldw             0(%r25),%r20            C r20 = s1 limb
                     46:        ldw             0(%r24),%r31            C r31 = s2 limb
                     47:        addc            %r20,%r31,%r20          C sum plus carry-in; carry-out feeds next addc
                     48:        stw             %r20,0(%r26)            C store result limb
                     49:
                     50:        .label  L(7)                            C entry when n mod 8 == 7
                     51:        ldw             4(%r25),%r21
                     52:        ldw             4(%r24),%r19
                     53:        addc            %r21,%r19,%r21
                     54:        stw             %r21,4(%r26)
                     55:
                     56:        .label  L(6)                            C entry when n mod 8 == 6
                     57:        ldw             8(%r25),%r20
                     58:        ldw             8(%r24),%r31
                     59:        addc            %r20,%r31,%r20
                     60:        stw             %r20,8(%r26)
                     61:
                     62:        .label  L(5)                            C entry when n mod 8 == 5
                     63:        ldw             12(%r25),%r21
                     64:        ldw             12(%r24),%r19
                     65:        addc            %r21,%r19,%r21
                     66:        stw             %r21,12(%r26)
                     67:
                     68:        .label  L(4)                            C entry when n mod 8 == 4
                     69:        ldw             16(%r25),%r20
                     70:        ldw             16(%r24),%r31
                     71:        addc            %r20,%r31,%r20
                     72:        stw             %r20,16(%r26)
                     73:
                     74:        .label  L(3)                            C entry when n mod 8 == 3
                     75:        ldw             20(%r25),%r21
                     76:        ldw             20(%r24),%r19
                     77:        addc            %r21,%r19,%r21
                     78:        stw             %r21,20(%r26)
                     79:
                     80:        .label  L(2)                            C entry when n mod 8 == 2
                     81:        ldw             24(%r25),%r20
                     82:        ldw             24(%r24),%r31
                     83:        addc            %r20,%r31,%r20
                     84:        stw             %r20,24(%r26)
                     85:
                     86:        .label  L(1)                            C entry when n mod 8 == 1
                     87:        ldw             28(%r25),%r21
                     88:        ldo             32(%r25),%r25           C s1_ptr += 32 bytes (8 limbs)
                     89:        ldw             28(%r24),%r19
                     90:        addc            %r21,%r19,%r21
                     91:        stw             %r21,28(%r26)
                     92:        ldo             32(%r24),%r24           C s2_ptr += 32 bytes
                     93:        addib,>         -8,%r23,L(loop)         C n -= 8; loop again while n > 0
                     94:        ldo             32(%r26),%r26           C res_ptr += 32 bytes (addib delay slot)
                     95:
                     96:        bv              (%r2)                   C return: branch to address in r2
                     97:        addc            %r0,%r0,%r28            C r28 = final carry, 0 or 1 (bv delay slot)
                     98: EPILOGUE()

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>