[BACK]Return to add_n.s CVS log [TXT][DIR] Up to [local] / OpenXM_contrib / gmp / mpn / a29k

Annotation of OpenXM_contrib/gmp/mpn/a29k/add_n.s, Revision 1.1.1.2

1.1.1.2 ! maekawa     1: ; 29000 __gmpn_add -- Add two limb vectors of the same length > 0 and store
1.1       maekawa     2: ; sum in a third limb vector.
                      3:
1.1.1.2 ! maekawa     4: ; Copyright (C) 1992, 1994, 2000 Free Software Foundation, Inc.
1.1       maekawa     5:
                      6: ; This file is part of the GNU MP Library.
                      7:
                      8: ; The GNU MP Library is free software; you can redistribute it and/or modify
1.1.1.2 ! maekawa     9: ; it under the terms of the GNU Lesser General Public License as published by
        !            10: ; the Free Software Foundation; either version 2.1 of the License, or (at your
1.1       maekawa    11: ; option) any later version.
                     12:
                     13: ; The GNU MP Library is distributed in the hope that it will be useful, but
                     14: ; WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
1.1.1.2 ! maekawa    15: ; or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
1.1       maekawa    16: ; License for more details.
                     17:
1.1.1.2 ! maekawa    18: ; You should have received a copy of the GNU Lesser General Public License
1.1       maekawa    19: ; along with the GNU MP Library; see the file COPYING.LIB.  If not, write to
                     20: ; the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
                     21: ; MA 02111-1307, USA.
                     22:
                     23:
                     24: ; INPUT PARAMETERS
                     25: ; res_ptr      lr2
                     26: ; s1_ptr       lr3
                     27: ; s2_ptr       lr4
                     28: ; size         lr5
                     29:
                     30: ; We use the loadm/storem instructions and operate on chunks of 8
                     31: ; limbs/per iteration, until less than 8 limbs remain.
                     32:
                     33: ; The 29k has no addition or subtraction instructions that doesn't
                     34: ; affect carry, so we need to save and restore that as soon as we
                     35: ; adjust the pointers.  gr116 is used for this purpose.  Note that
                     36: ; gr116==0 means that carry should be set.
                     37:
                     38:        .sect .lit,lit
                     39:        .text
                     40:        .align  4
1.1.1.2 ! maekawa    41:        .global ___gmpn_add_n
1.1       maekawa    42:        .word   0x60000
1.1.1.2 ! maekawa    43: ___gmpn_add_n:
1.1       maekawa    44:        srl     gr117,lr5,3
                     45:        sub     gr118,gr117,1
                     46:        jmpt    gr118,Ltail
                     47:         constn gr116,-1                ; init cy reg
                     48:        sub     gr117,gr117,2           ; count for jmpfdec
                     49:
                     50: ; Main loop working 8 limbs/iteration.
                     51: Loop:  mtsrim  cr,(8-1)
                     52:        loadm   0,0,gr96,lr3
                     53:        add     lr3,lr3,32
                     54:        mtsrim  cr,(8-1)
                     55:        loadm   0,0,gr104,lr4
                     56:        add     lr4,lr4,32
                     57:
                     58:        subr    gr116,gr116,0           ; restore carry
                     59:        addc    gr96,gr96,gr104
                     60:        addc    gr97,gr97,gr105
                     61:        addc    gr98,gr98,gr106
                     62:        addc    gr99,gr99,gr107
                     63:        addc    gr100,gr100,gr108
                     64:        addc    gr101,gr101,gr109
                     65:        addc    gr102,gr102,gr110
                     66:        addc    gr103,gr103,gr111
                     67:        subc    gr116,gr116,gr116       ; gr116 = not(cy)
                     68:
                     69:        mtsrim  cr,(8-1)
                     70:        storem  0,0,gr96,lr2
                     71:        jmpfdec gr117,Loop
                     72:         add    lr2,lr2,32
                     73:
                     74: ; Code for the last up-to-7 limbs.
                     75: ; This code might look very strange, but it's hard to write it
                     76: ; differently without major slowdown.
                     77:
                     78:        and     lr5,lr5,(8-1)
                     79: Ltail: sub     gr118,lr5,1             ; count for CR
                     80:        jmpt    gr118,Lend
                     81:         sub    gr117,lr5,2             ; count for jmpfdec
                     82:
                     83:        mtsr    cr,gr118
                     84:        loadm   0,0,gr96,lr3
                     85:        mtsr    cr,gr118
                     86:        loadm   0,0,gr104,lr4
                     87:
                     88:        subr    gr116,gr116,0           ; restore carry
                     89:
                     90:        jmpfdec gr117,L1
                     91:         addc   gr96,gr96,gr104
                     92:        jmp     Lstore
                     93:         mtsr   cr,gr118
                     94: L1:    jmpfdec gr117,L2
                     95:         addc   gr97,gr97,gr105
                     96:        jmp     Lstore
                     97:         mtsr   cr,gr118
                     98: L2:    jmpfdec gr117,L3
                     99:         addc   gr98,gr98,gr106
                    100:        jmp     Lstore
                    101:         mtsr   cr,gr118
                    102: L3:    jmpfdec gr117,L4
                    103:         addc   gr99,gr99,gr107
                    104:        jmp     Lstore
                    105:         mtsr   cr,gr118
                    106: L4:    jmpfdec gr117,L5
                    107:         addc   gr100,gr100,gr108
                    108:        jmp     Lstore
                    109:         mtsr   cr,gr118
                    110: L5:    jmpfdec gr117,L6
                    111:         addc   gr101,gr101,gr109
                    112:        jmp     Lstore
                    113:         mtsr   cr,gr118
                    114: L6:    addc    gr102,gr102,gr110
                    115:
                    116: Lstore:        storem  0,0,gr96,lr2
                    117:        subc    gr116,gr116,gr116       ; gr116 = not(cy)
                    118:
                    119: Lend:  jmpi    lr0
                    120:         add    gr96,gr116,1

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>