[BACK]Return to lshift.asm CVS log [TXT][DIR] Up to [local] / OpenXM_contrib / gmp / mpn / powerpc64

Annotation of OpenXM_contrib/gmp/mpn/powerpc64/lshift.asm, Revision 1.1

1.1     ! maekawa     1: #  PowerPC-64 mpn_lshift -- Shift a number left.
        !             2:
        !             3: # Copyright (C) 1999, 2000 Free Software Foundation, Inc.
        !             4:
        !             5: # This file is part of the GNU MP Library.
        !             6:
        !             7: # The GNU MP Library is free software; you can redistribute it and/or modify
        !             8: # it under the terms of the GNU Lesser General Public License as published by
        !             9: # the Free Software Foundation; either version 2.1 of the License, or (at your
        !            10: # option) any later version.
        !            11:
        !            12: # The GNU MP Library is distributed in the hope that it will be useful, but
        !            13: # WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
        !            14: # or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
        !            15: # License for more details.
        !            16:
        !            17: # You should have received a copy of the GNU Lesser General Public License
        !            18: # along with the GNU MP Library; see the file COPYING.LIB.  If not, write to
        !            19: # the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
        !            20: # MA 02111-1307, USA.
        !            21:
        !            22:
        !            23: # INPUT PARAMETERS
        !            24: # res_ptr      r3
        !            25: # s1_ptr       r4
        !            26: # size         r5
        !            27: # cnt          r6
        !            28:
        !            29: include(`../config.m4')
        !            30:
        !            31: ASM_START()
        !            32: PROLOGUE(mpn_lshift)
        !            33:        cmpdi   cr0,r5,20       # more than 20 limbs?
        !            34:        sldi    r0,r5,3         # r0 = size * 8 (operand length in bytes)
        !            35:        add     r4,r4,r0        # make r4 point at end of s1
        !            36:        add     r7,r3,r0        # make r7 point at end of res
        !            37:        bgt     .LBIG           # branch if more than 20 limbs
        !            38:
        !            39:        mtctr   r5              # copy size into CTR
        !            40:        subfic  r8,r6,64        # r8 = 64 - cnt (complementary shift count)
        !            41:        ldu     r11,-8(r4)      # load first s1 limb
        !            42:        srd     r3,r11,r8       # compute function return value
        !            43:        bdz     .Lend1          # size == 1: only the final store remains
        !            44:
        !            45: .Loop: ldu     r10,-8(r4)      # load next lower limb into r10
        !            46:        sld     r9,r11,r6       # high part: previous limb << cnt
        !            47:        srd     r12,r10,r8      # low part: new limb >> (64 - cnt)
        !            48:        or      r9,r9,r12       # combine into one result limb
        !            49:        stdu    r9,-8(r7)       # store it, stepping res pointer down
        !            50:        bdz     .Lend2          # no limbs left; last limb is in r10
        !            51:        ldu     r11,-8(r4)      # same step again with r10/r11 roles swapped
        !            52:        sld     r9,r10,r6
        !            53:        srd     r12,r11,r8
        !            54:        or      r9,r9,r12
        !            55:        stdu    r9,-8(r7)
        !            56:        bdnz    .Loop           # continue while limbs remain; else last limb is in r11
        !            57:
        !            58: .Lend1:        sld     r0,r11,r6       # lowest result limb = last limb (r11) << cnt
        !            59:        std     r0,-8(r7)
        !            60:        blr                     # return; r3 holds the return value
        !            61: .Lend2:        sld     r0,r10,r6       # lowest result limb = last limb (r10) << cnt
        !            62:        std     r0,-8(r7)
        !            63:        blr                     # return; r3 holds the return value
        !            64:
        !            65: .LBIG:
        !            66:        std     r24,-64(1)      # save r24-r31 below register 1; no frame is allocated
        !            67:        std     r25,-56(1)      # NOTE(review): relies on the target ABI permitting
        !            68:        std     r26,-48(1)      # stores below the stack pointer -- confirm
        !            69:        std     r27,-40(1)
        !            70:        std     r28,-32(1)
        !            71:        std     r29,-24(1)
        !            72:        std     r30,-16(1)
        !            73:        std     r31,-8(1)
        !            74:        ldu     r9,-8(r4)       # load first (highest-addressed) s1 limb
        !            75:        subfic  r8,r6,64        # r8 = 64 - cnt (complementary shift count)
        !            76:        srd     r3,r9,r8        # compute function return value
        !            77:        sld     r0,r9,r6        # r0 = pending high part for the next result limb
        !            78:        addi    r5,r5,-1        # r5 = limbs still to be loaded (size - 1)
        !            79:
        !            80:        andi.   r10,r5,3        # count for spill loop
        !            81:        beq     .Le             # remaining count is a multiple of 4: no spill limbs
        !            82:        mtctr   r10
        !            83:        ldu     r28,-8(r4)      # load first spill limb
        !            84:        bdz     .Lxe0           # exactly one spill limb
        !            85:
        !            86: .Loop0:        sld     r12,r28,r6      # next pending high part
        !            87:        srd     r24,r28,r8      # low part for the current result limb
        !            88:        ldu     r28,-8(r4)      # load next spill limb
        !            89:        or      r24,r0,r24      # merge with pending high part
        !            90:        stdu    r24,-8(r7)
        !            91:        mr      r0,r12          # carry high part forward
        !            92:        bdnz    .Loop0          # taken at most once!
        !            93:
        !            94: .Lxe0: sld     r12,r28,r6      # handle the last spill limb (no further load)
        !            95:        srd     r24,r28,r8
        !            96:        or      r24,r0,r24
        !            97:        stdu    r24,-8(r7)
        !            98:        mr      r0,r12          # r0 = pending high part entering the unrolled code
        !            99:
        !           100: .Le:   srdi    r5,r5,2         # count for unrolled loop
        !           101:        addi    r5,r5,-1        # last group of four is finished after the loop
        !           102:        mtctr   r5
        !           103:        ld      r28,-8(r4)      # preload four limbs into r28-r31
        !           104:        ld      r29,-16(r4)
        !           105:        ld      r30,-24(r4)
        !           106:        ldu     r31,-32(r4)     # update form: r4 steps down by 32 bytes
        !           107:
        !           108: .LoopU:        sld     r9,r28,r6       # per limb: sld = high part passed to next result limb,
        !           109:        srd     r24,r28,r8      # srd = low part of current result limb,
        !           110:        ld      r28,-8(r4)      # then reload the register for the next iteration
        !           111:        sld     r10,r29,r6
        !           112:        srd     r25,r29,r8
        !           113:        ld      r29,-16(r4)
        !           114:        sld     r11,r30,r6
        !           115:        srd     r26,r30,r8
        !           116:        ld      r30,-24(r4)
        !           117:        sld     r12,r31,r6
        !           118:        srd     r27,r31,r8
        !           119:        ldu     r31,-32(r4)     # update form: r4 steps down by 32 bytes
        !           120:        or      r24,r0,r24      # r0 = high part carried in from the previous limb
        !           121:        std     r24,-8(r7)
        !           122:        or      r25,r9,r25
        !           123:        std     r25,-16(r7)
        !           124:        or      r26,r10,r26
        !           125:        std     r26,-24(r7)
        !           126:        or      r27,r11,r27
        !           127:        stdu    r27,-32(r7)     # update form: r7 steps down by 32 bytes
        !           128:        mr      r0,r12          # carry high part into the next group
        !           129:        bdnz    .LoopU
        !           130:
        !           131:        sld     r9,r28,r6       # wind-down: same as the loop body for the four
        !           132:        srd     r24,r28,r8      # limbs already in r28-r31, with no further loads
        !           133:        sld     r10,r29,r6
        !           134:        srd     r25,r29,r8
        !           135:        sld     r11,r30,r6
        !           136:        srd     r26,r30,r8
        !           137:        sld     r12,r31,r6
        !           138:        srd     r27,r31,r8
        !           139:        or      r24,r0,r24
        !           140:        std     r24,-8(r7)
        !           141:        or      r25,r9,r25
        !           142:        std     r25,-16(r7)
        !           143:        or      r26,r10,r26
        !           144:        std     r26,-24(r7)
        !           145:        or      r27,r11,r27
        !           146:        stdu    r27,-32(r7)
        !           147:        mr      r0,r12
        !           148:
        !           149:        std     r0,-8(r7)       # final result limb = last loaded limb << cnt
        !           150:        ld      r24,-64(1)      # restore r24-r31 saved at .LBIG
        !           151:        ld      r25,-56(1)
        !           152:        ld      r26,-48(1)
        !           153:        ld      r27,-40(1)
        !           154:        ld      r28,-32(1)
        !           155:        ld      r29,-24(1)
        !           156:        ld      r30,-16(1)
        !           157:        ld      r31,-8(1)
        !           158:        blr                     # return; r3 holds the return value
        !           159: EPILOGUE(mpn_lshift)

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>