/* $Id: level0_sparcv8_super.S,v 1.2 2000/11/03 21:00:27 karim Exp $
Copyright (C) 2000 The PARI group.
This file is part of the PARI/GP package.
PARI/GP is free software; you can redistribute it and/or modify it under the
terms of the GNU General Public License as published by the Free Software
Foundation. It is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY WHATSOEVER.
Check the License for details. You should have received a copy of it, along
with the package; see the file 'COPYING'. If not, write to the Free Software
Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
/* This file defines some "level 0" kernel functions for SPARC V8 */
/* These are optimised for SuperSparc */
/* The following symbols are defined in this file : */
/* divll bfffo (& tabshi) */
/* divll uses hiremainder, so its code differs depending on whether */
/* hiremainder is inline or not */
/* If libpari.so is compiled with gcc, you should compile all */
/* files with gcc */
/* C(name): spell a C-visible symbol the way the target toolchain expects. */
/* sun and NeXT builds put an underscore in front of the name, linux uses */
/* the bare name. With __STDC__ the underscore is glued on with the paste */
/* operator; otherwise an empty comment sits between the two parts, */
/* presumably relying on pre-ANSI preprocessors deleting it. */
/* NOTE(review): no definition is provided for any other platform. */
#if defined(sun) || defined(NeXT)
# ifdef __STDC__
# define C(entrypoint) _##entrypoint
# else
# define C(entrypoint) _/**/entrypoint
# endif
#elif defined(linux)
# define C(entrypoint) entrypoint
#endif
/* GLOBL: the directive used below to export symbols; it is spelled */
/* .global for sun and linux and .globl for NeXT. */
#if defined(sun) || defined(linux)
# define GLOBL .global
#elif defined(NeXT)
# define GLOBL .globl
#endif
/* tabshi: lookup table of 16 words, indexed by a 4-bit value. */
/* Entry i is the number of leading zero bits of i seen as a 4-bit */
/* quantity (entry 0 is 4, entries 8 to 15 are 0). bfffo reads it with */
/* an index scaled by 4 bytes. The same 16 values are emitted in both */
/* branches; only the directives differ. */
/* NOTE(review): the two branches pass different operands to .align, */
/* presumably because the assemblers interpret the operand differently */
/* (byte count versus power of two) - confirm. */
#if defined(sun) || defined(linux)
.seg "data"
.align 4
C(tabshi): .word 4,3,2,2,1,1,1,1,0,0,0,0,0,0,0,0
.seg "text" /* the code that follows goes into the text segment */
#elif defined(NeXT)
.data
.align 3
C(tabshi):
.long 4
.long 3
.long 2
.long 2
.long 1
.long 1
.long 1
.long 1
.long 0
.long 0
.long 0
.long 0
.long 0
.long 0
.long 0
.long 0
.text /* the code that follows goes into the text section */
.align 2
#endif
/* Export the two entry points defined in this file. */
GLOBL C(bfffo),C(divll)
/* bfffo(x): count the leading zero bits of the 32-bit word in %o0. */
/* In:  %o0 = x */
/* Out: %o0 = number of leading zero bits (32 when x is 0) */
/* Uses %o1 (running count), %o2, %o3 and the integer condition codes. */
/* Leaf routine: it returns with retl and allocates no register window. */
/* Method: reduce x to its highest non-zero nibble by conditional shifts */
/* of 16, 8 and 4 bits, lowering the count each time, then add the */
/* per-nibble count read from tabshi. */
/* The instruction after each branch is a delay slot; none of the */
/* branches here is annulled, so those instructions always execute. */
C(bfffo): sethi %hi(65535),%o2
or %o2,%lo(65535),%o2 /* %o2 = 0xffff */
cmp %o0,%o2
bleu 1f /* x fits in 16 bits: keep x as it is */
mov 28,%o1 /* delay slot: count = 28 (16 + 8 + 4) */
mov 12,%o1 /* upper half is non-zero: count = 28 - 16 */
srl %o0,16,%o0 /* and continue with the upper half */
1: cmp %o0,255
bleu 2f /* value fits in 8 bits */
cmp %o0,15 /* delay slot: flags for the branch at 2 when taken */
add %o1,-8,%o1 /* upper byte is non-zero: count -= 8 */
srl %o0,8,%o0
cmp %o0,15 /* redo the nibble test on the shifted value */
2: bleu 3f /* value fits in 4 bits */
sethi %hi(C(tabshi)),%o2 /* delay slot: high part of the table address */
add %o1,-4,%o1 /* upper nibble is non-zero: count -= 4 */
srl %o0,4,%o0
3: or %o2,%lo(C(tabshi)),%o2 /* %o2 = address of tabshi */
sll %o0,2,%o3 /* byte offset of the entry: nibble * 4 */
ld [%o3+%o2],%o0 /* %o0 = leading zeros within the nibble */
retl
add %o1,%o0,%o0 /* delay slot: result = count + table entry */
/* Access to hiremainder, which divll reads as the high dividend word */
/* and writes as the remainder. */
/* With __GNUC__: the value is copied from and to register %g5, and */
/* LOAD_Hi expands to nothing. */
/* NOTE(review): presumably the C side keeps hiremainder in %g5 when */
/* built with gcc - confirm against the C headers. */
/* Otherwise: hiremainder is the memory word C(hiremainder). LOAD_HI puts */
/* the high part of its address in %o4 (its argument is unused), LOAD_Hi */
/* loads the word into X, and SAVE_HI stores X through %o4. %o4 must */
/* therefore stay untouched between LOAD_HI and SAVE_HI. */
#ifdef __GNUC__
#define SAVE_HI(X) mov X,%g5
#define LOAD_HI(X) mov %g5,X
#define LOAD_Hi(X)
#else
#define SAVE_HI(X) st X,[%o4+%lo(C(hiremainder))]
#define LOAD_HI(X) sethi %hi(C(hiremainder)),%o4
#define LOAD_Hi(X) ld [%o4+%lo(C(hiremainder))],X
#endif
/* divll(x, y): divide the two-word value hiremainder:x by y. */
/* In:  %o0 = x (low dividend word), %o1 = y (divisor), */
/*      hiremainder = high dividend word (read with LOAD_HI / LOAD_Hi) */
/* Out: %o0 = quotient, hiremainder = remainder (written with SAVE_HI) */
/* Fast path: when the top 12 bits of the high word are clear, the */
/* hardware udivcc is used, and pari_err is called with code 0x2f if it */
/* reports overflow. Otherwise control passes to divlllong. */
/* Leaf routine (retl). Uses %o2, %o3, %o5, %y and the condition codes, */
/* and %o4 as well when hiremainder lives in memory. */
C(divll): LOAD_HI(%o2)
LOAD_Hi(%o2)
sethi %hi(0xfff00000),%o5 /* %o5 = mask for the top 12 bits */
andcc %o5,%o2,%g0 /* any of them set in the high word? */
bnz,a C(divlllong) /* yes: take the slow path (annulled branch) */
subcc %o2,%o1,%g0 /* delay slot, run only if taken: compare high word with y */
wr %o2,%g0,%y /* %y = high word, the upper half of the udivcc dividend */
mov %o0,%o3 /* keep x for the remainder computation */
/* NOTE(review): the two nops presumably pad out the delayed write to */
/* %y before udivcc reads it - confirm against the architecture manual. */
nop
nop
udivcc %o0,%o1,%o0 /* %o0 = (%y:x) / y, overflow flag set on overflow */
bvc 1f /* no overflow: finish normally */
umul %o0,%o1,%o5 /* delay slot: %o5 = low word of quotient * y */
mov 0x2f,%o0 /* overflow: error code argument for pari_err */
/* NOTE(review): pari_err is assumed not to return here; if it did, */
/* execution would fall through to label 1 - confirm. */
call C(pari_err),1
nop
1: subcc %o3,%o5,%o2 /* remainder = x - quotient * y */
retl
SAVE_HI(%o2) /* delay slot: hiremainder = remainder */
/* One shift-and-subtract division step, in two flavours that differ */
/* only in which register holds the current partial remainder. */
/* SS0: the remainder is in %o2. Shift it left by one bringing in the */
/*      carry, subtract the divisor %o1 into %o3, and branch to label */
/*      when there is no borrow, so that the difference in %o3 is the */
/*      remainder seen by the SS1 step at label. Without a branch the */
/*      remainder stays in %o2 and the next SS0 step follows. */
/* SS1: the same with the roles of %o2 and %o3 exchanged. */
/* In both, the addxcc sits in the branch delay slot and so always */
/* runs: it shifts %o0 left by one, bringing in the borrow of the subcc */
/* at the bottom and moving the old top bit of %o0 into the carry for */
/* the next step. %o0 thus feeds out dividend bits at the top while */
/* collecting complemented quotient bits at the bottom. */
#define SS0(label) \
addx %o2,%o2,%o2;\
subcc %o2,%o1,%o3;\
bcc label;\
addxcc %o0,%o0,%o0
#define SS1(label) \
addx %o3,%o3,%o3;\
subcc %o3,%o1,%o2;\
bcc label;\
addxcc %o0,%o0,%o0
/* divlllong: slow path of divll, a 32-step shift-and-subtract division */
/* built from the SS0 / SS1 macros defined earlier in this file. */
/* On entry: %o0 = low dividend word, %o1 = divisor, %o2 = high dividend */
/* word, and the condition codes hold the result of subcc %o2,%o1 set in */
/* the delay slot of the branch in divll. */
/* On exit: %o0 = quotient, hiremainder = remainder (through SAVE_HI). */
/* pari_err is called with code 0x2f when the high word is not below the */
/* divisor. Three cases follow: */
/*   top bit of the divisor clear   -> Lsmalldiv */
/*   top bit set, low bit clear     -> Levendiv */
/*   top bit set, low bit set       -> handled here: divide with */
/*     (divisor >> 1) + 1 in %o1, then correct quotient and remainder */
/*     for the original divisor at La32 / Lb32. */
C(divlllong):
blu 1f /* high word below the divisor: go on */
addcc %o1,%o1,%g0 /* delay slot: carry = top bit of the divisor */
mov 0x2f,%o0 /* otherwise: error code argument for pari_err */
/* NOTE(review): pari_err is assumed not to return here - confirm. */
call C(pari_err),1
nop
1: bcc Lsmalldiv /* top bit of the divisor is clear */
andcc %o1,1,%g0 /* delay slot: test the low bit of the divisor */
be Levendiv /* low bit clear: even divisor */
srl %o1,1,%o1 /* delay slot: %o1 = divisor >> 1 (even and odd case) */
add %o1,1,%o1 /* odd case: %o1 = (divisor >> 1) + 1 */
subcc %o2,%o1,%o3 /* first step, done without a preceding shift */
bcc Lb01 /* no borrow: remainder is now in %o3 */
addxcc %o0,%o0,%o0 /* delay slot: record the bit, feed out the next one */
/* 31 further steps. The La labels expect the remainder in %o2, the Lb */
/* labels (further down) expect it in %o3. */
La01: SS0(Lb02)
La02: SS0(Lb03)
La03: SS0(Lb04)
La04: SS0(Lb05)
La05: SS0(Lb06)
La06: SS0(Lb07)
La07: SS0(Lb08)
La08: SS0(Lb09)
La09: SS0(Lb10)
La10: SS0(Lb11)
La11: SS0(Lb12)
La12: SS0(Lb13)
La13: SS0(Lb14)
La14: SS0(Lb15)
La15: SS0(Lb16)
La16: SS0(Lb17)
La17: SS0(Lb18)
La18: SS0(Lb19)
La19: SS0(Lb20)
La20: SS0(Lb21)
La21: SS0(Lb22)
La22: SS0(Lb23)
La23: SS0(Lb24)
La24: SS0(Lb25)
La25: SS0(Lb26)
La26: SS0(Lb27)
La27: SS0(Lb28)
La28: SS0(Lb29)
La29: SS0(Lb30)
La30: SS0(Lb31)
La31: SS0(Lb32)
/* Finish with the remainder in %o2, then correct for the fact that the */
/* steps above used (divisor >> 1) + 1 instead of the divisor. */
La32: addx %o2,%o2,%o2 /* shift the last dividend bit into the remainder */
xor %o0,-1,%o0 /* undo the complement: %o0 = quotient q so far */
add %o1,%o1,%o1
sub %o1,1,%o1 /* %o1 = 2 * ((divisor >> 1) + 1) - 1 = divisor */
addcc %o0,%o2,%o2 /* candidate remainder = q + remainder, may carry */
bcc 1f /* no carry out of the sum */
subcc %o2,%o1,%o3 /* delay slot: %o3 = candidate - divisor */
subcc %o3,%o1,%o2 /* sum carried: try taking the divisor off once more */
bcs 2f /* borrow: one subtraction was enough, remainder in %o3 */
add %o0,1,%o0 /* delay slot: quotient + 1 */
add %o0,1,%o0 /* second subtraction valid: quotient + 2 in total */
3: retl
SAVE_HI(%o2) /* delay slot: hiremainder = %o2 */
1: bcs 3b /* candidate below divisor: quotient and %o2 are final */
nop
add %o0,1,%o0 /* one subtraction needed: quotient + 1 */
2: retl
SAVE_HI(%o3) /* delay slot: hiremainder = %o3 */
/* Same chain for the states where the remainder is in %o3. */
Lb01: SS1(La02)
Lb02: SS1(La03)
Lb03: SS1(La04)
Lb04: SS1(La05)
Lb05: SS1(La06)
Lb06: SS1(La07)
Lb07: SS1(La08)
Lb08: SS1(La09)
Lb09: SS1(La10)
Lb10: SS1(La11)
Lb11: SS1(La12)
Lb12: SS1(La13)
Lb13: SS1(La14)
Lb14: SS1(La15)
Lb15: SS1(La16)
Lb16: SS1(La17)
Lb17: SS1(La18)
Lb18: SS1(La19)
Lb19: SS1(La20)
Lb20: SS1(La21)
Lb21: SS1(La22)
Lb22: SS1(La23)
Lb23: SS1(La24)
Lb24: SS1(La25)
Lb25: SS1(La26)
Lb26: SS1(La27)
Lb27: SS1(La28)
Lb28: SS1(La29)
Lb29: SS1(La30)
Lb30: SS1(La31)
Lb31: SS1(La32)
/* Finish with the remainder in %o3: the final shift moves it to %o2, */
/* after which the correction is the same sequence as at La32. */
Lb32: addx %o3,%o3,%o2 /* %o2 = remainder shifted, last dividend bit in */
xor %o0,-1,%o0 /* undo the complement: %o0 = quotient q so far */
add %o1,%o1,%o1
sub %o1,1,%o1 /* %o1 = original divisor */
addcc %o0,%o2,%o2 /* candidate remainder = q + remainder, may carry */
bcc 1f /* no carry out of the sum */
subcc %o2,%o1,%o3 /* delay slot: %o3 = candidate - divisor */
subcc %o3,%o1,%o2 /* sum carried: try taking the divisor off once more */
bcs 2f /* borrow: one subtraction was enough, remainder in %o3 */
add %o0,1,%o0 /* delay slot: quotient + 1 */
add %o0,1,%o0 /* second subtraction valid: quotient + 2 in total */
3: retl
SAVE_HI(%o2) /* delay slot: hiremainder = %o2 */
1: bcs 3b /* candidate below divisor: quotient and %o2 are final */
nop
add %o0,1,%o0 /* one subtraction needed: quotient + 1 */
2: retl
SAVE_HI(%o3) /* delay slot: hiremainder = %o3 */
/* Lsmalldiv: division path taken from divlllong when the top bit of the */
/* divisor is clear. %o1 still holds the unmodified divisor here. */
/* The top dividend bit is first moved into the carry, then 32 steps of */
/* SS0 / SS1 (macros defined earlier in this file) are run. The Lc labels */
/* expect the remainder in %o2, the Ld labels expect it in %o3. */
/* No final remainder shift or correction is done on this path. */
/* On exit: %o0 = quotient, hiremainder = remainder (through SAVE_HI). */
Lsmalldiv:
addcc %o0,%o0,%o0 /* carry = top bit of the low dividend word */
Lc00: SS0(Ld01)
Lc01: SS0(Ld02)
Lc02: SS0(Ld03)
Lc03: SS0(Ld04)
Lc04: SS0(Ld05)
Lc05: SS0(Ld06)
Lc06: SS0(Ld07)
Lc07: SS0(Ld08)
Lc08: SS0(Ld09)
Lc09: SS0(Ld10)
Lc10: SS0(Ld11)
Lc11: SS0(Ld12)
Lc12: SS0(Ld13)
Lc13: SS0(Ld14)
Lc14: SS0(Ld15)
Lc15: SS0(Ld16)
Lc16: SS0(Ld17)
Lc17: SS0(Ld18)
Lc18: SS0(Ld19)
Lc19: SS0(Ld20)
Lc20: SS0(Ld21)
Lc21: SS0(Ld22)
Lc22: SS0(Ld23)
Lc23: SS0(Ld24)
Lc24: SS0(Ld25)
Lc25: SS0(Ld26)
Lc26: SS0(Ld27)
Lc27: SS0(Ld28)
Lc28: SS0(Ld29)
Lc29: SS0(Ld30)
Lc30: SS0(Ld31)
Lc31: SS0(Ld32)
/* Done with the remainder in %o2. */
Lc32: xor %o0,-1,%o0 /* undo the complement: %o0 = quotient */
retl
SAVE_HI(%o2) /* delay slot: hiremainder = %o2 */
/* Same chain for the states where the remainder is in %o3. */
Ld01: SS1(Lc02)
Ld02: SS1(Lc03)
Ld03: SS1(Lc04)
Ld04: SS1(Lc05)
Ld05: SS1(Lc06)
Ld06: SS1(Lc07)
Ld07: SS1(Lc08)
Ld08: SS1(Lc09)
Ld09: SS1(Lc10)
Ld10: SS1(Lc11)
Ld11: SS1(Lc12)
Ld12: SS1(Lc13)
Ld13: SS1(Lc14)
Ld14: SS1(Lc15)
Ld15: SS1(Lc16)
Ld16: SS1(Lc17)
Ld17: SS1(Lc18)
Ld18: SS1(Lc19)
Ld19: SS1(Lc20)
Ld20: SS1(Lc21)
Ld21: SS1(Lc22)
Ld22: SS1(Lc23)
Ld23: SS1(Lc24)
Ld24: SS1(Lc25)
Ld25: SS1(Lc26)
Ld26: SS1(Lc27)
Ld27: SS1(Lc28)
Ld28: SS1(Lc29)
Ld29: SS1(Lc30)
Ld30: SS1(Lc31)
Ld31: SS1(Lc32)
/* Done with the remainder in %o3. */
Ld32: xor %o0,-1,%o0 /* undo the complement: %o0 = quotient */
retl
SAVE_HI(%o3) /* delay slot: hiremainder = %o3 */
/* Levendiv: division path taken from divlllong when the divisor has its */
/* top bit set and its low bit clear. On entry %o1 already holds */
/* divisor >> 1 (shifted in the delay slot of the branch that comes here). */
/* One step without a preceding shift is followed by 31 steps of SS0 / */
/* SS1 (macros defined earlier in this file); the Le labels expect the */
/* remainder in %o2, the Lf labels expect it in %o3. A final shift then */
/* brings the last dividend bit into the remainder, which makes up for */
/* the halved divisor. No quotient correction is done on this path. */
/* On exit: %o0 = quotient, hiremainder = remainder (through SAVE_HI). */
Levendiv:
subcc %o2,%o1,%o3 /* first step, done without a preceding shift */
bcc Lf01 /* no borrow: remainder is now in %o3 */
addxcc %o0,%o0,%o0 /* delay slot: record the bit, feed out the next one */
Le01: SS0(Lf02)
Le02: SS0(Lf03)
Le03: SS0(Lf04)
Le04: SS0(Lf05)
Le05: SS0(Lf06)
Le06: SS0(Lf07)
Le07: SS0(Lf08)
Le08: SS0(Lf09)
Le09: SS0(Lf10)
Le10: SS0(Lf11)
Le11: SS0(Lf12)
Le12: SS0(Lf13)
Le13: SS0(Lf14)
Le14: SS0(Lf15)
Le15: SS0(Lf16)
Le16: SS0(Lf17)
Le17: SS0(Lf18)
Le18: SS0(Lf19)
Le19: SS0(Lf20)
Le20: SS0(Lf21)
Le21: SS0(Lf22)
Le22: SS0(Lf23)
Le23: SS0(Lf24)
Le24: SS0(Lf25)
Le25: SS0(Lf26)
Le26: SS0(Lf27)
Le27: SS0(Lf28)
Le28: SS0(Lf29)
Le29: SS0(Lf30)
Le30: SS0(Lf31)
Le31: SS0(Lf32)
/* Done with the remainder in %o2. */
Le32: addx %o2,%o2,%o2 /* shift the last dividend bit into the remainder */
xor %o0,-1,%o0 /* undo the complement: %o0 = quotient */
retl
SAVE_HI(%o2) /* delay slot: hiremainder = %o2 */
/* Same chain for the states where the remainder is in %o3. */
Lf01: SS1(Le02)
Lf02: SS1(Le03)
Lf03: SS1(Le04)
Lf04: SS1(Le05)
Lf05: SS1(Le06)
Lf06: SS1(Le07)
Lf07: SS1(Le08)
Lf08: SS1(Le09)
Lf09: SS1(Le10)
Lf10: SS1(Le11)
Lf11: SS1(Le12)
Lf12: SS1(Le13)
Lf13: SS1(Le14)
Lf14: SS1(Le15)
Lf15: SS1(Le16)
Lf16: SS1(Le17)
Lf17: SS1(Le18)
Lf18: SS1(Le19)
Lf19: SS1(Le20)
Lf20: SS1(Le21)
Lf21: SS1(Le22)
Lf22: SS1(Le23)
Lf23: SS1(Le24)
Lf24: SS1(Le25)
Lf25: SS1(Le26)
Lf26: SS1(Le27)
Lf27: SS1(Le28)
Lf28: SS1(Le29)
Lf29: SS1(Le30)
Lf30: SS1(Le31)
Lf31: SS1(Le32)
/* Done with the remainder in %o3. */
Lf32: addx %o3,%o3,%o3 /* shift the last dividend bit into the remainder */
xor %o0,-1,%o0 /* undo the complement: %o0 = quotient */
retl
SAVE_HI(%o3) /* delay slot: hiremainder = %o3 */