/* 32-bit x86 assembly, GNU assembler (AT&T) syntax, run through the C preprocessor. */
.file "wm_shrx.S"
|
||
|
/*---------------------------------------------------------------------------+
 |  wm_shrx.S                                                                |
 |                                                                           |
 |  64 bit right shift functions                                             |
 |                                                                           |
 |  Copyright (C) 1992,1995                                                  |
 |                       W. Metzenthen, 22 Parker St, Ormond, Vic 3163,      |
 |                       Australia. E-mail billm@jacobi.maths.monash.edu.au  |
 |                                                                           |
 |  Call from C as:                                                          |
 |    unsigned FPU_shrx(void *arg1, unsigned arg2)                           |
 |  and                                                                      |
 |    unsigned FPU_shrxs(void *arg1, unsigned arg2)                          |
 |                                                                           |
 +---------------------------------------------------------------------------*/
|
||
|
|
||
|
#include "fpu_emu.h"
|
||
|
|
||
|
.text
|
||
|
/*---------------------------------------------------------------------------+
 |   unsigned FPU_shrx(void *arg1, unsigned arg2)                            |
 |                                                                           |
 |   Extended shift right function.                                          |
 |   Fastest for small shifts.                                               |
 |   Shifts the 64 bit quantity pointed to by the first arg (arg1)           |
 |   right by the number of bits specified by the second arg (arg2).         |
 |   Forms a 96 bit quantity from the 64 bit arg and eax:                    |
 |           [ 64 bit arg ][ eax ]                                           |
 |           shift right --------->                                          |
 |   The eax register is initialized to 0 before the shifting.               |
 |   Results returned in the 64 bit arg and eax.                             |
 +---------------------------------------------------------------------------*/
|
||
|
|
||
|
ENTRY(FPU_shrx)
	/*
	 * Register use (PARAM1/PARAM2 are macros supplied by the included
	 * headers; their definitions are not visible in this file):
	 *   %esi = arg1, pointer to the 64 bit value
	 *          (least significant long at 0, most significant at 4)
	 *   %ecx = arg2, the shift count; the shifts themselves use %cl
	 *   %eax = extension word, returned to the caller
	 *   %edx = scratch
	 *   %ebx = scratch, saved and restored only on the [0..31] path
	 */
	pushl	%ebp
	movl	%esp,%ebp
	pushl	%esi
	movl	PARAM2,%ecx
	movl	PARAM1,%esi
	cmpl	$32,%ecx	/* shrd only works for 0..31 bits */
	jae	L_more_than_31	/* unsigned: count >= 32 */

/* Shift by [0..31] bits: all three words take part in the shift */
	pushl	%ebx
	movl	(%esi),%ebx	/* lsl */
	movl	4(%esi),%edx	/* msl */
	xorl	%eax,%eax	/* extension */
	shrd	%cl,%ebx,%eax	/* bits leaving lsl enter the extension */
	shrd	%cl,%edx,%ebx	/* bits leaving msl enter lsl */
	shr	%cl,%edx
	movl	%ebx,(%esi)
	movl	%edx,4(%esi)
	popl	%ebx
	popl	%esi
	leave
	ret

L_more_than_31:
	cmpl	$64,%ecx
	jae	L_more_than_63	/* unsigned: count >= 64 */

/*
 * Shift by [32..63] bits: move everything down one whole word, then shift
 * by (count - 32).  Bits of the old lsl which fall below the extension
 * are discarded.
 */
	subb	$32,%cl
	movl	(%esi),%eax	/* lsl, becomes the extension */
	movl	4(%esi),%edx	/* msl, becomes the new lsl */
	shrd	%cl,%edx,%eax
	shr	%cl,%edx
	movl	%edx,(%esi)
	movl	$0,4(%esi)	/* new msl is zero */
	popl	%esi
	leave
	ret

L_more_than_63:
	cmpl	$96,%ecx
	jae	L_more_than_95	/* unsigned: count >= 96 */

/*
 * Shift by [64..95] bits: only the old msl can still reach the extension;
 * the 64 bit value itself becomes zero.
 */
	subb	$64,%cl
	movl	4(%esi),%eax	/* msl */
	shr	%cl,%eax
	xorl	%edx,%edx
	movl	%edx,(%esi)
	movl	%edx,4(%esi)
	popl	%esi
	leave
	ret

L_more_than_95:
/* Shift by [96..inf) bits: the value and the extension are all zero */
	xorl	%eax,%eax
	movl	%eax,(%esi)
	movl	%eax,4(%esi)
	popl	%esi
	leave
	ret
	/*
	 * NOTE(review): no end-of-function annotation (e.g. ENDPROC) follows
	 * this ret in the visible source -- confirm whether this tree's
	 * linkage macros expect one.
	 */
|
||
|
|
||
|
|
||
|
/*---------------------------------------------------------------------------+
 |   unsigned FPU_shrxs(void *arg1, unsigned arg2)                           |
 |                                                                           |
 |   Extended shift right function (optimized for small floating point       |
 |   integers).                                                              |
 |   Shifts the 64 bit quantity pointed to by the first arg (arg1)           |
 |   right by the number of bits specified by the second arg (arg2).         |
 |   Forms a 96 bit quantity from the 64 bit arg and eax:                    |
 |           [ 64 bit arg ][ eax ]                                           |
 |           shift right --------->                                          |
 |   The eax register is initialized to 0 before the shifting.               |
 |   The lower 8 bits of eax are lost and replaced by a flag which is        |
 |   set (to 0x01) if any bit, apart from the most significant one, is       |
 |   set in the part which has been shifted out of the arg.                  |
 |   Results returned in the 64 bit arg and eax.                             |
 +---------------------------------------------------------------------------*/
|
||
|
ENTRY(FPU_shrxs)
	/*
	 * Register use (PARAM1/PARAM2 are macros supplied by the included
	 * headers; their definitions are not visible in this file):
	 *   %esi = arg1, pointer to the 64 bit value
	 *          (least significant long at 0, most significant at 4)
	 *   %ecx = arg2, the shift count; the shifts themselves use %cl
	 *   %eax = extension word; %al is overwritten with the 0/1 flag
	 *          before returning, the upper 24 bits are left as shifted
	 *   %ebx, %edx = scratch (%ebx is saved and restored on every path)
	 */
	pushl	%ebp
	movl	%esp,%ebp
	pushl	%esi
	pushl	%ebx
	movl	PARAM2,%ecx
	movl	PARAM1,%esi
	cmpl	$64,%ecx	/* counts of 64 or more are handled separately */
	jae	Ls_more_than_63

	cmpl	$32,%ecx	/* shrd only works for 0..31 bits */
	jb	Ls_less_than_32

/* We got here without jumps by assuming that the most common requirement
   is for small integers */
/* Shift by [32..63] bits */
	subb	$32,%cl
	movl	(%esi),%eax	/* lsl, becomes the extension */
	movl	4(%esi),%edx	/* msl, becomes the new lsl */
	xorl	%ebx,%ebx	/* collects the bits falling below the extension */
	shrd	%cl,%eax,%ebx
	shrd	%cl,%edx,%eax
	shr	%cl,%edx
	orl	%ebx,%ebx		/* test these 32 bits */
	setne	%bl
	testl	$0x7fffffff,%eax	/* and 31 bits here (bit 31 is excluded) */
	setne	%bh
	orw	%bx,%bx			/* Any of the 63 bits set ? (%bl or %bh) */
	setne	%al			/* flag replaces the low byte of %eax */
	movl	%edx,(%esi)
	movl	$0,4(%esi)		/* new msl is zero */
	popl	%ebx
	popl	%esi
	leave
	ret

/* Shift by [0..31] bits */
Ls_less_than_32:
	movl	(%esi),%ebx	/* lsl */
	movl	4(%esi),%edx	/* msl */
	xorl	%eax,%eax	/* extension */
	shrd	%cl,%ebx,%eax	/* bits leaving lsl enter the extension */
	shrd	%cl,%edx,%ebx	/* bits leaving msl enter lsl */
	shr	%cl,%edx
	testl	$0x7fffffff,%eax	/* only need to look at eax here */
	setne	%al			/* flag replaces the low byte of %eax */
	movl	%ebx,(%esi)
	movl	%edx,4(%esi)
	popl	%ebx
	popl	%esi
	leave
	ret

/* Shift by [64..95] bits */
Ls_more_than_63:
	cmpl	$96,%ecx
	jae	Ls_more_than_95

	subb	$64,%cl
	movl	(%esi),%ebx	/* lsl */
	movl	4(%esi),%eax	/* msl, becomes the extension */
	xorl	%edx,%edx	/* collects the bits shifted out of lsl */
	shrd	%cl,%ebx,%edx
	shrd	%cl,%eax,%ebx
	shr	%cl,%eax
	orl	%ebx,%edx		/* any bit below the extension set ? */
	setne	%bl
	testl	$0x7fffffff,%eax	/* low 31 bits of the extension itself */
	setne	%bh
	orw	%bx,%bx			/* combine the two partial results */
	setne	%al			/* flag replaces the low byte of %eax */
	xorl	%edx,%edx
	movl	%edx,(%esi)	/* set to zero */
	movl	%edx,4(%esi)	/* set to zero */
	popl	%ebx
	popl	%esi
	leave
	ret

Ls_more_than_95:
/* Shift by [96..inf) bits */
	xorl	%eax,%eax	/* extension is zero apart from the flag */
	movl	(%esi),%ebx
	orl	4(%esi),%ebx	/* was any bit of the 64 bit value set ? */
	setne	%al
	xorl	%ebx,%ebx
	movl	%ebx,(%esi)
	movl	%ebx,4(%esi)
	popl	%ebx
	popl	%esi
	leave
	ret
	/*
	 * NOTE(review): no end-of-function annotation (e.g. ENDPROC) is
	 * visible after this ret -- confirm whether this tree's linkage
	 * macros expect one.
	 */
|