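/*
* File: corda/external/sgx_libm/ia32/csqrtl.S
*
* Viewer metadata kept for reference: 740 lines, 18 KiB. The viewer labelled
* this file "ArmAsm", but the content is IA-32 x87 assembly in GNU as AT&T
* syntax.
*/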

/*
* Math library
*
* Copyright (C) 2016 Intel Corporation. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
* * Neither the name of Intel Corporation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*
* Author Name <jingwei.zhang@intel.com>
* History:
* 03-14-2016 Initial version. numerics svn rev. 12864
*/
.file "csqrtl.c"
.text
..TXTST0:
# -- Begin csqrtl
/*
 * csqrtl -- complex square root of an x87 extended-precision complex value.
 * IA-32, GNU as AT&T syntax, position-independent (GOT-relative data access).
 * The labels and the .file directive suggest this is compiler output for
 * csqrtl.c; treat the instruction order as significant.
 *
 * Stack arguments (after the frame is set up):
 *    8(%ebp)  pointer to the 24-byte result buffer; popped by "ret $4"
 *   12(%ebp)  real part x, 12-byte slot (mantissa at 12/16, sign+exponent
 *             word at 20, sign byte at 21)
 *   24(%ebp)  imaginary part y, 12-byte slot (mantissa at 24/28,
 *             sign+exponent word at 32, sign byte at 33)
 * Return: %eax = the result pointer; real part at offset 0, imaginary part at
 * offset 12 of the buffer.
 *
 * Register roles on the main path:
 *   %ebx  GOT base            %esi  1 if the x87 control word must be restored
 *   %edi  exponent of x       %edx  exponent of y
 *
 * Frame slots (offsets from %esp outside the helper-call windows, where %esp
 * is temporarily lowered by 32):
 *     0  first scaled result        12  biased exponent scratch
 *    16  0.5                        32  splitting constant 2^32+1
 *    44  result pointer             48  unscaled high part of the first root
 *    60  new control word           62  saved control word
 *    76  |y| with exponent forced to 0x3fff (exponent word at 84)
 *    88  0.0                       100/112  two values written by
 *                                           __libm_hypot2l_k80
 *   124/136  scratch               148  |x| with exponent forced to 0x3fff
 *                                       (exponent word at 156)
 *   172  result real part          184  result imaginary part
 *   196  stack-protector guard
 *
 * Helpers: __libm_hypot2l_k80 and __libm_scalbl_k80 are defined elsewhere;
 * everything said about their results below is inferred from how this code
 * consumes them and should be confirmed against their sources.
 */
.text
.align 16,0x90
.globl csqrtl
csqrtl:
# parameter 1: 12 + %ebp
..B1.1:
..L1:
/* Prologue: frame pointer, 64-byte aligned frame, callee-saved registers. */
pushl %ebp
movl %esp, %ebp
andl $-64, %esp
pushl %esi
pushl %edi
pushl %ebx
subl $244, %esp
call ..L2 # call/pop pair yields the current address for PIC
..L2:
popl %ebx
lea _GLOBAL_OFFSET_TABLE_+[. - ..L2](%ebx), %ebx # ebx = GOT base for @GOTOFF operands
movl 8(%ebp), %eax # caller-provided result pointer
movl %eax, 44(%esp) # kept for the exit path
fldt .L_2il0floatpacket.8@GOTOFF(%ebx) # 0.0
movl %gs:20, %edx # stack-protector guard value
xorl %esp, %edx
movl %edx, 196(%esp) # guard xor esp, checked before returning
fstpt 172(%esp) # result real part = 0.0
fldt 172(%esp)
fstpt 184(%esp) # result imaginary part = 0.0
..B1.2:
fnstcw 62(%esp) # save the incoming x87 control word
..B1.3:
movzwl 62(%esp), %edx
movl %edx, %eax
andl $768, %eax # precision-control field, bits 8-9 (0x300)
cmpl $768, %eax
je ..B1.69 # field already 11b: leave the control word alone
..B1.4:
orl $-64768, %edx # set both precision-control bits (low word | 0x0300)
movw %dx, 60(%esp)
..B1.5:
fldcw 60(%esp)
..B1.6:
movl $1, %esi # remember to restore the control word on exit
..B1.7:
/* Classify x: edi = 15-bit biased exponent, ecx keeps the raw word. */
movzwl 20(%ebp), %ecx
movl %ecx, %edi
andl $32767, %edi
cmpl $32767, %edi
jge ..B1.30 # x has the maximum exponent (infinity or NaN)
..B1.8:
cmpl $0, 16(%ebp)
jne ..B1.10
..B1.9:
cmpl $0, 12(%ebp)
je ..B1.30 # x has an all-zero mantissa
..B1.10:
/* Classify y the same way: edx = biased exponent, eax = raw word. */
movzwl 32(%ebp), %eax
movl %eax, %edx
andl $32767, %edx
cmpl $32767, %edx
jge ..B1.48 # y has the maximum exponent
..B1.11:
cmpl $0, 28(%ebp)
jne ..B1.13
..B1.12:
cmpl $0, 24(%ebp)
je ..B1.32 # y has an all-zero mantissa
..B1.13:
/* Main path: x and y both have a non-maximum exponent and a nonzero mantissa. */
fldt 12(%ebp)
testl %edi, %edi
jle ..B1.56 # exponent field of x is zero: pre-scale it first
..B1.14:
andl $-32768, %ecx # keep only the sign bit of the exponent word
addl $-16383, %edi # edi = unbiased exponent of x
fstpt 148(%esp)
fldt 148(%esp) # x stays on the x87 stack; the copy at 148 is edited below
orl $-49153, %ecx # exponent field := 0x3fff
movw %cx, 156(%esp)
..B1.15:
fldt 24(%ebp)
testl %edx, %edx
movb $63, 157(%esp) # high byte 0x3f: clears the sign of the copy at 148
jle ..B1.55 # exponent field of y is zero: pre-scale it first
..B1.16:
andl $-32768, %eax
addl $-16383, %edx # edx = unbiased exponent of y
fstpt 76(%esp)
fldt 76(%esp) # y stays on the x87 stack; the copy at 76 is edited below
orl $-49153, %eax
movw %ax, 84(%esp)
..B1.17:
/*
 * Call __libm_hypot2l_k80(out, x, y): the arguments are a pointer to the
 * frame slot at 100(%esp) (pre-adjustment numbering) followed by the two
 * original operands. The x87 stack is emptied for the call; 0.0 and edx are
 * parked in memory and reloaded afterwards.
 */
fldt 72+_CONSTANTS@GOTOFF(%ebx) # 0.0
movb $63, 85(%esp) # clears the sign of the copy at 76
fstpt 88(%esp)
fldt 88(%esp)
addl $-32, %esp # open a 32-byte argument window
lea 132(%esp), %eax # = 100(%esp) in pre-adjustment numbering
movl %eax, (%esp)
fxch %st(2) # bring x to the top: st0 = x, st1 = y, st2 = 0.0
fstpt 4(%esp)
fstpt 16(%esp)
fstpt 32(%esp) # park 0.0
movl %edx, -72(%eax) # park edx at 60(%esp) across the call
call __libm_hypot2l_k80
..B1.72:
fldt 32(%esp)
movl 60(%esp), %edx
addl $32, %esp
..B1.18:
/*
 * The helper return value is turned into an integer by adding 1.5*2^63 and
 * reading back the low dword of the stored sum; eax = that integer >> 1.
 * NOTE(review): this looks like the binary scale of x^2+y^2, halved for the
 * square root, with 100(%esp)/112(%esp) holding a high/low pair -- confirm
 * against the helper.
 * The remaining code takes fsqrt of the value at 100(%esp), splits it with
 * 2^32+1 (saved at 32(%esp)), and applies a correction that involves the
 * value at 112(%esp) and 0.5 (saved at 16(%esp)). The sum of the two
 * resulting parts is stored at 124(%esp) and one part at 136(%esp).
 */
fldt 132+_CONSTANTS@GOTOFF(%ebx) # 1.5*2^63
faddp %st, %st(2)
fxch %st(1)
fstpt (%esp)
fldt 100(%esp)
fld %st(0)
fsqrt
fldt 84+_CONSTANTS@GOTOFF(%ebx) # 2^32+1
fstpt 32(%esp)
fldt 32(%esp)
fmul %st(1), %st
fld %st(0)
movl (%esp), %eax # integer value of the helper return
fsubr %st(2), %st
sarl $1, %eax
faddp %st, %st(1)
fld %st(0)
fsubr %st(2), %st
fld %st(1)
fmul %st(2), %st
fxch %st(1)
fmul %st, %st(2)
fxch %st(2)
fadd %st(0), %st
fld %st(0)
fadd %st(2), %st
fsubr %st, %st(2)
fxch %st(1)
faddp %st, %st(2)
fxch %st(2)
fmul %st(0), %st
faddp %st, %st(1)
fxch %st(1)
fsubrp %st, %st(3)
fsubrp %st, %st(2)
fldt 112(%esp)
faddp %st, %st(2)
fldt 24+_CONSTANTS@GOTOFF(%ebx) # 0.5
fmul %st, %st(2)
fxch %st(1)
fdivr %st, %st(2)
fxch %st(1)
fstpt 16(%esp) # keep 0.5 for later reuse
fld %st(0)
fadd %st(2), %st
fstpt 124(%esp)
fldt 124(%esp)
fsubr %st, %st(1)
movzwl 132(%esp), %ecx # exponent word of the value just stored at 124
fxch %st(1)
faddp %st, %st(2)
andl $32767, %ecx
movl %ecx, 12(%esp) # biased exponent, reused in ..B1.19
fxch %st(1)
fstpt 136(%esp)
fldt 136(%esp)
lea -16464(%ecx,%eax), %ecx # exponent + eax - (16383 + 81)
cmpl %ecx, %edi
jle ..B1.22 # exponent of x is at least 81 below: x is left out
..B1.19:
movl 12(%esp), %ecx
lea -16302(%ecx,%eax), %ecx # exponent + eax - (16383 - 81)
cmpl %ecx, %edi
jge ..B1.21 # exponent of x is at least 81 above: only |x| is kept
..B1.20:
/*
 * Comparable magnitudes: rewrite the exponent of the |x| copy at 148(%esp)
 * to (edi - eax + 16383), add it to the pair above with an error-compensated
 * sum, and continue with edi = eax.
 */
fstp %st(2)
subl %eax, %edi
fld %st(0)
addl $16383, %edi
fld %st(1)
movzwl 156(%esp), %ecx
andl $32767, %edi
andl $-32768, %ecx
orl %edi, %ecx
movl %eax, %edi
movw %cx, 156(%esp)
fldt 148(%esp)
fadd %st, %st(2)
fld %st(2)
fxch %st(2)
fsubr %st(3), %st
fsubr %st, %st(2)
fxch %st(2)
fsubrp %st, %st(4)
fsubp %st, %st(1)
faddp %st, %st(2)
fxch %st(2)
faddp %st, %st(1)
fxch %st(1)
jmp ..B1.23
..B1.21:
fstp %st(0)
fstp %st(0)
fldt 148(%esp) # continue with |x| alone; edi is unchanged
jmp ..B1.23
..B1.22:
fstp %st(2)
movl %eax, %edi # continue with the pair alone at scale eax
..B1.23:
/*
 * Square root of the value selected above, halved. The exponent edi is
 * reduced to (edi - ecx - 1) >> 1 with ecx = (edi + 1) & 1, and the mantissa
 * is multiplied by 1.0 or 2.0 (table entry 48 + 12*ecx) to absorb the parity.
 * The same fsqrt / split / correct sequence as in ..B1.18 follows, and the
 * result is scaled by __libm_scalbl_k80 with the two long double parts at
 * (%esp) and 12(%esp) and the integer exponent at 24(%esp).
 * NOTE(review): the value appears to be sqrt((|z| + |x|) / 2) -- confirm.
 */
fldt 32(%esp) # 2^32+1
lea 1(%edi), %ecx
andl $1, %ecx
subl %ecx, %edi
decl %edi
sarl $1, %edi
lea (,%ecx,8), %eax
lea (%eax,%ecx,4), %eax # eax = 12 * ecx
fldt 48+_CONSTANTS@GOTOFF(%eax,%ebx) # 1.0 or 2.0
fmul %st, %st(2)
fld %st(2)
fsqrt
fmul %st, %st(2)
fld %st(2)
fsubr %st(1), %st
faddp %st, %st(3)
fld %st(2)
fsubr %st(1), %st
fxch %st(2)
fmulp %st, %st(5)
fld %st(2)
fmul %st(3), %st
fxch %st(2)
fmul %st, %st(3)
fxch %st(3)
fadd %st(0), %st
fld %st(0)
fadd %st(3), %st
fsubr %st, %st(3)
fxch %st(1)
faddp %st, %st(3)
fxch %st(3)
fmul %st(0), %st
faddp %st, %st(2)
fxch %st(2)
fsubrp %st, %st(3)
fsubrp %st, %st(2)
fxch %st(2)
faddp %st, %st(1)
fld %st(1)
fldt 16(%esp) # 0.5
fmulp %st, %st(2)
fxch %st(1)
fdiv %st(2), %st
fadd %st, %st(1)
fxch %st(1)
fstpt 48(%esp) # unscaled high part, reused as the divisor in ..B1.24
fldt 48(%esp)
addl $-32, %esp # open a 32-byte argument window
fsubr %st, %st(2)
fxch %st(2)
faddp %st, %st(1)
fxch %st(1)
fstpt (%esp)
fstpt 12(%esp)
fldt 12(%esp)
movl %edi, 24(%esp) # exponent argument
fstpt 96(%esp) # park the second part across the call
movl %edx, 60(%esp) # park edx across the call
call __libm_scalbl_k80
..B1.73:
fldt 96(%esp)
movl 60(%esp), %edx
fxch %st(1)
fstpt 32(%esp) # scaled first result; this is (%esp) once the window closes
addl $32, %esp
..B1.24:
/*
 * Second component: divides the |y| copy at 76(%esp) by the unscaled first
 * root at 48(%esp) with an error-compensated product/quotient sequence,
 * multiplies by 0.5, and scales by 2^(edx - edi) through __libm_scalbl_k80.
 * NOTE(review): this appears to be |y| / (2 * first root) -- confirm.
 */
fldt 76(%esp)
subl %edi, %edx # exponent of y minus exponent used for the first root
fldt 48(%esp)
fld %st(0)
fdivr %st(2), %st
fmul %st, %st(3)
fld %st(1)
fldt 32(%esp) # 2^32+1
fld %st(0)
fmul %st(3), %st
fld %st(0)
fsubr %st(4), %st
faddp %st, %st(1)
fld %st(0)
fsubr %st(4), %st
fxch %st(2)
fmul %st(5), %st
fsubr %st, %st(3)
faddp %st, %st(3)
fxch %st(2)
fsubr %st, %st(4)
fld %st(2)
fmul %st(1), %st
fxch %st(1)
fmul %st(2), %st
fxch %st(3)
fmul %st(5), %st
faddp %st, %st(3)
fld %st(2)
fadd %st(1), %st
fsubr %st, %st(1)
fxch %st(3)
faddp %st, %st(1)
fxch %st(1)
fmulp %st, %st(4)
faddp %st, %st(3)
fld %st(1)
fxch %st(1)
fsubrp %st, %st(4)
fxch %st(2)
fsubrp %st, %st(3)
fldt 88(%esp) # 0.0
faddp %st, %st(3)
fxch %st(3)
fsubrp %st, %st(2)
fldt 48(%esp)
fdivrp %st, %st(2)
fadd %st(1), %st
fsubr %st, %st(2)
fxch %st(2)
faddp %st, %st(1)
fldt 16(%esp) # 0.5
fmul %st, %st(2)
fmulp %st, %st(1)
addl $-32, %esp # open a 32-byte argument window
fxch %st(1)
fstpt (%esp)
fstpt 12(%esp)
movl %edx, 24(%esp) # exponent argument
call __libm_scalbl_k80
..B1.74:
addl $32, %esp
..B1.25:
/*
 * Assemble the result. st0 = second scaled value, (%esp) = first scaled
 * value. The sign bit of x decides which of the two becomes the real part.
 */
movzbl 21(%ebp), %eax
testl $128, %eax # sign bit of x
jne ..B1.27
..B1.26:
fldt (%esp)
lea 184(%esp), %edi # edi -> imaginary slot; -12(%edi) is the real slot
fstpt -12(%edi) # sign clear: real part = first value
jmp ..B1.28
..B1.27:
fldt (%esp)
lea 184(%esp), %edi
fxch %st(1)
fstpt -12(%edi) # sign set: real part = second value
..B1.28:
/* Imaginary part = remaining value times +1.0 or -1.0 chosen by the sign of y. */
movzbl 33(%ebp), %edx
andl $128, %edx
shrl $7, %edx
lea (,%edx,8), %eax
lea (%eax,%edx,4), %ecx # ecx = 12 * sign bit
fldt _CONSTANTS@GOTOFF(%ebx,%ecx)
fmulp %st, %st(1)
fstpt (%edi)
jmp ..B1.51
..B1.30:
/* x has a zero mantissa or the maximum exponent: classify y now. */
movzwl 32(%ebp), %edx
andl $32767, %edx
..B1.31:
cmpl $32767, %edx
jge ..B1.48
..B1.32:
/* y does not have the maximum exponent here. */
movl 16(%ebp), %eax
testl %eax, %eax
jne ..B1.40
..B1.33:
cmpl $0, 12(%ebp)
jne ..B1.40
..B1.34:
cmpl $0, 28(%ebp)
jne ..B1.36
..B1.35:
cmpl $0, 24(%ebp)
je ..B1.40 # both mantissas are zero
..B1.36:
/*
 * Mantissa of x is zero and mantissa of y is not: both result parts share the
 * magnitude sqrt(|y| / 2); the imaginary part takes the sign of y.
 * The flags set by "cmpl $2, %edx" survive the lea/fldt instructions and are
 * consumed by the jl below.
 */
fldt 24(%ebp)
movzbl 33(%ebp), %ecx
andl $128, %ecx
shrl $7, %ecx
cmpl $2, %edx
lea (,%ecx,8), %eax
lea (%eax,%ecx,4), %eax # eax = 12 * sign bit of y
fldt _CONSTANTS@GOTOFF(%eax,%ebx) # +1.0 or -1.0
jl ..B1.38 # biased exponent of y below 2: use the rescaled variant
..B1.37:
fldt 24+_CONSTANTS@GOTOFF(%ebx,%eax) # +0.5 or -0.5
fmulp %st, %st(2) # |y| / 2
fxch %st(1)
fsqrt
jmp ..B1.39
..B1.38:
fldt 108+_CONSTANTS@GOTOFF(%ebx) # 2^16383
fmulp %st, %st(2)
fmul %st, %st(1) # |y| * 2^16383
fxch %st(1)
fsqrt
fldt 156+_CONSTANTS@GOTOFF(%ebx) # 2^-8192
fmulp %st, %st(1) # net effect: sqrt(|y|) * 2^-0.5
..B1.39:
fstpt 172(%esp) # real part
fldt 172(%esp)
fmulp %st, %st(1) # times +1.0 or -1.0
fstpt 184(%esp) # imaginary part
jmp ..B1.51
..B1.40:
cmpl $32767, %edi
jl ..B1.43
..B1.41:
/* x has the maximum exponent: mantissa 0x80000000:00000000 means infinity. */
cmpl $-2147483648, %eax
jne ..B1.47
..B1.42:
cmpl $0, 12(%ebp)
jne ..B1.47
..B1.43:
/*
 * Results built from sqrt(|x|) and 0.0. The flags set by "testl %ecx, %ecx"
 * (sign bit of x) survive the lea and x87 instructions and are consumed by
 * the jne at the end of this block.
 */
fldt 12(%ebp)
fldt 72+_CONSTANTS@GOTOFF(%ebx) # 0.0
movzbl 21(%ebp), %ecx
andl $128, %ecx
shrl $7, %ecx
testl %ecx, %ecx
lea (,%ecx,8), %eax
lea (%eax,%ecx,4), %edx # edx = 12 * sign bit of x
fldt _CONSTANTS@GOTOFF(%ebx,%edx) # +1.0 or -1.0
fmulp %st, %st(2) # |x|
fxch %st(1)
fstpt 148(%esp)
fldt 148(%esp)
fsqrt # st0 = sqrt(|x|), st1 = 0.0
jne ..B1.45
..B1.44:
fstpt 172(%esp) # sign clear: real part = sqrt(|x|), 0.0 left for the imaginary part
lea 184(%esp), %edi
jmp ..B1.46
..B1.45:
fxch %st(1)
fstpt 172(%esp) # sign set: real part = 0.0, sqrt(|x|) left for the imaginary part
lea 184(%esp), %edi
..B1.46:
/* Imaginary part = remaining value times +1.0 or -1.0 chosen by the sign of y. */
movzbl 33(%ebp), %edx
andl $128, %edx
shrl $7, %edx
lea (,%edx,8), %eax
lea (%eax,%ecx,4), %ecx
fldt _CONSTANTS@GOTOFF(%ebx,%ecx)
fmulp %st, %st(1)
fstpt (%edi)
jmp ..B1.51
..B1.47:
/* x has the maximum exponent but is not infinity: both parts = x * x. */
fldt 12(%ebp)
fmul %st(0), %st
fstpt 172(%esp)
fldt 172(%esp)
fstpt 184(%esp)
jmp ..B1.51
..B1.48:
/* Flags still hold the compare of the exponent of y against 32767. */
je ..B1.63
..B1.49:
cmpl $32767, %edi
je ..B1.58
..B1.50:
/* Real part = x * (x * y), imaginary part = (x * y) * y. */
fldt 12(%ebp)
fld %st(0)
fldt 24(%ebp)
fmul %st, %st(1)
fxch %st(1)
fmul %st, %st(2)
fxch %st(2)
fstpt 172(%esp)
fmulp %st, %st(1)
fstpt 184(%esp)
..B1.51:
/* Common exit: restore the control word if it was changed on entry. */
testl %esi, %esi
je ..B1.53
..B1.52:
fldcw 62(%esp)
..B1.53:
/* Copy the 24-byte result from 172..195(%esp) to the caller buffer. */
movl 44(%esp), %eax
movl 172(%esp), %edx
movl 176(%esp), %ecx
movl %edx, (%eax)
movl %ecx, 4(%eax)
movl 180(%esp), %esi
movl 184(%esp), %edi
movl 188(%esp), %edx
movl 192(%esp), %ecx
movl %esi, 8(%eax)
movl %edi, 12(%eax)
movl %edx, 16(%eax)
movl %ecx, 20(%eax)
movl 196(%esp), %eax # stack-protector check
xorl %esp, %eax
cmpl %gs:20, %eax
jne ..B1.57
..B1.54:
movl 44(%esp), %eax # return the result pointer
addl $244, %esp
popl %ebx
popl %edi
popl %esi
movl %ebp, %esp
popl %ebp
ret $4 # also pops the result pointer argument
..B1.55:
/*
 * Exponent field of y is zero: multiply by 2^256, store the product at
 * 76(%esp), take edx = its biased exponent - 16639 (= 16383 + 256), force
 * the exponent field of the copy to 0x3fff, and rejoin the main path.
 */
fldt 120+_CONSTANTS@GOTOFF(%ebx) # 2^256
fmul %st(1), %st
fstpt 76(%esp)
movzwl 84(%esp), %eax
movl %eax, %edx
andl $-32768, %eax
andl $32767, %edx
orl $-49153, %eax
addl $-16639, %edx
movw %ax, 84(%esp)
jmp ..B1.17
..B1.56:
/* Same pre-scaling for x, using the copy at 148(%esp) and edi. */
fldt 120+_CONSTANTS@GOTOFF(%ebx) # 2^256
fmul %st(1), %st
fstpt 148(%esp)
movzwl 156(%esp), %ecx
movl %ecx, %edi
andl $-32768, %ecx
andl $32767, %edi
orl $-49153, %ecx
addl $-16639, %edi
movw %cx, 156(%esp)
jmp ..B1.15
..B1.57:
call __stack_chk_fail@PLT # guard mismatch
..B1.58:
/* x has the maximum exponent; y was routed here via ..B1.49. Is x infinity? */
cmpl $-2147483648, 16(%ebp)
jne ..B1.50
..B1.59:
cmpl $0, 12(%ebp)
jne ..B1.50
..B1.60:
/*
 * x is infinity: the parts are x * x and y * y; the sign bit of x decides
 * which goes where. The flags from testl survive the x87 instructions.
 */
fldt 12(%ebp)
movzbl 21(%ebp), %eax
testl $128, %eax
fmul %st(0), %st
fldt 24(%ebp)
fmul %st(0), %st # st0 = y * y, st1 = x * x
jne ..B1.62
..B1.61:
fxch %st(1)
fstpt 172(%esp) # sign clear: real part = x * x
fstpt 184(%esp) # imaginary part = y * y
jmp ..B1.51
..B1.62:
fstpt 172(%esp) # sign set: real part = y * y
fstpt 184(%esp) # imaginary part = x * x
jmp ..B1.51
..B1.63:
/* y has the maximum exponent: mantissa 0x80000000:00000000 means infinity. */
cmpl $-2147483648, 28(%ebp)
jne ..B1.49
..B1.64:
cmpl $0, 24(%ebp)
jne ..B1.49
..B1.65:
/*
 * y is infinity: real part = y * y, imaginary part = that value times +1.0 or
 * -1.0 chosen by the sign of y. The flags set by "cmpl $32767, %edi" survive
 * until the jne at the end of this block.
 */
fldt 24(%ebp)
movzbl 33(%ebp), %edx
andl $128, %edx
shrl $7, %edx
fmul %st(0), %st
cmpl $32767, %edi
fstpt 172(%esp)
fldt 172(%esp)
lea (,%edx,8), %eax
lea (%eax,%edx,4), %ecx
fldt _CONSTANTS@GOTOFF(%ebx,%ecx)
fmulp %st, %st(1)
fstpt 184(%esp)
jne ..B1.51 # x does not have the maximum exponent: done
..B1.66:
cmpl $-2147483648, 16(%ebp)
jne ..B1.68
..B1.67:
cmpl $0, 12(%ebp)
je ..B1.51 # x is infinity: done
..B1.68:
/*
 * x has the maximum exponent and is not infinity: x * 1.0 is written back to
 * the incoming argument slot and is not read again; the result is unchanged.
 * NOTE(review): presumably kept only for its floating-point exception side
 * effect -- confirm against csqrtl.c.
 */
fldt 12(%ebp)
fldt _CONSTANTS@GOTOFF(%ebx) # 1.0
fmulp %st, %st(1)
fstpt 12(%ebp)
jmp ..B1.51
..B1.69:
xorl %esi, %esi # control word untouched: nothing to restore on exit
jmp ..B1.7
.align 16,0x90
.type csqrtl,@function
.size csqrtl,.-csqrtl
.data
# -- End csqrtl
.section .rodata, "a"
.align 16
/* 0.0 as a 12-byte x87 extended slot; csqrtl seeds both result parts from it. */
.L_2il0floatpacket.8:
.byte 0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00
.type .L_2il0floatpacket.8,@object
.size .L_2il0floatpacket.8,12
.space 4, 0x00 # pad
.align 16
/*
 * Constant table for csqrtl: 14 x87 extended values in 12-byte slots.
 * Each row is one slot, little-endian 16-bit words: four mantissa words
 * (least significant first), the sign+exponent word, and one padding word.
 * The byte offset of each slot from _CONSTANTS and its decoded value are
 * given on the right. Slots +96 and +144 are not referenced by csqrtl in
 * this file.
 */
_CONSTANTS:
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x3fff, 0x0000 /* +0    1.0  (sign table, entry for sign bit 0) */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0xbfff, 0x0000 /* +12  -1.0  (sign table, entry for sign bit 1) */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x3ffe, 0x0000 /* +24   0.5 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0xbffe, 0x0000 /* +36  -0.5 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x3fff, 0x0000 /* +48   1.0  (exponent parity factor, entry 0) */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x4000, 0x0000 /* +60   2.0  (exponent parity factor, entry 1) */
.word 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000 /* +72   0.0 */
.word 0x0000, 0x8000, 0x0000, 0x8000, 0x401f, 0x0000 /* +84   2^32 + 1 */
.word 0xc28f, 0x28f5, 0x8f5c, 0xf5c2, 0x3ff9, 0x0000 /* +96   approximately 0.03 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x7ffe, 0x0000 /* +108  2^16383 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x40ff, 0x0000 /* +120  2^256 */
.word 0x0000, 0x0000, 0x0000, 0xc000, 0x403e, 0x0000 /* +132  1.5 * 2^63 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x3eff, 0x0000 /* +144  2^-256 */
.word 0x0000, 0x0000, 0x0000, 0x8000, 0x1fff, 0x0000 /* +156  2^-8192 */
.type _CONSTANTS,@object
.size _CONSTANTS,168
.data
/* Internal helpers called by csqrtl; hidden visibility keeps them out of the dynamic symbol table. */
.hidden __libm_hypot2l_k80
.hidden __libm_scalbl_k80
.section .note.GNU-stack, ""
# End