212 lines
5.2 KiB
ArmAsm
Raw Normal View History

/*
* Math library
*
* Copyright (C) 2016 Intel Corporation. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
* * Neither the name of Intel Corporation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*
* Author Name <jingwei.zhang@intel.com>
* History:
* 03-14-2016 Initial version. numerics svn rev. 12864
*/
.file "sqrtl.c"
.text
..TXTST0:
# -- Begin sqrtl
/*
 * long double sqrtl(long double x)
 *
 * Square root of an x87 80-bit extended value. The root itself comes from
 * FSQRT, executed with the precision-control field of the x87 control word
 * set to 11b; whenever the control word is changed, the value captured on
 * entry is loaded back before returning.
 *
 * ABI:   looks like System V AMD64 (ELF directives, stack-passed long
 *        double) -- TODO confirm against the build configuration
 * In:    x at 8(%rsp) on entry, i.e. 64(%rsp) after the 56-byte frame
 * Out:   result in st(0)
 * Clobb: rax, cl, rdx, xmm0, EFLAGS; x87/SSE status flags may change
 *
 * Frame (offsets from %rsp after the subq):
 *    0  double scratch used to move the SSE product onto the x87 stack
 *    8  control word with the precision bits forced on
 *   10  control word captured on entry
 *   16  staged result (80-bit)
 *   32  copy of x consumed by fsqrt (80-bit)
 *   64  x itself: significand at +0, sign/exponent word at +8
 *
 * Dispatch:
 *   exponent 0x7fff, significand != 0x8000000000000000 -> x * _ones[0]
 *   sign set, exponent 0, significand 0 (that is, -0)   -> x unchanged
 *   sign set otherwise (negative values, -Inf)          -> _infs[0] * _zeros[0]
 *   everything else (including +Inf)                    -> fsqrt(x)
 */
        .text
        .set    SQRTL_FRAME_SIZE, 56            # locals allocated below the return address
        .set    SQRTL_EXP_MASK, 0x7fff          # exponent field of the sign/exponent word
        .set    SQRTL_CW_PC_MASK, 0x300         # control-word precision-control field (bits 8-9)
        .set    SQRTL_CW_PC_FORCE, -64768       # 0xffff0300 as imm32; only the low word is stored
        .align  16,0x90
        .globl  sqrtl
sqrtl:
        .cfi_startproc
        subq    $SQRTL_FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 64
        xorb    %cl, %cl                        # cl becomes 1 once the control word is switched
        fldt    64(%rsp)
        fstpt   32(%rsp)                        # private copy of x for fsqrt
        fnstcw  10(%rsp)                        # capture the incoming control word
        movzwl  72(%rsp), %eax                  # sign/exponent word of x
        andl    $SQRTL_EXP_MASK, %eax           # eax = biased exponent
        cmpl    $SQRTL_EXP_MASK, %eax
        je      .Lsqrtl_exp_all_ones            # Inf or NaN encoding

.Lsqrtl_check_sign:
        testb   $0x80, 73(%rsp)                 # sign bit of x
        jne     .Lsqrtl_negative

        # Sign clear: force the precision field on when needed, then take the root.
        movzwl  10(%rsp), %edx
        movl    %edx, %eax
        andl    $SQRTL_CW_PC_MASK, %eax
        cmpl    $SQRTL_CW_PC_MASK, %eax
        je      .Lsqrtl_take_root               # both precision bits already set
        orl     $SQRTL_CW_PC_FORCE, %edx
        movw    %dx, 8(%rsp)
        fldcw   8(%rsp)
        movb    $1, %cl                         # remember that a restore is owed

.Lsqrtl_take_root:
        fldt    32(%rsp)
        fsqrt
        fstpt   16(%rsp)
        testb   %cl, %cl
        je      .Lsqrtl_return_root
        fldcw   10(%rsp)                        # put the captured control word back

.Lsqrtl_return_root:
        fldt    16(%rsp)                        # result travels back in st(0)
        addq    $SQRTL_FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 8
        ret
        .cfi_def_cfa_offset 64

.Lsqrtl_negative:
        # Sign set. eax still holds the biased exponent computed on entry
        # (0x7fff when this point is reached for an infinity).
        testl   %eax, %eax
        jne     .Lsqrtl_domain_error
        cmpq    $0, 64(%rsp)                    # all 64 significand bits clear?
        jne     .Lsqrtl_domain_error
        fldt    64(%rsp)                        # x is -0: hand it back untouched
        addq    $SQRTL_FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 8
        ret
        .cfi_def_cfa_offset 64

.Lsqrtl_domain_error:
        movzwl  10(%rsp), %edx
        movl    %edx, %eax
        andl    $SQRTL_CW_PC_MASK, %eax
        cmpl    $SQRTL_CW_PC_MASK, %eax
        je      .Lsqrtl_build_nan
        orl     $SQRTL_CW_PC_FORCE, %edx
        movw    %dx, 8(%rsp)
        fldcw   8(%rsp)
        movb    $1, %cl

.Lsqrtl_build_nan:
        leaq    _infs(%rip), %rax
        leaq    _zeros(%rip), %rdx
        testb   %cl, %cl                        # ZF is consumed by the je further down; the
                                                # SSE and x87 instructions in between do not
                                                # write EFLAGS
        movsd   (%rax), %xmm0                   # first entry of _infs (+Inf)
        mulsd   (%rdx), %xmm0                   # times first entry of _zeros (+0.0)
        movsd   %xmm0, (%rsp)
        fldl    (%rsp)                          # reload the double product as extended
        fstpt   16(%rsp)
        je      .Lsqrtl_return_nan
        fldcw   10(%rsp)

.Lsqrtl_return_nan:
        fldt    16(%rsp)
        addq    $SQRTL_FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 8
        ret
        .cfi_def_cfa_offset 64

.Lsqrtl_exp_all_ones:
        cmpl    $0x80000000, 68(%rsp)           # high significand dword: only the top bit set?
        jne     .Lsqrtl_nan_operand
        cmpl    $0, 64(%rsp)                    # low significand dword
        je      .Lsqrtl_check_sign              # infinity: the sign decides the outcome

.Lsqrtl_nan_operand:
        movzwl  10(%rsp), %edx
        movl    %edx, %eax
        andl    $SQRTL_CW_PC_MASK, %eax
        cmpl    $SQRTL_CW_PC_MASK, %eax
        je      .Lsqrtl_nan_precision_ok
        orl     $SQRTL_CW_PC_FORCE, %edx
        movw    %dx, 8(%rsp)
        fldcw   8(%rsp)
        fldt    64(%rsp)
        leaq    _ones(%rip), %rax
        fmull   (%rax)                          # x * 1.0 (presumably to let the FPU quiet the NaN)
        fstpt   16(%rsp)
        fldcw   10(%rsp)                        # this path always switched, so always restore

.Lsqrtl_return_scaled:
        fldt    16(%rsp)
        addq    $SQRTL_FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 8
        ret
        .cfi_def_cfa_offset 64

.Lsqrtl_nan_precision_ok:
        fldt    64(%rsp)
        leaq    _ones(%rip), %rax
        fmull   (%rax)                          # same x * 1.0, no control-word change needed
        fstpt   16(%rsp)
        jmp     .Lsqrtl_return_scaled
        .align  16,0x90
        .cfi_endproc
        .type   sqrtl,@function
        .size   sqrtl,.-sqrtl
        .data
# -- End sqrtl
# Read-only double-precision constants referenced from sqrtl.
# Each table holds a positive value followed by its negated twin; every
# value is spelled as two little-endian 32-bit words (low word first).
# The code in this file only reads the first value of each table.
        .section .rodata, "a"
        .align  4
_infs:
        .long   0x00000000, 0x7ff00000          # +Inf
        .long   0x00000000, 0xfff00000          # -Inf
        .type   _infs,@object
        .size   _infs,16
        .align  4
_zeros:
        .long   0x00000000, 0x00000000          # +0.0
        .long   0x00000000, 0x80000000          # -0.0
        .type   _zeros,@object
        .size   _zeros,16
        .align  4
_ones:
        .long   0x00000000, 0x3ff00000          # +1.0
        .long   0x00000000, 0xbff00000          # -1.0
        .type   _ones,@object
        .size   _ones,16
# File trailer: switch back to .data, then declare the bookkeeping sections.
.data
# Empty .note.GNU-stack section: by GNU toolchain convention this marks
# the object as not requiring an executable stack.
.section .note.GNU-stack, ""
// -- Begin DWARF2 SEGMENT .eh_frame
# Only a label and an alignment directive are placed in .eh_frame here.
# NOTE(review): the unwind description presumably comes from the .cfi_*
# directives inside sqrtl - confirm nothing relies on .eh_frame_seg.
.section .eh_frame,"a",@progbits
.eh_frame_seg:
.align 1
# End