/*
 * Math library
 *
 * Copyright (C) 2016 Intel Corporation. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * * Redistributions of source code must retain the above copyright
 *   notice, this list of conditions and the following disclaimer.
 * * Redistributions in binary form must reproduce the above copyright
 *   notice, this list of conditions and the following disclaimer in
 *   the documentation and/or other materials provided with the
 *   distribution.
 * * Neither the name of Intel Corporation nor the names of its
 *   contributors may be used to endorse or promote products derived
 *   from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 *
 * Author Name
 *   History:
 *   03-14-2016 Initial version. numerics svn rev. 12864
 */

/*
 * Syntax: GNU as, AT&T operand order.  Target: x86-64.
 * The argument is read from the caller's stack and the result is left in
 * x87 %st(0), which matches the System V AMD64 treatment of long double.
 */

        .file   "sqrtl.c"

/* ---- Stack frame (offsets from %rsp once the frame is allocated) ------ */
/* 0(%rsp) is an 8-byte scratch double used only on the invalid path.      */
        .set    FRAME_SIZE,     56
        .set    FR_CW_TEMP,      8      /* 16-bit control word with precision forced */
        .set    FR_CW_SAVED,    10      /* 16-bit control word found on entry */
        .set    FR_RESULT,      16      /* 80-bit staging slot for the return value */
        .set    FR_ARG_COPY,    32      /* 80-bit private copy of the argument */
        .set    FR_ARG,         64      /* argument: low 32 bits of the significand */
        .set    FR_ARG_MANT_HI, 68      /* argument: high 32 bits of the significand */
        .set    FR_ARG_SIGNEXP, 72      /* argument: 16-bit sign + exponent word */

/* ---- Bit patterns ----------------------------------------------------- */
        .set    EXP_MASK,       32767           /* 0x7fff: exponent field / all-ones exponent */
        .set    SIGN_IN_BYTE,   -128            /* 0x80: sign bit within the top byte */
        .set    MANT_INT_BIT,   -2147483648     /* 0x80000000: only the integer bit set */
        .set    CW_PC_MASK,     768             /* 0x0300: x87 precision-control field */
        .set    CW_PC_FORCE,    -64768          /* 0xffff0300: OR mask, low 16 bits are stored */

/*
 * FORCE_EXT_PRECISION already_ext
 *   Reloads the saved control word; if both precision-control bits are
 *   already set, branches to \already_ext without touching the FPU.
 *   Otherwise sets both bits, stores the new word in FR_CW_TEMP and loads it.
 *   Clobbers: %eax, %edx, flags.
 */
        .macro  FORCE_EXT_PRECISION already_ext
        movzwl  FR_CW_SAVED(%rsp), %edx
        movl    %edx, %eax
        andl    $CW_PC_MASK, %eax
        cmpl    $CW_PC_MASK, %eax
        je      \already_ext
        orl     $CW_PC_FORCE, %edx
        movw    %dx, FR_CW_TEMP(%rsp)
        fldcw   FR_CW_TEMP(%rsp)
        .endm

/*
 * RETURN_ST0 slot
 *   Loads the 80-bit value at \slot(%rsp) into %st(0), releases the frame
 *   and returns.  The trailing CFI directive re-establishes the in-frame
 *   CFA offset for whatever code follows the expansion.
 */
        .macro  RETURN_ST0 slot
        fldt    \slot(%rsp)
        addq    $FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 8
        ret
        .cfi_def_cfa_offset 64
        .endm

        .text
/* -- Begin sqrtl */
        .align  16,0x90
        .globl  sqrtl

/*-----------------------------------------------------------------------
 * long double sqrtl(long double x)
 *
 * In:     x on the stack, at 8(%rsp) on entry (FR_ARG once the frame is
 *         allocated).
 * Out:    result in %st(0).
 * Clobb:  %rax, %rdx, %cl, %xmm0, flags, 56 bytes of local stack.
 *         The x87 control word is changed only temporarily and is restored
 *         before returning.
 *
 * Paths:
 *   - x non-negative (including +inf): fsqrt, with the x87 precision
 *     control forced to 0x300 (64-bit significand) if it was not already.
 *   - x is -0 (sign set, exponent and significand all zero): x is returned
 *     unchanged.
 *   - any other negative x (including -inf): returns (+inf * +0.0)
 *     computed in SSE, i.e. a NaN.
 *   - exponent all ones and significand != 0x8000000000000000: x * 1.0 is
 *     returned (presumably so that a signaling NaN comes back quiet).
 *
 * %cl is a flag: non-zero means "the control word was replaced and must be
 * restored".  %eax holds the masked exponent from entry until the sign
 * test has been resolved.
 *-----------------------------------------------------------------------*/
sqrtl:
        .cfi_startproc
        subq    $FRAME_SIZE, %rsp
        .cfi_def_cfa_offset 64
        xorb    %cl, %cl                        /* control word untouched so far */
        fldt    FR_ARG(%rsp)
        fstpt   FR_ARG_COPY(%rsp)               /* private copy of x */
        fnstcw  FR_CW_SAVED(%rsp)

        movzwl  FR_ARG_SIGNEXP(%rsp), %eax
        andl    $EXP_MASK, %eax                 /* eax = biased exponent */
        cmpl    $EXP_MASK, %eax
        je      .Lexp_all_ones                  /* infinity or NaN */

.Lcheck_sign:
        testb   $SIGN_IN_BYTE, FR_ARG_SIGNEXP+1(%rsp)
        jne     .Lnegative

        /* ---- x >= 0: the ordinary square root ------------------------- */
        FORCE_EXT_PRECISION .Ldo_sqrt
        movb    $1, %cl                         /* remember to restore the control word */
.Ldo_sqrt:
        fldt    FR_ARG_COPY(%rsp)
        fsqrt
        fstpt   FR_RESULT(%rsp)
        testb   %cl, %cl
        je      .Lsqrt_done
        fldcw   FR_CW_SAVED(%rsp)
.Lsqrt_done:
        RETURN_ST0 FR_RESULT

        /* ---- sign bit set --------------------------------------------- */
.Lnegative:
        testl   %eax, %eax                      /* exponent == 0 ? */
        jne     .Linvalid
        cmpq    $0, FR_ARG(%rsp)                /* whole 64-bit significand == 0 ? */
        jne     .Linvalid
        RETURN_ST0 FR_ARG                       /* x is -0: hand it back as is */

        /* ---- negative non-zero argument: produce inf * 0 --------------- */
.Linvalid:
        FORCE_EXT_PRECISION .Lmake_nan
        movb    $1, %cl
.Lmake_nan:
        lea     _infs(%rip), %rax
        lea     _zeros(%rip), %rdx
        testb   %cl, %cl                        /* flags are consumed by the je below;  */
        movsd   (%rax), %xmm0                   /* none of the moves, the multiply, or  */
        mulsd   (%rdx), %xmm0                   /* the x87 load/store in between writes */
        movsd   %xmm0, (%rsp)                   /* EFLAGS                               */
        fldl    (%rsp)
        fstpt   FR_RESULT(%rsp)
        je      .Lnan_done
        fldcw   FR_CW_SAVED(%rsp)
.Lnan_done:
        RETURN_ST0 FR_RESULT

        /* ---- exponent field is all ones -------------------------------- */
.Lexp_all_ones:
        cmpl    $MANT_INT_BIT, FR_ARG_MANT_HI(%rsp)
        jne     .Lnan_input
        cmpl    $0, FR_ARG(%rsp)
        je      .Lcheck_sign                    /* exactly infinity: sign decides */

.Lnan_input:
        FORCE_EXT_PRECISION .Ltimes_one_no_restore
        fldt    FR_ARG(%rsp)
        lea     _ones(%rip), %rax
        fmull   (%rax)                          /* x * 1.0 */
        fstpt   FR_RESULT(%rsp)
        fldcw   FR_CW_SAVED(%rsp)
.Ltimes_one_done:
        RETURN_ST0 FR_RESULT

        /* Same multiply, for the case where the control word was left alone. */
.Ltimes_one_no_restore:
        fldt    FR_ARG(%rsp)
        lea     _ones(%rip), %rax
        fmull   (%rax)
        fstpt   FR_RESULT(%rsp)
        jmp     .Ltimes_one_done
        .align  16,0x90
        .cfi_endproc
        .type   sqrtl,@function
        .size   sqrtl,.-sqrtl
        .data
/* -- End sqrtl */

/*
 * Constant tables.  Each holds two IEEE-754 doubles written as
 * little-endian (low word, high word) pairs.  The code above reads only
 * the first entry of each table.
 */
        .section .rodata, "a"
        .align  4
_infs:
        .long   0x00000000, 0x7ff00000          /* +inf */
        .long   0x00000000, 0xfff00000          /* -inf */
        .type   _infs,@object
        .size   _infs,16
        .align  4
_zeros:
        .long   0x00000000, 0x00000000          /* +0.0 */
        .long   0x00000000, 0x80000000          /* -0.0 */
        .type   _zeros,@object
        .size   _zeros,16
        .align  4
_ones:
        .long   0x00000000, 0x3ff00000          /* +1.0 */
        .long   0x00000000, 0xbff00000          /* -1.0 */
        .type   _ones,@object
        .size   _ones,16
        .data
        .section .note.GNU-stack, ""
/* -- Begin DWARF2 SEGMENT .eh_frame */
        .section .eh_frame,"a",@progbits
.eh_frame_seg:
        .align  1
/* End */