356 lines
14 KiB
LLVM
356 lines
14 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=i686-linux-gnu -fast-isel | FileCheck %s --check-prefixes=X86,FASTISEL-X86
|
|
; RUN: llc < %s -mtriple=x86_64-linux-gnu -fast-isel | FileCheck %s --check-prefixes=X64,FASTISEL-X64
|
|
; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=0 -fast-isel=0 | FileCheck %s --check-prefixes=X86,SDAG-X86
|
|
; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=0 -fast-isel=0 | FileCheck %s --check-prefixes=X64,SDAG-X64
|
|
; TODO: The below RUN line will fails GISEL selection and will fallback to DAG selection due to lack of support for loads/stores in i686 mode, support is expected soon enough, for this reason the llvm/test/CodeGen/X86/GlobalISel/llvm.sincos.mir test is added for now because of the lack of support for i686 in GlobalISel.
|
|
; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=1 -global-isel-abort=2 | FileCheck %s --check-prefixes=GISEL-X86
|
|
; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=1 -global-isel-abort=1 | FileCheck %s --check-prefixes=GISEL-X64
|
|
|
|
define { float, float } @test_sincos_f32(float %Val) nounwind {
|
|
; X86-LABEL: test_sincos_f32:
|
|
; X86: # %bb.0:
|
|
; X86-NEXT: subl $28, %esp
|
|
; X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: fstps (%esp)
|
|
; X86-NEXT: calll sincosf
|
|
; X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; X86-NEXT: addl $28, %esp
|
|
; X86-NEXT: retl
|
|
;
|
|
; X64-LABEL: test_sincos_f32:
|
|
; X64: # %bb.0:
|
|
; X64-NEXT: pushq %rax
|
|
; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; X64-NEXT: movq %rsp, %rsi
|
|
; X64-NEXT: callq sincosf@PLT
|
|
; X64-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
|
|
; X64-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
|
|
; X64-NEXT: popq %rax
|
|
; X64-NEXT: retq
|
|
;
|
|
; GISEL-X86-LABEL: test_sincos_f32:
|
|
; GISEL-X86: # %bb.0:
|
|
; GISEL-X86-NEXT: subl $28, %esp
|
|
; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %eax
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %ecx
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %edx
|
|
; GISEL-X86-NEXT: movl %eax, (%esp)
|
|
; GISEL-X86-NEXT: movl %ecx, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: movl %edx, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: calll sincosf
|
|
; GISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: fxch %st(1)
|
|
; GISEL-X86-NEXT: addl $28, %esp
|
|
; GISEL-X86-NEXT: retl
|
|
;
|
|
; GISEL-X64-LABEL: test_sincos_f32:
|
|
; GISEL-X64: # %bb.0:
|
|
; GISEL-X64-NEXT: pushq %rax
|
|
; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; GISEL-X64-NEXT: movq %rsp, %rsi
|
|
; GISEL-X64-NEXT: callq sincosf
|
|
; GISEL-X64-NEXT: movl {{[0-9]+}}(%rsp), %eax
|
|
; GISEL-X64-NEXT: movl (%rsp), %ecx
|
|
; GISEL-X64-NEXT: movd %eax, %xmm0
|
|
; GISEL-X64-NEXT: movd %ecx, %xmm1
|
|
; GISEL-X64-NEXT: popq %rax
|
|
; GISEL-X64-NEXT: retq
|
|
%res = call { float, float } @llvm.sincos.f32(float %Val)
|
|
ret { float, float } %res
|
|
}
|
|
|
|
define { double, double } @test_sincos_f64(double %Val) nounwind {
|
|
; X86-LABEL: test_sincos_f64:
|
|
; X86: # %bb.0:
|
|
; X86-NEXT: subl $44, %esp
|
|
; X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: fstpl (%esp)
|
|
; X86-NEXT: calll sincos
|
|
; X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; X86-NEXT: addl $44, %esp
|
|
; X86-NEXT: retl
|
|
;
|
|
; X64-LABEL: test_sincos_f64:
|
|
; X64: # %bb.0:
|
|
; X64-NEXT: subq $24, %rsp
|
|
; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
|
|
; X64-NEXT: callq sincos@PLT
|
|
; X64-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero
|
|
; X64-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
|
|
; X64-NEXT: addq $24, %rsp
|
|
; X64-NEXT: retq
|
|
;
|
|
; GISEL-X86-LABEL: test_sincos_f64:
|
|
; GISEL-X86: # %bb.0:
|
|
; GISEL-X86-NEXT: subl $44, %esp
|
|
; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: fstpl (%esp)
|
|
; GISEL-X86-NEXT: calll sincos
|
|
; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: addl $44, %esp
|
|
; GISEL-X86-NEXT: retl
|
|
;
|
|
; GISEL-X64-LABEL: test_sincos_f64:
|
|
; GISEL-X64: # %bb.0:
|
|
; GISEL-X64-NEXT: subq $24, %rsp
|
|
; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
|
|
; GISEL-X64-NEXT: callq sincos
|
|
; GISEL-X64-NEXT: movq {{[0-9]+}}(%rsp), %rax
|
|
; GISEL-X64-NEXT: movq {{[0-9]+}}(%rsp), %rcx
|
|
; GISEL-X64-NEXT: movq %rax, %xmm0
|
|
; GISEL-X64-NEXT: movq %rcx, %xmm1
|
|
; GISEL-X64-NEXT: addq $24, %rsp
|
|
; GISEL-X64-NEXT: retq
|
|
%res = call { double, double } @llvm.sincos.f64(double %Val)
|
|
ret { double, double } %res
|
|
}
|
|
|
|
define { x86_fp80, x86_fp80 } @test_sincos_f80(x86_fp80 %Val) nounwind {
|
|
; X86-LABEL: test_sincos_f80:
|
|
; X86: # %bb.0:
|
|
; X86-NEXT: subl $44, %esp
|
|
; X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; X86-NEXT: fstpt (%esp)
|
|
; X86-NEXT: calll sincosl
|
|
; X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; X86-NEXT: addl $44, %esp
|
|
; X86-NEXT: retl
|
|
;
|
|
; X64-LABEL: test_sincos_f80:
|
|
; X64: # %bb.0:
|
|
; X64-NEXT: subq $56, %rsp
|
|
; X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; X64-NEXT: fstpt (%rsp)
|
|
; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
|
|
; X64-NEXT: callq sincosl@PLT
|
|
; X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; X64-NEXT: addq $56, %rsp
|
|
; X64-NEXT: retq
|
|
;
|
|
; GISEL-X86-LABEL: test_sincos_f80:
|
|
; GISEL-X86: # %bb.0:
|
|
; GISEL-X86-NEXT: subl $60, %esp
|
|
; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %ecx
|
|
; GISEL-X86-NEXT: fstpt (%esp)
|
|
; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: movl %ecx, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: calll sincosl
|
|
; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: fxch %st(1)
|
|
; GISEL-X86-NEXT: addl $60, %esp
|
|
; GISEL-X86-NEXT: retl
|
|
;
|
|
; GISEL-X64-LABEL: test_sincos_f80:
|
|
; GISEL-X64: # %bb.0:
|
|
; GISEL-X64-NEXT: subq $56, %rsp
|
|
; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
|
|
; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
|
|
; GISEL-X64-NEXT: fstpt (%rsp)
|
|
; GISEL-X64-NEXT: callq sincosl
|
|
; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
|
|
; GISEL-X64-NEXT: fxch %st(1)
|
|
; GISEL-X64-NEXT: addq $56, %rsp
|
|
; GISEL-X64-NEXT: retq
|
|
%res = call { x86_fp80, x86_fp80 } @llvm.sincos.f80(x86_fp80 %Val)
|
|
ret { x86_fp80, x86_fp80 } %res
|
|
}
|
|
|
|
declare void @foo(ptr, ptr)
|
|
|
|
define void @can_fold_with_call_in_chain(float %x, ptr noalias %a, ptr noalias %b) nounwind {
|
|
; FASTISEL-X86-LABEL: can_fold_with_call_in_chain:
|
|
; FASTISEL-X86: # %bb.0: # %entry
|
|
; FASTISEL-X86-NEXT: pushl %edi
|
|
; FASTISEL-X86-NEXT: pushl %esi
|
|
; FASTISEL-X86-NEXT: subl $20, %esp
|
|
; FASTISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
|
|
; FASTISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
|
|
; FASTISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; FASTISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
|
|
; FASTISEL-X86-NEXT: movl %esi, {{[0-9]+}}(%esp)
|
|
; FASTISEL-X86-NEXT: movl %edi, (%esp)
|
|
; FASTISEL-X86-NEXT: calll foo@PLT
|
|
; FASTISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; FASTISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; FASTISEL-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
|
|
; FASTISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
|
|
; FASTISEL-X86-NEXT: fstps (%esp)
|
|
; FASTISEL-X86-NEXT: calll sincosf
|
|
; FASTISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; FASTISEL-X86-NEXT: fstps (%esi)
|
|
; FASTISEL-X86-NEXT: addl $20, %esp
|
|
; FASTISEL-X86-NEXT: popl %esi
|
|
; FASTISEL-X86-NEXT: popl %edi
|
|
; FASTISEL-X86-NEXT: retl
|
|
;
|
|
; FASTISEL-X64-LABEL: can_fold_with_call_in_chain:
|
|
; FASTISEL-X64: # %bb.0: # %entry
|
|
; FASTISEL-X64-NEXT: pushq %r14
|
|
; FASTISEL-X64-NEXT: pushq %rbx
|
|
; FASTISEL-X64-NEXT: pushq %rax
|
|
; FASTISEL-X64-NEXT: movq %rsi, %rbx
|
|
; FASTISEL-X64-NEXT: movq %rdi, %r14
|
|
; FASTISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
|
|
; FASTISEL-X64-NEXT: callq sinf@PLT
|
|
; FASTISEL-X64-NEXT: movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
|
|
; FASTISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
|
|
; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; FASTISEL-X64-NEXT: callq cosf@PLT
|
|
; FASTISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
|
|
; FASTISEL-X64-NEXT: movq %r14, %rdi
|
|
; FASTISEL-X64-NEXT: movq %rbx, %rsi
|
|
; FASTISEL-X64-NEXT: callq foo@PLT
|
|
; FASTISEL-X64-NEXT: movss {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Reload
|
|
; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; FASTISEL-X64-NEXT: movss %xmm0, (%r14)
|
|
; FASTISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
|
|
; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; FASTISEL-X64-NEXT: movss %xmm0, (%rbx)
|
|
; FASTISEL-X64-NEXT: addq $8, %rsp
|
|
; FASTISEL-X64-NEXT: popq %rbx
|
|
; FASTISEL-X64-NEXT: popq %r14
|
|
; FASTISEL-X64-NEXT: retq
|
|
;
|
|
; SDAG-X86-LABEL: can_fold_with_call_in_chain:
|
|
; SDAG-X86: # %bb.0: # %entry
|
|
; SDAG-X86-NEXT: pushl %edi
|
|
; SDAG-X86-NEXT: pushl %esi
|
|
; SDAG-X86-NEXT: subl $20, %esp
|
|
; SDAG-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; SDAG-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
|
|
; SDAG-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
|
|
; SDAG-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
|
|
; SDAG-X86-NEXT: movl %esi, {{[0-9]+}}(%esp)
|
|
; SDAG-X86-NEXT: movl %edi, (%esp)
|
|
; SDAG-X86-NEXT: calll foo@PLT
|
|
; SDAG-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
|
|
; SDAG-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
|
|
; SDAG-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
|
|
; SDAG-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
|
|
; SDAG-X86-NEXT: fstps (%esp)
|
|
; SDAG-X86-NEXT: calll sincosf
|
|
; SDAG-X86-NEXT: flds {{[0-9]+}}(%esp)
|
|
; SDAG-X86-NEXT: fstps (%esi)
|
|
; SDAG-X86-NEXT: addl $20, %esp
|
|
; SDAG-X86-NEXT: popl %esi
|
|
; SDAG-X86-NEXT: popl %edi
|
|
; SDAG-X86-NEXT: retl
|
|
;
|
|
; SDAG-X64-LABEL: can_fold_with_call_in_chain:
|
|
; SDAG-X64: # %bb.0: # %entry
|
|
; SDAG-X64-NEXT: pushq %r14
|
|
; SDAG-X64-NEXT: pushq %rbx
|
|
; SDAG-X64-NEXT: pushq %rax
|
|
; SDAG-X64-NEXT: movq %rsi, %rbx
|
|
; SDAG-X64-NEXT: movq %rdi, %r14
|
|
; SDAG-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
|
|
; SDAG-X64-NEXT: callq foo@PLT
|
|
; SDAG-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
|
|
; SDAG-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
|
|
; SDAG-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; SDAG-X64-NEXT: movq %r14, %rdi
|
|
; SDAG-X64-NEXT: callq sincosf@PLT
|
|
; SDAG-X64-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
|
|
; SDAG-X64-NEXT: movss %xmm0, (%rbx)
|
|
; SDAG-X64-NEXT: addq $8, %rsp
|
|
; SDAG-X64-NEXT: popq %rbx
|
|
; SDAG-X64-NEXT: popq %r14
|
|
; SDAG-X64-NEXT: retq
|
|
;
|
|
; GISEL-X86-LABEL: can_fold_with_call_in_chain:
|
|
; GISEL-X86: # %bb.0: # %entry
|
|
; GISEL-X86-NEXT: pushl %ebx
|
|
; GISEL-X86-NEXT: pushl %edi
|
|
; GISEL-X86-NEXT: pushl %esi
|
|
; GISEL-X86-NEXT: subl $16, %esp
|
|
; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
|
|
; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
|
|
; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
|
|
; GISEL-X86-NEXT: movl %ebx, (%esp)
|
|
; GISEL-X86-NEXT: calll sinf
|
|
; GISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
|
|
; GISEL-X86-NEXT: movl %ebx, (%esp)
|
|
; GISEL-X86-NEXT: calll cosf
|
|
; GISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
|
|
; GISEL-X86-NEXT: movl %esi, (%esp)
|
|
; GISEL-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
|
|
; GISEL-X86-NEXT: calll foo
|
|
; GISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
|
|
; GISEL-X86-NEXT: fstps (%esi)
|
|
; GISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
|
|
; GISEL-X86-NEXT: fstps (%edi)
|
|
; GISEL-X86-NEXT: addl $16, %esp
|
|
; GISEL-X86-NEXT: popl %esi
|
|
; GISEL-X86-NEXT: popl %edi
|
|
; GISEL-X86-NEXT: popl %ebx
|
|
; GISEL-X86-NEXT: retl
|
|
;
|
|
; GISEL-X64-LABEL: can_fold_with_call_in_chain:
|
|
; GISEL-X64: # %bb.0: # %entry
|
|
; GISEL-X64-NEXT: pushq %r14
|
|
; GISEL-X64-NEXT: pushq %rbx
|
|
; GISEL-X64-NEXT: pushq %rax
|
|
; GISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
|
|
; GISEL-X64-NEXT: movq %rdi, %rbx
|
|
; GISEL-X64-NEXT: movq %rsi, %r14
|
|
; GISEL-X64-NEXT: callq sinf
|
|
; GISEL-X64-NEXT: movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
|
|
; GISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
|
|
; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; GISEL-X64-NEXT: callq cosf
|
|
; GISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
|
|
; GISEL-X64-NEXT: movq %rbx, %rdi
|
|
; GISEL-X64-NEXT: movq %r14, %rsi
|
|
; GISEL-X64-NEXT: callq foo
|
|
; GISEL-X64-NEXT: movd {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Folded Reload
|
|
; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; GISEL-X64-NEXT: movd %xmm0, %eax
|
|
; GISEL-X64-NEXT: movl %eax, (%rbx)
|
|
; GISEL-X64-NEXT: movd (%rsp), %xmm0 # 4-byte Folded Reload
|
|
; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
|
|
; GISEL-X64-NEXT: movd %xmm0, %eax
|
|
; GISEL-X64-NEXT: movl %eax, (%r14)
|
|
; GISEL-X64-NEXT: addq $8, %rsp
|
|
; GISEL-X64-NEXT: popq %rbx
|
|
; GISEL-X64-NEXT: popq %r14
|
|
; GISEL-X64-NEXT: retq
|
|
entry:
|
|
%sin = tail call float @llvm.sin.f32(float %x)
|
|
%cos = tail call float @llvm.cos.f32(float %x)
|
|
call void @foo(ptr %a, ptr %b)
|
|
store float %sin, ptr %a, align 4
|
|
store float %cos, ptr %b, align 4
|
|
ret void
|
|
}
|