llvm-project/llvm/test/CodeGen/X86/llvm.sincos.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-linux-gnu -fast-isel  | FileCheck %s --check-prefixes=X86,FASTISEL-X86
; RUN: llc < %s -mtriple=x86_64-linux-gnu -fast-isel  | FileCheck %s --check-prefixes=X64,FASTISEL-X64
; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=0 -fast-isel=0  | FileCheck %s --check-prefixes=X86,SDAG-X86
; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=0 -fast-isel=0  | FileCheck %s --check-prefixes=X64,SDAG-X64
; TODO: The below RUN line will fails GISEL selection and will fallback to DAG selection due to lack of support for loads/stores in i686 mode, support is expected soon enough, for this reason the llvm/test/CodeGen/X86/GlobalISel/llvm.sincos.mir test is added for now because of the lack of support for i686 in GlobalISel.
; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=1 -global-isel-abort=2 | FileCheck %s --check-prefixes=GISEL-X86
; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=1 -global-isel-abort=1 | FileCheck %s --check-prefixes=GISEL-X64

define { float, float } @test_sincos_f32(float %Val) nounwind {
; X86-LABEL: test_sincos_f32:
; X86:       # %bb.0:
; X86-NEXT:    subl $28, %esp
; X86-NEXT:    flds {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    fstps (%esp)
; X86-NEXT:    calll sincosf
; X86-NEXT:    flds {{[0-9]+}}(%esp)
; X86-NEXT:    flds {{[0-9]+}}(%esp)
; X86-NEXT:    addl $28, %esp
; X86-NEXT:    retl
;
; X64-LABEL: test_sincos_f32:
; X64:       # %bb.0:
; X64-NEXT:    pushq %rax
; X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; X64-NEXT:    movq %rsp, %rsi
; X64-NEXT:    callq sincosf@PLT
; X64-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
; X64-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
; X64-NEXT:    popq %rax
; X64-NEXT:    retq
;
; GISEL-X86-LABEL: test_sincos_f32:
; GISEL-X86:       # %bb.0:
; GISEL-X86-NEXT:    subl $28, %esp
; GISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %ecx
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %edx
; GISEL-X86-NEXT:    movl %eax, (%esp)
; GISEL-X86-NEXT:    movl %ecx, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    movl %edx, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    calll sincosf
; GISEL-X86-NEXT:    flds {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    flds {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    fxch %st(1)
; GISEL-X86-NEXT:    addl $28, %esp
; GISEL-X86-NEXT:    retl
;
; GISEL-X64-LABEL: test_sincos_f32:
; GISEL-X64:       # %bb.0:
; GISEL-X64-NEXT:    pushq %rax
; GISEL-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; GISEL-X64-NEXT:    movq %rsp, %rsi
; GISEL-X64-NEXT:    callq sincosf
; GISEL-X64-NEXT:    movl {{[0-9]+}}(%rsp), %eax
; GISEL-X64-NEXT:    movl (%rsp), %ecx
; GISEL-X64-NEXT:    movd %eax, %xmm0
; GISEL-X64-NEXT:    movd %ecx, %xmm1
; GISEL-X64-NEXT:    popq %rax
; GISEL-X64-NEXT:    retq
  %res = call { float, float } @llvm.sincos.f32(float %Val)
  ret { float, float } %res
}

define { double, double } @test_sincos_f64(double %Val) nounwind  {
; X86-LABEL: test_sincos_f64:
; X86:       # %bb.0:
; X86-NEXT:    subl $44, %esp
; X86-NEXT:    fldl {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    fstpl (%esp)
; X86-NEXT:    calll sincos
; X86-NEXT:    fldl {{[0-9]+}}(%esp)
; X86-NEXT:    fldl {{[0-9]+}}(%esp)
; X86-NEXT:    addl $44, %esp
; X86-NEXT:    retl
;
; X64-LABEL: test_sincos_f64:
; X64:       # %bb.0:
; X64-NEXT:    subq $24, %rsp
; X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rsi
; X64-NEXT:    callq sincos@PLT
; X64-NEXT:    movsd {{.*#+}} xmm0 = mem[0],zero
; X64-NEXT:    movsd {{.*#+}} xmm1 = mem[0],zero
; X64-NEXT:    addq $24, %rsp
; X64-NEXT:    retq
;
; GISEL-X86-LABEL: test_sincos_f64:
; GISEL-X86:       # %bb.0:
; GISEL-X86-NEXT:    subl $44, %esp
; GISEL-X86-NEXT:    fldl {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; GISEL-X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; GISEL-X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    fstpl (%esp)
; GISEL-X86-NEXT:    calll sincos
; GISEL-X86-NEXT:    fldl {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    fldl {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    addl $44, %esp
; GISEL-X86-NEXT:    retl
;
; GISEL-X64-LABEL: test_sincos_f64:
; GISEL-X64:       # %bb.0:
; GISEL-X64-NEXT:    subq $24, %rsp
; GISEL-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; GISEL-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rsi
; GISEL-X64-NEXT:    callq sincos
; GISEL-X64-NEXT:    movq {{[0-9]+}}(%rsp), %rax
; GISEL-X64-NEXT:    movq {{[0-9]+}}(%rsp), %rcx
; GISEL-X64-NEXT:    movq %rax, %xmm0
; GISEL-X64-NEXT:    movq %rcx, %xmm1
; GISEL-X64-NEXT:    addq $24, %rsp
; GISEL-X64-NEXT:    retq
  %res = call { double, double } @llvm.sincos.f64(double %Val)
  ret { double, double } %res
}

define { x86_fp80, x86_fp80 } @test_sincos_f80(x86_fp80 %Val) nounwind {
; X86-LABEL: test_sincos_f80:
; X86:       # %bb.0:
; X86-NEXT:    subl $44, %esp
; X86-NEXT:    fldt {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; X86-NEXT:    fstpt (%esp)
; X86-NEXT:    calll sincosl
; X86-NEXT:    fldt {{[0-9]+}}(%esp)
; X86-NEXT:    fldt {{[0-9]+}}(%esp)
; X86-NEXT:    addl $44, %esp
; X86-NEXT:    retl
;
; X64-LABEL: test_sincos_f80:
; X64:       # %bb.0:
; X64-NEXT:    subq $56, %rsp
; X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; X64-NEXT:    fstpt (%rsp)
; X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rsi
; X64-NEXT:    callq sincosl@PLT
; X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; X64-NEXT:    addq $56, %rsp
; X64-NEXT:    retq
;
; GISEL-X86-LABEL: test_sincos_f80:
; GISEL-X86:       # %bb.0:
; GISEL-X86-NEXT:    subl $60, %esp
; GISEL-X86-NEXT:    fldt {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; GISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %ecx
; GISEL-X86-NEXT:    fstpt (%esp)
; GISEL-X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    movl %ecx, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    calll sincosl
; GISEL-X86-NEXT:    fldt {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    fldt {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    fxch %st(1)
; GISEL-X86-NEXT:    addl $60, %esp
; GISEL-X86-NEXT:    retl
;
; GISEL-X64-LABEL: test_sincos_f80:
; GISEL-X64:       # %bb.0:
; GISEL-X64-NEXT:    subq $56, %rsp
; GISEL-X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; GISEL-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rdi
; GISEL-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rsi
; GISEL-X64-NEXT:    fstpt (%rsp)
; GISEL-X64-NEXT:    callq sincosl
; GISEL-X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; GISEL-X64-NEXT:    fldt {{[0-9]+}}(%rsp)
; GISEL-X64-NEXT:    fxch %st(1)
; GISEL-X64-NEXT:    addq $56, %rsp
; GISEL-X64-NEXT:    retq
  %res = call { x86_fp80, x86_fp80 } @llvm.sincos.f80(x86_fp80 %Val)
  ret { x86_fp80, x86_fp80 } %res
}

declare void @foo(ptr, ptr)

define void @can_fold_with_call_in_chain(float %x, ptr noalias %a, ptr noalias %b) nounwind {
; FASTISEL-X86-LABEL: can_fold_with_call_in_chain:
; FASTISEL-X86:       # %bb.0: # %entry
; FASTISEL-X86-NEXT:    pushl %edi
; FASTISEL-X86-NEXT:    pushl %esi
; FASTISEL-X86-NEXT:    subl $20, %esp
; FASTISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; FASTISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %edi
; FASTISEL-X86-NEXT:    flds {{[0-9]+}}(%esp)
; FASTISEL-X86-NEXT:    fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
; FASTISEL-X86-NEXT:    movl %esi, {{[0-9]+}}(%esp)
; FASTISEL-X86-NEXT:    movl %edi, (%esp)
; FASTISEL-X86-NEXT:    calll foo@PLT
; FASTISEL-X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; FASTISEL-X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; FASTISEL-X86-NEXT:    movl %edi, {{[0-9]+}}(%esp)
; FASTISEL-X86-NEXT:    flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
; FASTISEL-X86-NEXT:    fstps (%esp)
; FASTISEL-X86-NEXT:    calll sincosf
; FASTISEL-X86-NEXT:    flds {{[0-9]+}}(%esp)
; FASTISEL-X86-NEXT:    fstps (%esi)
; FASTISEL-X86-NEXT:    addl $20, %esp
; FASTISEL-X86-NEXT:    popl %esi
; FASTISEL-X86-NEXT:    popl %edi
; FASTISEL-X86-NEXT:    retl
;
; FASTISEL-X64-LABEL: can_fold_with_call_in_chain:
; FASTISEL-X64:       # %bb.0: # %entry
; FASTISEL-X64-NEXT:    pushq %r14
; FASTISEL-X64-NEXT:    pushq %rbx
; FASTISEL-X64-NEXT:    pushq %rax
; FASTISEL-X64-NEXT:    movq %rsi, %rbx
; FASTISEL-X64-NEXT:    movq %rdi, %r14
; FASTISEL-X64-NEXT:    movss %xmm0, (%rsp) # 4-byte Spill
; FASTISEL-X64-NEXT:    callq sinf@PLT
; FASTISEL-X64-NEXT:    movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
; FASTISEL-X64-NEXT:    movss (%rsp), %xmm0 # 4-byte Reload
; FASTISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; FASTISEL-X64-NEXT:    callq cosf@PLT
; FASTISEL-X64-NEXT:    movss %xmm0, (%rsp) # 4-byte Spill
; FASTISEL-X64-NEXT:    movq %r14, %rdi
; FASTISEL-X64-NEXT:    movq %rbx, %rsi
; FASTISEL-X64-NEXT:    callq foo@PLT
; FASTISEL-X64-NEXT:    movss {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Reload
; FASTISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; FASTISEL-X64-NEXT:    movss %xmm0, (%r14)
; FASTISEL-X64-NEXT:    movss (%rsp), %xmm0 # 4-byte Reload
; FASTISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; FASTISEL-X64-NEXT:    movss %xmm0, (%rbx)
; FASTISEL-X64-NEXT:    addq $8, %rsp
; FASTISEL-X64-NEXT:    popq %rbx
; FASTISEL-X64-NEXT:    popq %r14
; FASTISEL-X64-NEXT:    retq
;
; SDAG-X86-LABEL: can_fold_with_call_in_chain:
; SDAG-X86:       # %bb.0: # %entry
; SDAG-X86-NEXT:    pushl %edi
; SDAG-X86-NEXT:    pushl %esi
; SDAG-X86-NEXT:    subl $20, %esp
; SDAG-X86-NEXT:    flds {{[0-9]+}}(%esp)
; SDAG-X86-NEXT:    fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
; SDAG-X86-NEXT:    movl {{[0-9]+}}(%esp), %edi
; SDAG-X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; SDAG-X86-NEXT:    movl %esi, {{[0-9]+}}(%esp)
; SDAG-X86-NEXT:    movl %edi, (%esp)
; SDAG-X86-NEXT:    calll foo@PLT
; SDAG-X86-NEXT:    leal {{[0-9]+}}(%esp), %eax
; SDAG-X86-NEXT:    movl %eax, {{[0-9]+}}(%esp)
; SDAG-X86-NEXT:    movl %edi, {{[0-9]+}}(%esp)
; SDAG-X86-NEXT:    flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
; SDAG-X86-NEXT:    fstps (%esp)
; SDAG-X86-NEXT:    calll sincosf
; SDAG-X86-NEXT:    flds {{[0-9]+}}(%esp)
; SDAG-X86-NEXT:    fstps (%esi)
; SDAG-X86-NEXT:    addl $20, %esp
; SDAG-X86-NEXT:    popl %esi
; SDAG-X86-NEXT:    popl %edi
; SDAG-X86-NEXT:    retl
;
; SDAG-X64-LABEL: can_fold_with_call_in_chain:
; SDAG-X64:       # %bb.0: # %entry
; SDAG-X64-NEXT:    pushq %r14
; SDAG-X64-NEXT:    pushq %rbx
; SDAG-X64-NEXT:    pushq %rax
; SDAG-X64-NEXT:    movq %rsi, %rbx
; SDAG-X64-NEXT:    movq %rdi, %r14
; SDAG-X64-NEXT:    movss %xmm0, (%rsp) # 4-byte Spill
; SDAG-X64-NEXT:    callq foo@PLT
; SDAG-X64-NEXT:    leaq {{[0-9]+}}(%rsp), %rsi
; SDAG-X64-NEXT:    movss (%rsp), %xmm0 # 4-byte Reload
; SDAG-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; SDAG-X64-NEXT:    movq %r14, %rdi
; SDAG-X64-NEXT:    callq sincosf@PLT
; SDAG-X64-NEXT:    movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
; SDAG-X64-NEXT:    movss %xmm0, (%rbx)
; SDAG-X64-NEXT:    addq $8, %rsp
; SDAG-X64-NEXT:    popq %rbx
; SDAG-X64-NEXT:    popq %r14
; SDAG-X64-NEXT:    retq
;
; GISEL-X86-LABEL: can_fold_with_call_in_chain:
; GISEL-X86:       # %bb.0: # %entry
; GISEL-X86-NEXT:    pushl %ebx
; GISEL-X86-NEXT:    pushl %edi
; GISEL-X86-NEXT:    pushl %esi
; GISEL-X86-NEXT:    subl $16, %esp
; GISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %ebx
; GISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %esi
; GISEL-X86-NEXT:    movl {{[0-9]+}}(%esp), %edi
; GISEL-X86-NEXT:    movl %ebx, (%esp)
; GISEL-X86-NEXT:    calll sinf
; GISEL-X86-NEXT:    fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
; GISEL-X86-NEXT:    movl %ebx, (%esp)
; GISEL-X86-NEXT:    calll cosf
; GISEL-X86-NEXT:    fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
; GISEL-X86-NEXT:    movl %esi, (%esp)
; GISEL-X86-NEXT:    movl %edi, {{[0-9]+}}(%esp)
; GISEL-X86-NEXT:    calll foo
; GISEL-X86-NEXT:    flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
; GISEL-X86-NEXT:    fstps (%esi)
; GISEL-X86-NEXT:    flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
; GISEL-X86-NEXT:    fstps (%edi)
; GISEL-X86-NEXT:    addl $16, %esp
; GISEL-X86-NEXT:    popl %esi
; GISEL-X86-NEXT:    popl %edi
; GISEL-X86-NEXT:    popl %ebx
; GISEL-X86-NEXT:    retl
;
; GISEL-X64-LABEL: can_fold_with_call_in_chain:
; GISEL-X64:       # %bb.0: # %entry
; GISEL-X64-NEXT:    pushq %r14
; GISEL-X64-NEXT:    pushq %rbx
; GISEL-X64-NEXT:    pushq %rax
; GISEL-X64-NEXT:    movss %xmm0, (%rsp) # 4-byte Spill
; GISEL-X64-NEXT:    movq %rdi, %rbx
; GISEL-X64-NEXT:    movq %rsi, %r14
; GISEL-X64-NEXT:    callq sinf
; GISEL-X64-NEXT:    movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
; GISEL-X64-NEXT:    movss (%rsp), %xmm0 # 4-byte Reload
; GISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; GISEL-X64-NEXT:    callq cosf
; GISEL-X64-NEXT:    movss %xmm0, (%rsp) # 4-byte Spill
; GISEL-X64-NEXT:    movq %rbx, %rdi
; GISEL-X64-NEXT:    movq %r14, %rsi
; GISEL-X64-NEXT:    callq foo
; GISEL-X64-NEXT:    movd {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Folded Reload
; GISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; GISEL-X64-NEXT:    movd %xmm0, %eax
; GISEL-X64-NEXT:    movl %eax, (%rbx)
; GISEL-X64-NEXT:    movd (%rsp), %xmm0 # 4-byte Folded Reload
; GISEL-X64-NEXT:    # xmm0 = mem[0],zero,zero,zero
; GISEL-X64-NEXT:    movd %xmm0, %eax
; GISEL-X64-NEXT:    movl %eax, (%r14)
; GISEL-X64-NEXT:    addq $8, %rsp
; GISEL-X64-NEXT:    popq %rbx
; GISEL-X64-NEXT:    popq %r14
; GISEL-X64-NEXT:    retq
entry:
  %sin = tail call float @llvm.sin.f32(float %x)
  %cos = tail call float @llvm.cos.f32(float %x)
  call void @foo(ptr %a, ptr %b)
  store float %sin, ptr %a, align 4
  store float %cos, ptr %b, align 4
  ret void
}