summaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/X86/isel-llvm.sincos.ll
diff options
context:
space:
mode:
Diffstat (limited to 'llvm/test/CodeGen/X86/isel-llvm.sincos.ll')
-rw-r--r--llvm/test/CodeGen/X86/isel-llvm.sincos.ll355
1 files changed, 355 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/isel-llvm.sincos.ll b/llvm/test/CodeGen/X86/isel-llvm.sincos.ll
new file mode 100644
index 000000000000..065710f91457
--- /dev/null
+++ b/llvm/test/CodeGen/X86/isel-llvm.sincos.ll
@@ -0,0 +1,355 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=i686-linux-gnu -fast-isel | FileCheck %s --check-prefixes=X86,FASTISEL-X86
+; RUN: llc < %s -mtriple=x86_64-linux-gnu -fast-isel | FileCheck %s --check-prefixes=X64,FASTISEL-X64
+; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=0 -fast-isel=0 | FileCheck %s --check-prefixes=X86,SDAG-X86
+; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=0 -fast-isel=0 | FileCheck %s --check-prefixes=X64,SDAG-X64
+; TODO: The below RUN line will fails GISEL selection and will fallback to DAG selection due to lack of support for loads/stores in i686 mode, support is expected soon enough, for this reason the llvm/test/CodeGen/X86/GlobalISel/llvm.sincos.mir test is added for now because of the lack of support for i686 in GlobalISel.
+; RUN: llc < %s -mtriple=i686-linux-gnu -global-isel=1 -global-isel-abort=2 | FileCheck %s --check-prefixes=GISEL-X86
+; RUN: llc < %s -mtriple=x86_64-linux-gnu -global-isel=1 -global-isel-abort=1 | FileCheck %s --check-prefixes=GISEL-X64
+
+define { float, float } @test_sincos_f32(float %Val) nounwind {
+; X86-LABEL: test_sincos_f32:
+; X86: # %bb.0:
+; X86-NEXT: subl $28, %esp
+; X86-NEXT: flds {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: fstps (%esp)
+; X86-NEXT: calll sincosf
+; X86-NEXT: flds {{[0-9]+}}(%esp)
+; X86-NEXT: flds {{[0-9]+}}(%esp)
+; X86-NEXT: addl $28, %esp
+; X86-NEXT: retl
+;
+; X64-LABEL: test_sincos_f32:
+; X64: # %bb.0:
+; X64-NEXT: pushq %rax
+; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; X64-NEXT: movq %rsp, %rsi
+; X64-NEXT: callq sincosf@PLT
+; X64-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
+; X64-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
+; X64-NEXT: popq %rax
+; X64-NEXT: retq
+;
+; GISEL-X86-LABEL: test_sincos_f32:
+; GISEL-X86: # %bb.0:
+; GISEL-X86-NEXT: subl $28, %esp
+; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %eax
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %ecx
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %edx
+; GISEL-X86-NEXT: movl %eax, (%esp)
+; GISEL-X86-NEXT: movl %ecx, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: movl %edx, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: calll sincosf
+; GISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: fxch %st(1)
+; GISEL-X86-NEXT: addl $28, %esp
+; GISEL-X86-NEXT: retl
+;
+; GISEL-X64-LABEL: test_sincos_f32:
+; GISEL-X64: # %bb.0:
+; GISEL-X64-NEXT: pushq %rax
+; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; GISEL-X64-NEXT: movq %rsp, %rsi
+; GISEL-X64-NEXT: callq sincosf
+; GISEL-X64-NEXT: movl {{[0-9]+}}(%rsp), %eax
+; GISEL-X64-NEXT: movl (%rsp), %ecx
+; GISEL-X64-NEXT: movd %eax, %xmm0
+; GISEL-X64-NEXT: movd %ecx, %xmm1
+; GISEL-X64-NEXT: popq %rax
+; GISEL-X64-NEXT: retq
+ %res = call { float, float } @llvm.sincos.f32(float %Val)
+ ret { float, float } %res
+}
+
+define { double, double } @test_sincos_f64(double %Val) nounwind {
+; X86-LABEL: test_sincos_f64:
+; X86: # %bb.0:
+; X86-NEXT: subl $44, %esp
+; X86-NEXT: fldl {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: fstpl (%esp)
+; X86-NEXT: calll sincos
+; X86-NEXT: fldl {{[0-9]+}}(%esp)
+; X86-NEXT: fldl {{[0-9]+}}(%esp)
+; X86-NEXT: addl $44, %esp
+; X86-NEXT: retl
+;
+; X64-LABEL: test_sincos_f64:
+; X64: # %bb.0:
+; X64-NEXT: subq $24, %rsp
+; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
+; X64-NEXT: callq sincos@PLT
+; X64-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero
+; X64-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
+; X64-NEXT: addq $24, %rsp
+; X64-NEXT: retq
+;
+; GISEL-X86-LABEL: test_sincos_f64:
+; GISEL-X86: # %bb.0:
+; GISEL-X86-NEXT: subl $44, %esp
+; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: fstpl (%esp)
+; GISEL-X86-NEXT: calll sincos
+; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: fldl {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: addl $44, %esp
+; GISEL-X86-NEXT: retl
+;
+; GISEL-X64-LABEL: test_sincos_f64:
+; GISEL-X64: # %bb.0:
+; GISEL-X64-NEXT: subq $24, %rsp
+; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
+; GISEL-X64-NEXT: callq sincos
+; GISEL-X64-NEXT: movq {{[0-9]+}}(%rsp), %rax
+; GISEL-X64-NEXT: movq {{[0-9]+}}(%rsp), %rcx
+; GISEL-X64-NEXT: movq %rax, %xmm0
+; GISEL-X64-NEXT: movq %rcx, %xmm1
+; GISEL-X64-NEXT: addq $24, %rsp
+; GISEL-X64-NEXT: retq
+ %res = call { double, double } @llvm.sincos.f64(double %Val)
+ ret { double, double } %res
+}
+
+define { x86_fp80, x86_fp80 } @test_sincos_f80(x86_fp80 %Val) nounwind {
+; X86-LABEL: test_sincos_f80:
+; X86: # %bb.0:
+; X86-NEXT: subl $44, %esp
+; X86-NEXT: fldt {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; X86-NEXT: fstpt (%esp)
+; X86-NEXT: calll sincosl
+; X86-NEXT: fldt {{[0-9]+}}(%esp)
+; X86-NEXT: fldt {{[0-9]+}}(%esp)
+; X86-NEXT: addl $44, %esp
+; X86-NEXT: retl
+;
+; X64-LABEL: test_sincos_f80:
+; X64: # %bb.0:
+; X64-NEXT: subq $56, %rsp
+; X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; X64-NEXT: fstpt (%rsp)
+; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
+; X64-NEXT: callq sincosl@PLT
+; X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; X64-NEXT: addq $56, %rsp
+; X64-NEXT: retq
+;
+; GISEL-X86-LABEL: test_sincos_f80:
+; GISEL-X86: # %bb.0:
+; GISEL-X86-NEXT: subl $60, %esp
+; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; GISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %ecx
+; GISEL-X86-NEXT: fstpt (%esp)
+; GISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: movl %ecx, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: calll sincosl
+; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: fldt {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: fxch %st(1)
+; GISEL-X86-NEXT: addl $60, %esp
+; GISEL-X86-NEXT: retl
+;
+; GISEL-X64-LABEL: test_sincos_f80:
+; GISEL-X64: # %bb.0:
+; GISEL-X64-NEXT: subq $56, %rsp
+; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rdi
+; GISEL-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
+; GISEL-X64-NEXT: fstpt (%rsp)
+; GISEL-X64-NEXT: callq sincosl
+; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; GISEL-X64-NEXT: fldt {{[0-9]+}}(%rsp)
+; GISEL-X64-NEXT: fxch %st(1)
+; GISEL-X64-NEXT: addq $56, %rsp
+; GISEL-X64-NEXT: retq
+ %res = call { x86_fp80, x86_fp80 } @llvm.sincos.f80(x86_fp80 %Val)
+ ret { x86_fp80, x86_fp80 } %res
+}
+
+declare void @foo(ptr, ptr)
+
+define void @can_fold_with_call_in_chain(float %x, ptr noalias %a, ptr noalias %b) nounwind {
+; FASTISEL-X86-LABEL: can_fold_with_call_in_chain:
+; FASTISEL-X86: # %bb.0: # %entry
+; FASTISEL-X86-NEXT: pushl %edi
+; FASTISEL-X86-NEXT: pushl %esi
+; FASTISEL-X86-NEXT: subl $20, %esp
+; FASTISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
+; FASTISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
+; FASTISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
+; FASTISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
+; FASTISEL-X86-NEXT: movl %esi, {{[0-9]+}}(%esp)
+; FASTISEL-X86-NEXT: movl %edi, (%esp)
+; FASTISEL-X86-NEXT: calll foo@PLT
+; FASTISEL-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; FASTISEL-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; FASTISEL-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
+; FASTISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
+; FASTISEL-X86-NEXT: fstps (%esp)
+; FASTISEL-X86-NEXT: calll sincosf
+; FASTISEL-X86-NEXT: flds {{[0-9]+}}(%esp)
+; FASTISEL-X86-NEXT: fstps (%esi)
+; FASTISEL-X86-NEXT: addl $20, %esp
+; FASTISEL-X86-NEXT: popl %esi
+; FASTISEL-X86-NEXT: popl %edi
+; FASTISEL-X86-NEXT: retl
+;
+; FASTISEL-X64-LABEL: can_fold_with_call_in_chain:
+; FASTISEL-X64: # %bb.0: # %entry
+; FASTISEL-X64-NEXT: pushq %r14
+; FASTISEL-X64-NEXT: pushq %rbx
+; FASTISEL-X64-NEXT: pushq %rax
+; FASTISEL-X64-NEXT: movq %rsi, %rbx
+; FASTISEL-X64-NEXT: movq %rdi, %r14
+; FASTISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
+; FASTISEL-X64-NEXT: callq sinf@PLT
+; FASTISEL-X64-NEXT: movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
+; FASTISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
+; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; FASTISEL-X64-NEXT: callq cosf@PLT
+; FASTISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
+; FASTISEL-X64-NEXT: movq %r14, %rdi
+; FASTISEL-X64-NEXT: movq %rbx, %rsi
+; FASTISEL-X64-NEXT: callq foo@PLT
+; FASTISEL-X64-NEXT: movss {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Reload
+; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; FASTISEL-X64-NEXT: movss %xmm0, (%r14)
+; FASTISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
+; FASTISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; FASTISEL-X64-NEXT: movss %xmm0, (%rbx)
+; FASTISEL-X64-NEXT: addq $8, %rsp
+; FASTISEL-X64-NEXT: popq %rbx
+; FASTISEL-X64-NEXT: popq %r14
+; FASTISEL-X64-NEXT: retq
+;
+; SDAG-X86-LABEL: can_fold_with_call_in_chain:
+; SDAG-X86: # %bb.0: # %entry
+; SDAG-X86-NEXT: pushl %edi
+; SDAG-X86-NEXT: pushl %esi
+; SDAG-X86-NEXT: subl $20, %esp
+; SDAG-X86-NEXT: flds {{[0-9]+}}(%esp)
+; SDAG-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
+; SDAG-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
+; SDAG-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
+; SDAG-X86-NEXT: movl %esi, {{[0-9]+}}(%esp)
+; SDAG-X86-NEXT: movl %edi, (%esp)
+; SDAG-X86-NEXT: calll foo@PLT
+; SDAG-X86-NEXT: leal {{[0-9]+}}(%esp), %eax
+; SDAG-X86-NEXT: movl %eax, {{[0-9]+}}(%esp)
+; SDAG-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
+; SDAG-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
+; SDAG-X86-NEXT: fstps (%esp)
+; SDAG-X86-NEXT: calll sincosf
+; SDAG-X86-NEXT: flds {{[0-9]+}}(%esp)
+; SDAG-X86-NEXT: fstps (%esi)
+; SDAG-X86-NEXT: addl $20, %esp
+; SDAG-X86-NEXT: popl %esi
+; SDAG-X86-NEXT: popl %edi
+; SDAG-X86-NEXT: retl
+;
+; SDAG-X64-LABEL: can_fold_with_call_in_chain:
+; SDAG-X64: # %bb.0: # %entry
+; SDAG-X64-NEXT: pushq %r14
+; SDAG-X64-NEXT: pushq %rbx
+; SDAG-X64-NEXT: pushq %rax
+; SDAG-X64-NEXT: movq %rsi, %rbx
+; SDAG-X64-NEXT: movq %rdi, %r14
+; SDAG-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
+; SDAG-X64-NEXT: callq foo@PLT
+; SDAG-X64-NEXT: leaq {{[0-9]+}}(%rsp), %rsi
+; SDAG-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
+; SDAG-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; SDAG-X64-NEXT: movq %r14, %rdi
+; SDAG-X64-NEXT: callq sincosf@PLT
+; SDAG-X64-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
+; SDAG-X64-NEXT: movss %xmm0, (%rbx)
+; SDAG-X64-NEXT: addq $8, %rsp
+; SDAG-X64-NEXT: popq %rbx
+; SDAG-X64-NEXT: popq %r14
+; SDAG-X64-NEXT: retq
+;
+; GISEL-X86-LABEL: can_fold_with_call_in_chain:
+; GISEL-X86: # %bb.0: # %entry
+; GISEL-X86-NEXT: pushl %ebx
+; GISEL-X86-NEXT: pushl %edi
+; GISEL-X86-NEXT: pushl %esi
+; GISEL-X86-NEXT: subl $16, %esp
+; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
+; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %esi
+; GISEL-X86-NEXT: movl {{[0-9]+}}(%esp), %edi
+; GISEL-X86-NEXT: movl %ebx, (%esp)
+; GISEL-X86-NEXT: calll sinf
+; GISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
+; GISEL-X86-NEXT: movl %ebx, (%esp)
+; GISEL-X86-NEXT: calll cosf
+; GISEL-X86-NEXT: fstps {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Spill
+; GISEL-X86-NEXT: movl %esi, (%esp)
+; GISEL-X86-NEXT: movl %edi, {{[0-9]+}}(%esp)
+; GISEL-X86-NEXT: calll foo
+; GISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
+; GISEL-X86-NEXT: fstps (%esi)
+; GISEL-X86-NEXT: flds {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Folded Reload
+; GISEL-X86-NEXT: fstps (%edi)
+; GISEL-X86-NEXT: addl $16, %esp
+; GISEL-X86-NEXT: popl %esi
+; GISEL-X86-NEXT: popl %edi
+; GISEL-X86-NEXT: popl %ebx
+; GISEL-X86-NEXT: retl
+;
+; GISEL-X64-LABEL: can_fold_with_call_in_chain:
+; GISEL-X64: # %bb.0: # %entry
+; GISEL-X64-NEXT: pushq %r14
+; GISEL-X64-NEXT: pushq %rbx
+; GISEL-X64-NEXT: pushq %rax
+; GISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
+; GISEL-X64-NEXT: movq %rdi, %rbx
+; GISEL-X64-NEXT: movq %rsi, %r14
+; GISEL-X64-NEXT: callq sinf
+; GISEL-X64-NEXT: movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
+; GISEL-X64-NEXT: movss (%rsp), %xmm0 # 4-byte Reload
+; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; GISEL-X64-NEXT: callq cosf
+; GISEL-X64-NEXT: movss %xmm0, (%rsp) # 4-byte Spill
+; GISEL-X64-NEXT: movq %rbx, %rdi
+; GISEL-X64-NEXT: movq %r14, %rsi
+; GISEL-X64-NEXT: callq foo
+; GISEL-X64-NEXT: movd {{[-0-9]+}}(%r{{[sb]}}p), %xmm0 # 4-byte Folded Reload
+; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; GISEL-X64-NEXT: movd %xmm0, %eax
+; GISEL-X64-NEXT: movl %eax, (%rbx)
+; GISEL-X64-NEXT: movd (%rsp), %xmm0 # 4-byte Folded Reload
+; GISEL-X64-NEXT: # xmm0 = mem[0],zero,zero,zero
+; GISEL-X64-NEXT: movd %xmm0, %eax
+; GISEL-X64-NEXT: movl %eax, (%r14)
+; GISEL-X64-NEXT: addq $8, %rsp
+; GISEL-X64-NEXT: popq %rbx
+; GISEL-X64-NEXT: popq %r14
+; GISEL-X64-NEXT: retq
+entry:
+ %sin = tail call float @llvm.sin.f32(float %x)
+ %cos = tail call float @llvm.cos.f32(float %x)
+ call void @foo(ptr %a, ptr %b)
+ store float %sin, ptr %a, align 4
+ store float %cos, ptr %b, align 4
+ ret void
+}