
The i386 psABI specifies that `__float128` has 16-byte alignment and must be passed on the stack; however, LLVM currently stores it in a stack slot that has an offset of 4. Add a custom lowering that corrects this alignment to 16 bytes. The i386 psABI does not specify an `__int128`, but it seems reasonable to keep the same behavior as `__float128`, so this is changed as well; there also isn't a good way to distinguish whether a set of four registers came from an integer or a float. The main test demonstrating this change is `store_perturbed` in `llvm/test/CodeGen/X86/i128-fp128-abi.ll`. Referenced ABI: https://gitlab.com/x86-psABIs/i386-ABI/-/wikis/uploads/14c05f1b1e156e0e46b61bfa7c1df1e2/intel386-psABI-2020-08-07.pdf Fixes: https://github.com/llvm/llvm-project/issues/77401
173 lines
4.9 KiB
LLVM
173 lines
4.9 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-unknown | FileCheck %s --check-prefix=X86 --check-prefix=X86-NO-CMOV
; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=+cmov | FileCheck %s --check-prefix=X86 --check-prefix=X86-CMOV
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s --check-prefix=X64

;; Integer absolute value, should produce something at least as good as:
;;     movl %edi, %eax
;;     negl %eax
;;     cmovll %edi, %eax
;;     ret
; rdar://10695237
; Absolute value of an i8, written as select(%a > -1, %a, 0 - %a).
; Both the i686 runs and the x86-64 run expect the branchless sign-mask form:
; sarb $7 builds the mask, then xorb/subb apply it to the value.
define i8 @test_i8(i8 %a) nounwind {
; X86-LABEL: test_i8:
; X86: # %bb.0:
; X86-NEXT: movzbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: sarb $7, %cl
; X86-NEXT: xorb %cl, %al
; X86-NEXT: subb %cl, %al
; X86-NEXT: retl
;
; X64-LABEL: test_i8:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: movl %eax, %ecx
; X64-NEXT: sarb $7, %cl
; X64-NEXT: xorb %cl, %al
; X64-NEXT: subb %cl, %al
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %tmp1neg = sub i8 0, %a
  %b = icmp sgt i8 %a, -1
  %abs = select i1 %b, i8 %a, i8 %tmp1neg
  ret i8 %abs
}

; Absolute value of an i16, written as select(%a > -1, %a, 0 - %a).
; The i686 run without cmov expects the sign-mask form (movswl, sarl $15,
; xorl, subl). The i686 run with cmov and the x86-64 run expect negw followed
; by cmovsw.
define i16 @test_i16(i16 %a) nounwind {
; X86-NO-CMOV-LABEL: test_i16:
; X86-NO-CMOV: # %bb.0:
; X86-NO-CMOV-NEXT: movzwl {{[0-9]+}}(%esp), %eax
; X86-NO-CMOV-NEXT: movswl %ax, %ecx
; X86-NO-CMOV-NEXT: sarl $15, %ecx
; X86-NO-CMOV-NEXT: xorl %ecx, %eax
; X86-NO-CMOV-NEXT: subl %ecx, %eax
; X86-NO-CMOV-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NO-CMOV-NEXT: retl
;
; X86-CMOV-LABEL: test_i16:
; X86-CMOV: # %bb.0:
; X86-CMOV-NEXT: movzwl {{[0-9]+}}(%esp), %ecx
; X86-CMOV-NEXT: movl %ecx, %eax
; X86-CMOV-NEXT: negw %ax
; X86-CMOV-NEXT: cmovsw %cx, %ax
; X86-CMOV-NEXT: retl
;
; X64-LABEL: test_i16:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negw %ax
; X64-NEXT: cmovsw %di, %ax
; X64-NEXT: retq
  %tmp1neg = sub i16 0, %a
  %b = icmp sgt i16 %a, -1
  %abs = select i1 %b, i16 %a, i16 %tmp1neg
  ret i16 %abs
}

; Absolute value of an i32, written as select(%a > -1, %a, 0 - %a).
; The i686 run without cmov expects the sign-mask form (sarl $31, xorl, subl).
; The i686 run with cmov and the x86-64 run expect negl followed by cmovsl.
define i32 @test_i32(i32 %a) nounwind {
; X86-NO-CMOV-LABEL: test_i32:
; X86-NO-CMOV: # %bb.0:
; X86-NO-CMOV-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NO-CMOV-NEXT: movl %eax, %ecx
; X86-NO-CMOV-NEXT: sarl $31, %ecx
; X86-NO-CMOV-NEXT: xorl %ecx, %eax
; X86-NO-CMOV-NEXT: subl %ecx, %eax
; X86-NO-CMOV-NEXT: retl
;
; X86-CMOV-LABEL: test_i32:
; X86-CMOV: # %bb.0:
; X86-CMOV-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-CMOV-NEXT: movl %ecx, %eax
; X86-CMOV-NEXT: negl %eax
; X86-CMOV-NEXT: cmovsl %ecx, %eax
; X86-CMOV-NEXT: retl
;
; X64-LABEL: test_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negl %eax
; X64-NEXT: cmovsl %edi, %eax
; X64-NEXT: retq
  %tmp1neg = sub i32 0, %a
  %b = icmp sgt i32 %a, -1
  %abs = select i1 %b, i32 %a, i32 %tmp1neg
  ret i32 %abs
}

; Absolute value of an i64, written as select(%a > -1, %a, 0 - %a).
; Both i686 runs share one expectation: a mask from sarl $31 on the high half,
; xorl on both halves, then a subl/sbbl pair. The x86-64 run expects negq
; followed by cmovsq.
define i64 @test_i64(i64 %a) nounwind {
; X86-LABEL: test_i64:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl %edx, %ecx
; X86-NEXT: sarl $31, %ecx
; X86-NEXT: xorl %ecx, %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl %ecx, %eax
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %ecx, %edx
; X86-NEXT: retl
;
; X64-LABEL: test_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: negq %rax
; X64-NEXT: cmovsq %rdi, %rax
; X64-NEXT: retq
  %tmp1neg = sub i64 0, %a
  %b = icmp sgt i64 %a, -1
  %abs = select i1 %b, i64 %a, i64 %tmp1neg
  ret i64 %abs
}

; Absolute value of an i128, written as select(%a > -1, %a, 0 - %a).
; Both i686 runs share one expectation: the frame is set up with %ebp and
; %esp is masked with $-16, the four 32-bit pieces of %a are read from
; 24(%ebp)..36(%ebp), and the result is stored through the pointer loaded
; from 8(%ebp) before retl $4.
; NOTE(review): the 24(%ebp) start offset presumably reflects a 16-byte
; aligned i128 stack argument; confirm against the i386 calling convention.
; The x86-64 run expects a mask from sarq $63, xorq on both halves, then a
; subq/sbbq pair.
define i128 @test_i128(i128 %a) nounwind {
; X86-LABEL: test_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: movl 36(%ebp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: sarl $31, %eax
; X86-NEXT: xorl %eax, %ecx
; X86-NEXT: movl 32(%ebp), %edx
; X86-NEXT: xorl %eax, %edx
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: xorl %eax, %esi
; X86-NEXT: movl 24(%ebp), %edi
; X86-NEXT: xorl %eax, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: sbbl %eax, %esi
; X86-NEXT: sbbl %eax, %edx
; X86-NEXT: sbbl %eax, %ecx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %edi, (%eax)
; X86-NEXT: movl %esi, 4(%eax)
; X86-NEXT: movl %edx, 8(%eax)
; X86-NEXT: movl %ecx, 12(%eax)
; X86-NEXT: leal -8(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: test_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rsi, %rdx
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: movq %rsi, %rcx
; X64-NEXT: sarq $63, %rcx
; X64-NEXT: xorq %rcx, %rdx
; X64-NEXT: xorq %rcx, %rax
; X64-NEXT: subq %rcx, %rax
; X64-NEXT: sbbq %rcx, %rdx
; X64-NEXT: retq
  %tmp1neg = sub i128 0, %a
  %b = icmp sgt i128 %a, -1
  %abs = select i1 %b, i128 %a, i128 %tmp1neg
  ret i128 %abs
}