
The i386 psABI specifies that `__float128` has 16-byte alignment and must be passed on the stack; however, LLVM currently stores it in a stack slot that has an offset of 4. Add a custom lowering that corrects this alignment to 16 bytes. The i386 psABI does not specify an `__int128`, but it seems reasonable to keep the same behavior as `__float128`, and there isn't a good way to distinguish whether a set of four registers came from an integer or a float, so `__int128` is changed as well. The main test demonstrating this change is `store_perturbed` in `llvm/test/CodeGen/X86/i128-fp128-abi.ll`.

Referenced ABI: https://gitlab.com/x86-psABIs/i386-ABI/-/wikis/uploads/14c05f1b1e156e0e46b61bfa7c1df1e2/intel386-psABI-2020-08-07.pdf

Fixes: https://github.com/llvm/llvm-project/issues/77401
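A minimal sketch of the situation being fixed (illustrative IR only, not taken from the patch; the function names are hypothetical): when an `fp128` is passed on the stack on i386, its argument slot should get the psABI's 16-byte alignment rather than landing at offset 4.

```llvm
; Hypothetical illustration: under the i386 psABI, the fp128 outgoing-argument
; stack slot for this call must be 16-byte aligned.
declare void @take_f128(fp128)

define void @pass_f128(fp128 %x) nounwind {
  call void @take_f128(fp128 %x)
  ret void
}
```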
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686 -mattr=cmov | FileCheck %s --check-prefixes=X86
; RUN: llc < %s -mtriple=x86_64-linux | FileCheck %s --check-prefixes=X64

;
; trunc(abs(sub(sext(a),sext(b)))) -> abds(a,b)
;
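; (both operands are sign-extended to a wider type before the subtract, so the
; difference cannot wrap and the truncated absolute value is exact)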
define i8 @abd_ext_i8(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_ext_i8:
; X86: # %bb.0:
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i8:
; X64: # %bb.0:
; X64-NEXT: movsbl %sil, %eax
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %aext = sext i8 %a to i64
  %bext = sext i8 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i8
  ret i8 %trunc
}

define i8 @abd_ext_i8_i16(i8 %a, i16 %b) nounwind {
; X86-LABEL: abd_ext_i8_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i8_i16:
; X64: # %bb.0:
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: subl %esi, %edi
; X64-NEXT: movswl %si, %eax
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edi, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %aext = sext i8 %a to i64
  %bext = sext i16 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i8
  ret i8 %trunc
}

define i8 @abd_ext_i8_undef(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_ext_i8_undef:
; X86: # %bb.0:
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i8_undef:
; X64: # %bb.0:
; X64-NEXT: movsbl %sil, %eax
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %aext = sext i8 %a to i64
  %bext = sext i8 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 true)
  %trunc = trunc i64 %abs to i8
  ret i8 %trunc
}

define i16 @abd_ext_i16(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_ext_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i16:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %aext = sext i16 %a to i64
  %bext = sext i16 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i16
  ret i16 %trunc
}

define i16 @abd_ext_i16_i32(i16 %a, i32 %b) nounwind {
; X86-LABEL: abd_ext_i16_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i16_i32:
; X64: # %bb.0:
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %ecx, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %aext = sext i16 %a to i64
  %bext = sext i32 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i16
  ret i16 %trunc
}

define i16 @abd_ext_i16_undef(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_ext_i16_undef:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i16_undef:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %aext = sext i16 %a to i64
  %bext = sext i16 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 true)
  %trunc = trunc i64 %abs to i16
  ret i16 %trunc
}

define i32 @abd_ext_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_ext_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %aext = sext i32 %a to i64
  %bext = sext i32 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i32
  ret i32 %trunc
}

define i32 @abd_ext_i32_i16(i32 %a, i16 %b) nounwind {
; X86-LABEL: abd_ext_i32_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i32_i16:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movl %edi, %ecx
; X64-NEXT: subl %eax, %ecx
; X64-NEXT: subl %edi, %eax
; X64-NEXT: cmovll %ecx, %eax
; X64-NEXT: retq
  %aext = sext i32 %a to i64
  %bext = sext i16 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  %trunc = trunc i64 %abs to i32
  ret i32 %trunc
}

define i32 @abd_ext_i32_undef(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_ext_i32_undef:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i32_undef:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %aext = sext i32 %a to i64
  %bext = sext i32 %b to i64
  %sub = sub i64 %aext, %bext
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 true)
  %trunc = trunc i64 %abs to i32
  ret i32 %trunc
}

define i64 @abd_ext_i64(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_ext_i64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: movl %esi, %ebx
; X86-NEXT: sbbl %edx, %ebx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: cmovll %edi, %eax
; X86-NEXT: cmovll %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %aext = sext i64 %a to i128
  %bext = sext i64 %b to i128
  %sub = sub i128 %aext, %bext
  %abs = call i128 @llvm.abs.i128(i128 %sub, i1 false)
  %trunc = trunc i128 %abs to i64
  ret i64 %trunc
}

define i64 @abd_ext_i64_undef(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_ext_i64_undef:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: movl %esi, %ebx
; X86-NEXT: sbbl %edx, %ebx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: cmovll %edi, %eax
; X86-NEXT: cmovll %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: abd_ext_i64_undef:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %aext = sext i64 %a to i128
  %bext = sext i64 %b to i128
  %sub = sub i128 %aext, %bext
  %abs = call i128 @llvm.abs.i128(i128 %sub, i1 true)
  %trunc = trunc i128 %abs to i64
  ret i64 %trunc
}

define i128 @abd_ext_i128(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_ext_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: subl $16, %esp
; X86-NEXT: movl 40(%ebp), %ecx
; X86-NEXT: movl 44(%ebp), %edx
; X86-NEXT: movl 24(%ebp), %eax
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl %esi, %eax
; X86-NEXT: sbbl %edx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl 48(%ebp), %esi
; X86-NEXT: movl 32(%ebp), %edi
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl 52(%ebp), %ebx
; X86-NEXT: movl 36(%ebp), %eax
; X86-NEXT: sbbl %ebx, %eax
; X86-NEXT: subl 24(%ebp), %ecx
; X86-NEXT: sbbl 28(%ebp), %edx
; X86-NEXT: sbbl 32(%ebp), %esi
; X86-NEXT: sbbl 36(%ebp), %ebx
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %ecx # 4-byte Folded Reload
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %edx # 4-byte Folded Reload
; X86-NEXT: cmovll %edi, %esi
; X86-NEXT: cmovll %eax, %ebx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %ebx, 12(%eax)
; X86-NEXT: movl %esi, 8(%eax)
; X86-NEXT: movl %edx, 4(%eax)
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: leal -12(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_ext_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: movq %rsi, %r8
; X64-NEXT: sbbq %rcx, %r8
; X64-NEXT: subq %rdi, %rdx
; X64-NEXT: sbbq %rsi, %rcx
; X64-NEXT: cmovgeq %rdx, %rax
; X64-NEXT: cmovgeq %rcx, %r8
; X64-NEXT: movq %r8, %rdx
; X64-NEXT: retq
  %aext = sext i128 %a to i256
  %bext = sext i128 %b to i256
  %sub = sub i256 %aext, %bext
  %abs = call i256 @llvm.abs.i256(i256 %sub, i1 false)
  %trunc = trunc i256 %abs to i128
  ret i128 %trunc
}

define i128 @abd_ext_i128_undef(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_ext_i128_undef:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: subl $16, %esp
; X86-NEXT: movl 40(%ebp), %ecx
; X86-NEXT: movl 44(%ebp), %edx
; X86-NEXT: movl 24(%ebp), %eax
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl %esi, %eax
; X86-NEXT: sbbl %edx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl 48(%ebp), %esi
; X86-NEXT: movl 32(%ebp), %edi
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl 52(%ebp), %ebx
; X86-NEXT: movl 36(%ebp), %eax
; X86-NEXT: sbbl %ebx, %eax
; X86-NEXT: subl 24(%ebp), %ecx
; X86-NEXT: sbbl 28(%ebp), %edx
; X86-NEXT: sbbl 32(%ebp), %esi
; X86-NEXT: sbbl 36(%ebp), %ebx
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %ecx # 4-byte Folded Reload
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %edx # 4-byte Folded Reload
; X86-NEXT: cmovll %edi, %esi
; X86-NEXT: cmovll %eax, %ebx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %ebx, 12(%eax)
; X86-NEXT: movl %esi, 8(%eax)
; X86-NEXT: movl %edx, 4(%eax)
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: leal -12(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_ext_i128_undef:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: movq %rsi, %r8
; X64-NEXT: sbbq %rcx, %r8
; X64-NEXT: subq %rdi, %rdx
; X64-NEXT: sbbq %rsi, %rcx
; X64-NEXT: cmovgeq %rdx, %rax
; X64-NEXT: cmovgeq %rcx, %r8
; X64-NEXT: movq %r8, %rdx
; X64-NEXT: retq
  %aext = sext i128 %a to i256
  %bext = sext i128 %b to i256
  %sub = sub i256 %aext, %bext
  %abs = call i256 @llvm.abs.i256(i256 %sub, i1 true)
  %trunc = trunc i256 %abs to i128
  ret i128 %trunc
}

;
; sub(smax(a,b),smin(a,b)) -> abds(a,b)
;
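; (the larger operand minus the smaller operand is, by definition, the signed
; absolute difference)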
define i8 @abd_minmax_i8(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_minmax_i8:
; X86: # %bb.0:
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_minmax_i8:
; X64: # %bb.0:
; X64-NEXT: movsbl %sil, %eax
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %min = call i8 @llvm.smin.i8(i8 %a, i8 %b)
  %max = call i8 @llvm.smax.i8(i8 %a, i8 %b)
  %sub = sub i8 %max, %min
  ret i8 %sub
}

define i16 @abd_minmax_i16(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_minmax_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_minmax_i16:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %min = call i16 @llvm.smin.i16(i16 %a, i16 %b)
  %max = call i16 @llvm.smax.i16(i16 %a, i16 %b)
  %sub = sub i16 %max, %min
  ret i16 %sub
}

define i32 @abd_minmax_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_minmax_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_minmax_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %min = call i32 @llvm.smin.i32(i32 %a, i32 %b)
  %max = call i32 @llvm.smax.i32(i32 %a, i32 %b)
  %sub = sub i32 %max, %min
  ret i32 %sub
}

define i64 @abd_minmax_i64(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_minmax_i64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: movl %esi, %ebx
; X86-NEXT: sbbl %edx, %ebx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: cmovll %edi, %eax
; X86-NEXT: cmovll %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: abd_minmax_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %min = call i64 @llvm.smin.i64(i64 %a, i64 %b)
  %max = call i64 @llvm.smax.i64(i64 %a, i64 %b)
  %sub = sub i64 %max, %min
  ret i64 %sub
}

define i128 @abd_minmax_i128(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_minmax_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: subl $16, %esp
; X86-NEXT: movl 40(%ebp), %ecx
; X86-NEXT: movl 44(%ebp), %edx
; X86-NEXT: movl 24(%ebp), %eax
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl %esi, %eax
; X86-NEXT: sbbl %edx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl 48(%ebp), %esi
; X86-NEXT: movl 32(%ebp), %edi
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl 52(%ebp), %ebx
; X86-NEXT: movl 36(%ebp), %eax
; X86-NEXT: sbbl %ebx, %eax
; X86-NEXT: subl 24(%ebp), %ecx
; X86-NEXT: sbbl 28(%ebp), %edx
; X86-NEXT: sbbl 32(%ebp), %esi
; X86-NEXT: sbbl 36(%ebp), %ebx
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %ecx # 4-byte Folded Reload
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %edx # 4-byte Folded Reload
; X86-NEXT: cmovll %edi, %esi
; X86-NEXT: cmovll %eax, %ebx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %ebx, 12(%eax)
; X86-NEXT: movl %esi, 8(%eax)
; X86-NEXT: movl %edx, 4(%eax)
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: leal -12(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_minmax_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: movq %rsi, %r8
; X64-NEXT: sbbq %rcx, %r8
; X64-NEXT: subq %rdi, %rdx
; X64-NEXT: sbbq %rsi, %rcx
; X64-NEXT: cmovgeq %rdx, %rax
; X64-NEXT: cmovgeq %rcx, %r8
; X64-NEXT: movq %r8, %rdx
; X64-NEXT: retq
  %min = call i128 @llvm.smin.i128(i128 %a, i128 %b)
  %max = call i128 @llvm.smax.i128(i128 %a, i128 %b)
  %sub = sub i128 %max, %min
  ret i128 %sub
}

;
; select(icmp(a,b),sub(a,b),sub(b,a)) -> abds(a,b)
;
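; (a signed comparison selects between the two subtraction orders, keeping the
; non-negative difference)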
define i8 @abd_cmp_i8(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_cmp_i8:
; X86: # %bb.0:
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_cmp_i8:
; X64: # %bb.0:
; X64-NEXT: movsbl %sil, %eax
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %cmp = icmp sgt i8 %a, %b
  %ab = sub i8 %a, %b
  %ba = sub i8 %b, %a
  %sel = select i1 %cmp, i8 %ab, i8 %ba
  ret i8 %sel
}

define i16 @abd_cmp_i16(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_cmp_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_cmp_i16:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %cmp = icmp sge i16 %a, %b
  %ab = sub i16 %a, %b
  %ba = sub i16 %b, %a
  %sel = select i1 %cmp, i16 %ab, i16 %ba
  ret i16 %sel
}

define i32 @abd_cmp_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_cmp_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_cmp_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %cmp = icmp slt i32 %a, %b
  %ab = sub i32 %a, %b
  %ba = sub i32 %b, %a
  %sel = select i1 %cmp, i32 %ba, i32 %ab
  ret i32 %sel
}

define i64 @abd_cmp_i64(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_cmp_i64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: movl %esi, %ebx
; X86-NEXT: sbbl %edx, %ebx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: cmovll %edi, %eax
; X86-NEXT: cmovll %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: abd_cmp_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %cmp = icmp sge i64 %a, %b
  %ab = sub i64 %a, %b
  %ba = sub i64 %b, %a
  %sel = select i1 %cmp, i64 %ab, i64 %ba
  ret i64 %sel
}

define i128 @abd_cmp_i128(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_cmp_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: subl $16, %esp
; X86-NEXT: movl 40(%ebp), %ecx
; X86-NEXT: movl 44(%ebp), %edx
; X86-NEXT: movl 24(%ebp), %eax
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl %esi, %eax
; X86-NEXT: sbbl %edx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl 48(%ebp), %esi
; X86-NEXT: movl 32(%ebp), %edi
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl 52(%ebp), %ebx
; X86-NEXT: movl 36(%ebp), %eax
; X86-NEXT: sbbl %ebx, %eax
; X86-NEXT: subl 24(%ebp), %ecx
; X86-NEXT: sbbl 28(%ebp), %edx
; X86-NEXT: sbbl 32(%ebp), %esi
; X86-NEXT: sbbl 36(%ebp), %ebx
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %ecx # 4-byte Folded Reload
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %edx # 4-byte Folded Reload
; X86-NEXT: cmovll %edi, %esi
; X86-NEXT: cmovll %eax, %ebx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %ebx, 12(%eax)
; X86-NEXT: movl %esi, 8(%eax)
; X86-NEXT: movl %edx, 4(%eax)
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: leal -12(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_cmp_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: movq %rsi, %r8
; X64-NEXT: sbbq %rcx, %r8
; X64-NEXT: subq %rdi, %rdx
; X64-NEXT: sbbq %rsi, %rcx
; X64-NEXT: cmovgeq %rdx, %rax
; X64-NEXT: cmovgeq %rcx, %r8
; X64-NEXT: movq %r8, %rdx
; X64-NEXT: retq
  %cmp = icmp sge i128 %a, %b
  %ab = sub i128 %a, %b
  %ba = sub i128 %b, %a
  %sel = select i1 %cmp, i128 %ab, i128 %ba
  ret i128 %sel
}

;
; abs(sub_nsw(x, y)) -> abds(a,b)
;
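; (the nsw flag guarantees the subtraction cannot wrap, so abs of the result
; is the exact signed absolute difference)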
define i8 @abd_subnsw_i8(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_subnsw_i8:
; X86: # %bb.0:
; X86-NEXT: movzbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: subb {{[0-9]+}}(%esp), %al
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: sarb $7, %cl
; X86-NEXT: xorb %cl, %al
; X86-NEXT: subb %cl, %al
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i8:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subb %sil, %al
; X64-NEXT: movl %eax, %ecx
; X64-NEXT: sarb $7, %cl
; X64-NEXT: xorb %cl, %al
; X64-NEXT: subb %cl, %al
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %sub = sub nsw i8 %a, %b
  %abs = call i8 @llvm.abs.i8(i8 %sub, i1 false)
  ret i8 %abs
}

define i8 @abd_subnsw_i8_undef(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_subnsw_i8_undef:
; X86: # %bb.0:
; X86-NEXT: movzbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: subb {{[0-9]+}}(%esp), %al
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: sarb $7, %cl
; X86-NEXT: xorb %cl, %al
; X86-NEXT: subb %cl, %al
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i8_undef:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subb %sil, %al
; X64-NEXT: movl %eax, %ecx
; X64-NEXT: sarb $7, %cl
; X64-NEXT: xorb %cl, %al
; X64-NEXT: subb %cl, %al
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %sub = sub nsw i8 %a, %b
  %abs = call i8 @llvm.abs.i8(i8 %sub, i1 true)
  ret i8 %abs
}

define i16 @abd_subnsw_i16(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_subnsw_i16:
; X86: # %bb.0:
; X86-NEXT: movzwl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: subw {{[0-9]+}}(%esp), %cx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negw %ax
; X86-NEXT: cmovsw %cx, %ax
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i16:
; X64: # %bb.0:
; X64-NEXT: subl %esi, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negw %ax
; X64-NEXT: cmovsw %di, %ax
; X64-NEXT: retq
  %sub = sub nsw i16 %a, %b
  %abs = call i16 @llvm.abs.i16(i16 %sub, i1 false)
  ret i16 %abs
}

define i16 @abd_subnsw_i16_undef(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_subnsw_i16_undef:
; X86: # %bb.0:
; X86-NEXT: movzwl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: subw {{[0-9]+}}(%esp), %cx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negw %ax
; X86-NEXT: cmovsw %cx, %ax
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i16_undef:
; X64: # %bb.0:
; X64-NEXT: subl %esi, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negw %ax
; X64-NEXT: cmovsw %di, %ax
; X64-NEXT: retq
  %sub = sub nsw i16 %a, %b
  %abs = call i16 @llvm.abs.i16(i16 %sub, i1 true)
  ret i16 %abs
}

define i32 @abd_subnsw_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_subnsw_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %sub = sub nsw i32 %a, %b
  %abs = call i32 @llvm.abs.i32(i32 %sub, i1 false)
  ret i32 %abs
}

define i32 @abd_subnsw_i32_undef(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_subnsw_i32_undef:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i32_undef:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %sub = sub nsw i32 %a, %b
  %abs = call i32 @llvm.abs.i32(i32 %sub, i1 true)
  ret i32 %abs
}

define i64 @abd_subnsw_i64(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_subnsw_i64:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: subl {{[0-9]+}}(%esp), %eax
; X86-NEXT: sbbl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl %edx, %ecx
; X86-NEXT: sarl $31, %ecx
; X86-NEXT: xorl %ecx, %edx
; X86-NEXT: xorl %ecx, %eax
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %ecx, %edx
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %sub = sub nsw i64 %a, %b
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 false)
  ret i64 %abs
}

define i64 @abd_subnsw_i64_undef(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_subnsw_i64_undef:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: subl {{[0-9]+}}(%esp), %eax
; X86-NEXT: sbbl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl %edx, %ecx
; X86-NEXT: sarl $31, %ecx
; X86-NEXT: xorl %ecx, %edx
; X86-NEXT: xorl %ecx, %eax
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %ecx, %edx
; X86-NEXT: retl
;
; X64-LABEL: abd_subnsw_i64_undef:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %sub = sub nsw i64 %a, %b
  %abs = call i64 @llvm.abs.i64(i64 %sub, i1 true)
  ret i64 %abs
}

define i128 @abd_subnsw_i128(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_subnsw_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: movl 32(%ebp), %edx
; X86-NEXT: movl 36(%ebp), %ecx
; X86-NEXT: movl 24(%ebp), %edi
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl 40(%ebp), %edi
; X86-NEXT: sbbl 44(%ebp), %esi
; X86-NEXT: sbbl 48(%ebp), %edx
; X86-NEXT: sbbl 52(%ebp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: sarl $31, %eax
; X86-NEXT: xorl %eax, %ecx
; X86-NEXT: xorl %eax, %edx
; X86-NEXT: xorl %eax, %esi
; X86-NEXT: xorl %eax, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: sbbl %eax, %esi
; X86-NEXT: sbbl %eax, %edx
; X86-NEXT: sbbl %eax, %ecx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %edi, (%eax)
; X86-NEXT: movl %esi, 4(%eax)
; X86-NEXT: movl %edx, 8(%eax)
; X86-NEXT: movl %ecx, 12(%eax)
; X86-NEXT: leal -8(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_subnsw_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: sbbq %rcx, %rsi
; X64-NEXT: movq %rsi, %rcx
; X64-NEXT: sarq $63, %rcx
; X64-NEXT: xorq %rcx, %rsi
; X64-NEXT: xorq %rcx, %rax
; X64-NEXT: subq %rcx, %rax
; X64-NEXT: sbbq %rcx, %rsi
; X64-NEXT: movq %rsi, %rdx
; X64-NEXT: retq
  %sub = sub nsw i128 %a, %b
  %abs = call i128 @llvm.abs.i128(i128 %sub, i1 false)
  ret i128 %abs
}

define i128 @abd_subnsw_i128_undef(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_subnsw_i128_undef:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: movl 32(%ebp), %edx
; X86-NEXT: movl 36(%ebp), %ecx
; X86-NEXT: movl 24(%ebp), %edi
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl 40(%ebp), %edi
; X86-NEXT: sbbl 44(%ebp), %esi
; X86-NEXT: sbbl 48(%ebp), %edx
; X86-NEXT: sbbl 52(%ebp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: sarl $31, %eax
; X86-NEXT: xorl %eax, %ecx
; X86-NEXT: xorl %eax, %edx
; X86-NEXT: xorl %eax, %esi
; X86-NEXT: xorl %eax, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: sbbl %eax, %esi
; X86-NEXT: sbbl %eax, %edx
; X86-NEXT: sbbl %eax, %ecx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %edi, (%eax)
; X86-NEXT: movl %esi, 4(%eax)
; X86-NEXT: movl %edx, 8(%eax)
; X86-NEXT: movl %ecx, 12(%eax)
; X86-NEXT: leal -8(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_subnsw_i128_undef:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: sbbq %rcx, %rsi
; X64-NEXT: movq %rsi, %rcx
; X64-NEXT: sarq $63, %rcx
; X64-NEXT: xorq %rcx, %rsi
; X64-NEXT: xorq %rcx, %rax
; X64-NEXT: subq %rcx, %rax
; X64-NEXT: sbbq %rcx, %rsi
; X64-NEXT: movq %rsi, %rdx
; X64-NEXT: retq
  %sub = sub nsw i128 %a, %b
  %abs = call i128 @llvm.abs.i128(i128 %sub, i1 true)
  ret i128 %abs
}

;
; negative tests
;
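; (without nsw the subtraction may wrap, so abs(sub(a,b)) is not an absolute
; difference and must not be folded to abds)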
define i32 @abd_sub_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_sub_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: subl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: cmovsl %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_sub_i32:
; X64: # %bb.0:
; X64-NEXT: subl %esi, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negl %eax
; X64-NEXT: cmovsl %edi, %eax
; X64-NEXT: retq
  %sub = sub i32 %a, %b
  %abs = call i32 @llvm.abs.i32(i32 %sub, i1 false)
  ret i32 %abs
}

;
; sub(select(icmp(a,b),a,b),select(icmp(a,b),b,a)) -> abds(a,b)
;
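; (the selects implement smin/smax on a shared comparison, so subtracting the
; two selected values again yields the absolute difference)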
define i8 @abd_select_i8(i8 %a, i8 %b) nounwind {
; X86-LABEL: abd_select_i8:
; X86: # %bb.0:
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movsbl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_select_i8:
; X64: # %bb.0:
; X64-NEXT: movsbl %sil, %eax
; X64-NEXT: movsbl %dil, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
  %cmp = icmp slt i8 %a, %b
  %ab = select i1 %cmp, i8 %a, i8 %b
  %ba = select i1 %cmp, i8 %b, i8 %a
  %sub = sub i8 %ba, %ab
  ret i8 %sub
}

define i16 @abd_select_i16(i16 %a, i16 %b) nounwind {
; X86-LABEL: abd_select_i16:
; X86: # %bb.0:
; X86-NEXT: movswl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movswl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: # kill: def $ax killed $ax killed $eax
; X86-NEXT: retl
;
; X64-LABEL: abd_select_i16:
; X64: # %bb.0:
; X64-NEXT: movswl %si, %eax
; X64-NEXT: movswl %di, %ecx
; X64-NEXT: movl %ecx, %edx
; X64-NEXT: subl %eax, %edx
; X64-NEXT: subl %ecx, %eax
; X64-NEXT: cmovll %edx, %eax
; X64-NEXT: # kill: def $ax killed $ax killed $eax
; X64-NEXT: retq
  %cmp = icmp sle i16 %a, %b
  %ab = select i1 %cmp, i16 %a, i16 %b
  %ba = select i1 %cmp, i16 %b, i16 %a
  %sub = sub i16 %ba, %ab
  ret i16 %sub
}

define i32 @abd_select_i32(i32 %a, i32 %b) nounwind {
; X86-LABEL: abd_select_i32:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: subl %eax, %edx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: cmovll %edx, %eax
; X86-NEXT: retl
;
; X64-LABEL: abd_select_i32:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: subl %esi, %eax
; X64-NEXT: subl %edi, %esi
; X64-NEXT: cmovgel %esi, %eax
; X64-NEXT: retq
  %cmp = icmp sgt i32 %a, %b
  %ab = select i1 %cmp, i32 %a, i32 %b
  %ba = select i1 %cmp, i32 %b, i32 %a
  %sub = sub i32 %ab, %ba
  ret i32 %sub
}

define i64 @abd_select_i64(i64 %a, i64 %b) nounwind {
; X86-LABEL: abd_select_i64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl %eax, %edi
; X86-NEXT: movl %esi, %ebx
; X86-NEXT: sbbl %edx, %ebx
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: cmovll %edi, %eax
; X86-NEXT: cmovll %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: abd_select_i64:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rsi, %rax
; X64-NEXT: subq %rdi, %rsi
; X64-NEXT: cmovgeq %rsi, %rax
; X64-NEXT: retq
  %cmp = icmp sge i64 %a, %b
  %ab = select i1 %cmp, i64 %a, i64 %b
  %ba = select i1 %cmp, i64 %b, i64 %a
  %sub = sub i64 %ab, %ba
  ret i64 %sub
}

define i128 @abd_select_i128(i128 %a, i128 %b) nounwind {
; X86-LABEL: abd_select_i128:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: movl %esp, %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: andl $-16, %esp
; X86-NEXT: subl $16, %esp
; X86-NEXT: movl 40(%ebp), %ecx
; X86-NEXT: movl 44(%ebp), %edx
; X86-NEXT: movl 24(%ebp), %eax
; X86-NEXT: movl 28(%ebp), %esi
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl %esi, %eax
; X86-NEXT: sbbl %edx, %eax
; X86-NEXT: movl %eax, {{[-0-9]+}}(%e{{[sb]}}p) # 4-byte Spill
; X86-NEXT: movl 48(%ebp), %esi
; X86-NEXT: movl 32(%ebp), %edi
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl 52(%ebp), %ebx
; X86-NEXT: movl 36(%ebp), %eax
; X86-NEXT: sbbl %ebx, %eax
; X86-NEXT: subl 24(%ebp), %ecx
; X86-NEXT: sbbl 28(%ebp), %edx
; X86-NEXT: sbbl 32(%ebp), %esi
; X86-NEXT: sbbl 36(%ebp), %ebx
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %ecx # 4-byte Folded Reload
; X86-NEXT: cmovll {{[-0-9]+}}(%e{{[sb]}}p), %edx # 4-byte Folded Reload
; X86-NEXT: cmovll %edi, %esi
; X86-NEXT: cmovll %eax, %ebx
; X86-NEXT: movl 8(%ebp), %eax
; X86-NEXT: movl %ebx, 12(%eax)
; X86-NEXT: movl %esi, 8(%eax)
; X86-NEXT: movl %edx, 4(%eax)
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: leal -12(%ebp), %esp
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
;
; X64-LABEL: abd_select_i128:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: subq %rdx, %rax
; X64-NEXT: movq %rsi, %r8
; X64-NEXT: sbbq %rcx, %r8
; X64-NEXT: subq %rdi, %rdx
; X64-NEXT: sbbq %rsi, %rcx
; X64-NEXT: cmovgeq %rdx, %rax
; X64-NEXT: cmovgeq %rcx, %r8
; X64-NEXT: movq %r8, %rdx
; X64-NEXT: retq
  %cmp = icmp slt i128 %a, %b
  %ab = select i1 %cmp, i128 %a, i128 %b
  %ba = select i1 %cmp, i128 %b, i128 %a
  %sub = sub i128 %ba, %ab
  ret i128 %sub
}

declare i8 @llvm.abs.i8(i8, i1)
declare i16 @llvm.abs.i16(i16, i1)
declare i32 @llvm.abs.i32(i32, i1)
declare i64 @llvm.abs.i64(i64, i1)
declare i128 @llvm.abs.i128(i128, i1)

declare i8 @llvm.smax.i8(i8, i8)
declare i16 @llvm.smax.i16(i16, i16)
declare i32 @llvm.smax.i32(i32, i32)
declare i64 @llvm.smax.i64(i64, i64)

declare i8 @llvm.smin.i8(i8, i8)
declare i16 @llvm.smin.i16(i16, i16)
declare i32 @llvm.smin.i32(i32, i32)
declare i64 @llvm.smin.i64(i64, i64)