The first attempt missed changing test files for tools (update_llc_test_checks.py). Original commit message: This implements the main suggested change from issue #56498. Using the shorter (non-extending) instruction with only -Oz ("minsize") rather than -Os ("optsize") is left as a possible follow-up. As noted in the bug report, the zero-extending load may have shorter latency/better throughput across a wide range of x86 micro-arches, and it avoids a potential false dependency. The cost is an extra instruction byte. This could cause perf ups and downs from secondary effects, but I don't think it is possible to account for those in advance, and that will likely also depend on exact micro-arch. This does bring LLVM x86 codegen more in line with existing gcc codegen, so if problems are exposed they are more likely to occur for both compilers. Differential Revision: https://reviews.llvm.org/D129775
59 lines
1.3 KiB
LLVM
59 lines
1.3 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=x86_64-apple-darwin | FileCheck %s
|
|
|
|
define zeroext i1 @f1(ptr %x) {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK: ## %bb.0: ## %entry
|
|
; CHECK-NEXT: movzbl (%rdi), %eax
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
%0 = load i8, ptr %x, align 1, !range !0
|
|
%tobool = trunc i8 %0 to i1
|
|
ret i1 %tobool
|
|
}
|
|
|
|
define zeroext i1 @f2(ptr %x) {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: ## %bb.0: ## %entry
|
|
; CHECK-NEXT: movzbl (%rdi), %eax
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
%0 = load i8, ptr %x, align 1, !range !0
|
|
%tobool = icmp ne i8 %0, 0
|
|
ret i1 %tobool
|
|
}
|
|
|
|
!0 = !{i8 0, i8 2}
|
|
|
|
|
|
; check that we don't build a "trunc" from i1 to i1, which would assert.
|
|
define zeroext i1 @f3(i1 %x) {
|
|
; CHECK-LABEL: f3:
|
|
; CHECK: ## %bb.0: ## %entry
|
|
; CHECK-NEXT: movl %edi, %eax
|
|
; CHECK-NEXT: andb $1, %al
|
|
; CHECK-NEXT: ## kill: def $al killed $al killed $eax
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
%tobool = icmp ne i1 %x, 0
|
|
ret i1 %tobool
|
|
}
|
|
|
|
; check that we don't build a trunc when other bits are needed
|
|
define zeroext i1 @f4(i32 %x) {
|
|
; CHECK-LABEL: f4:
|
|
; CHECK: ## %bb.0: ## %entry
|
|
; CHECK-NEXT: movzwl %di, %eax
|
|
; CHECK-NEXT: shrl $15, %eax
|
|
; CHECK-NEXT: ## kill: def $al killed $al killed $eax
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
%y = and i32 %x, 32768
|
|
%z = icmp ne i32 %y, 0
|
|
ret i1 %z
|
|
}
|