
When the default branch is the last case, we can transform that branch into a concrete branch with an unreachable default branch. ```llvm target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" target triple = "x86_64-unknown-linux-gnu" define i64 @src(i64 %0) { %2 = urem i64 %0, 4 switch i64 %2, label %5 [ i64 1, label %3 i64 2, label %3 i64 3, label %4 ] 3: ; preds = %1, %1 br label %5 4: ; preds = %1 br label %5 5: ; preds = %1, %4, %3 %.0 = phi i64 [ 2, %4 ], [ 1, %3 ], [ 0, %1 ] ret i64 %.0 } define i64 @tgt(i64 %0) { %2 = urem i64 %0, 4 switch i64 %2, label %unreachable [ i64 0, label %5 i64 1, label %3 i64 2, label %3 i64 3, label %4 ] unreachable: ; preds = %1 unreachable 3: ; preds = %1, %1 br label %5 4: ; preds = %1 br label %5 5: ; preds = %1, %4, %3 %.0 = phi i64 [ 2, %4 ], [ 1, %3 ], [ 0, %1 ] ret i64 %.0 } ``` Alive2: https://alive2.llvm.org/ce/z/Y-PGXv After transform to a lookup table, I believe `tgt` is better code. The final instructions are as follows: ```asm src: # @src and edi, 3 lea rax, [rdi - 1] cmp rax, 2 ja .LBB0_1 mov rax, qword ptr [8*rdi + .Lswitch.table.src-8] ret .LBB0_1: xor eax, eax ret tgt: # @tgt and edi, 3 mov rax, qword ptr [8*rdi + .Lswitch.table.tgt] ret .Lswitch.table.src: .quad 1 # 0x1 .quad 1 # 0x1 .quad 2 # 0x2 .Lswitch.table.tgt: .quad 0 # 0x0 .quad 1 # 0x1 .quad 1 # 0x1 .quad 2 # 0x2 ``` Godbolt: https://llvm.godbolt.org/z/borME8znd Closes #73446. (cherry picked from commit 7d81e072712f4e6a150561b5538ccebda289aa13)
62 lines
1.4 KiB
LLVM
62 lines
1.4 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
|
|
; RUN: opt %s -S -passes='simplifycfg<switch-to-lookup>' -simplifycfg-require-and-preserve-domtree=1 -switch-range-to-icmp | FileCheck %s
|
|
|
|
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
|
|
|
|
define i64 @test_1(i64 %0) {
|
|
; CHECK-LABEL: define i64 @test_1(
|
|
; CHECK-SAME: i64 [[TMP0:%.*]]) {
|
|
; CHECK-NEXT: switch.lookup:
|
|
; CHECK-NEXT: [[TMP1:%.*]] = urem i64 [[TMP0]], 4
|
|
; CHECK-NEXT: [[SWITCH_GEP:%.*]] = getelementptr inbounds [4 x i64], ptr @switch.table.test_1, i32 0, i64 [[TMP1]]
|
|
; CHECK-NEXT: [[SWITCH_LOAD:%.*]] = load i64, ptr [[SWITCH_GEP]], align 8
|
|
; CHECK-NEXT: ret i64 [[SWITCH_LOAD]]
|
|
;
|
|
%2 = urem i64 %0, 4
|
|
switch i64 %2, label %5 [
|
|
i64 1, label %3
|
|
i64 2, label %3
|
|
i64 3, label %4
|
|
]
|
|
|
|
3:
|
|
br label %5
|
|
|
|
4:
|
|
br label %5
|
|
|
|
5:
|
|
%.0 = phi i64 [ 2, %4 ], [ 1, %3 ], [ 0, %1 ]
|
|
ret i64 %.0
|
|
}
|
|
|
|
|
|
define i64 @test_2(i64 %0) {
|
|
; CHECK-LABEL: define i64 @test_2(
|
|
; CHECK-SAME: i64 [[TMP0:%.*]]) {
|
|
; CHECK-NEXT: switch.lookup:
|
|
; CHECK-NEXT: [[TMP1:%.*]] = urem i64 [[TMP0]], 4
|
|
; CHECK-NEXT: ret i64 [[TMP1]]
|
|
;
|
|
%2 = urem i64 %0, 4
|
|
switch i64 %2, label %6 [
|
|
i64 1, label %3
|
|
i64 2, label %4
|
|
i64 3, label %5
|
|
]
|
|
|
|
3:
|
|
br label %6
|
|
|
|
4:
|
|
br label %6
|
|
|
|
5:
|
|
br label %6
|
|
|
|
6:
|
|
%.0 = phi i64 [ 0, %1 ], [ 1, %3 ], [ 2, %4 ], [ 3, %5 ]
|
|
ret i64 %.0
|
|
}
|
|
|