
; This covers multiple interactions reduced from larger workloads:
; 1) Rematerializing "addi s0, x0, <imm>" to avoid the need to spill a CSR,
;    with the common user being a branch (i.e. branch-on-immediate idioms).
; 2) Rematerializing "addi s0, a0, <imm>" to avoid the need to spill a CSR,
;    with the common user being a vector load or store (i.e. because we
;    don't have (reg+imm) addressing on vector).
; 3) Independent of the previous, we could still shrink wrap these by
;    locally using a non-CSR, and deferring the move into the CSR into the
;    non-shrink-wrapped path.
; 4) Weirdly, MachineCSE produces a different result when an edge is
;    manually split.  This edge split should be irrelevant to the CSE.
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple riscv32 -enable-shrink-wrap=false < %s \
; RUN:   | FileCheck %s -check-prefix=RV32I-SW-NO
; RUN: llc -mtriple riscv32 < %s \
; RUN:   | FileCheck %s -check-prefix=RV32I-SW
; RUN: llc -mtriple riscv32 -mattr=+save-restore < %s \
; RUN:   | FileCheck %s -check-prefix=RV32I-SW-SR
; RUN: llc -mtriple riscv64 < %s \
; RUN:   | FileCheck %s -check-prefix=RV64I-SW
declare void @abort()
; With shrink wrapping, the frame setup/teardown is sunk into %if.then, so
; the early-exit path through %if.end needs no prologue or epilogue at all.
define void @eliminate_restore(i32 %n) nounwind {
; RV32I-SW-NO-LABEL: eliminate_restore:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: li a1, 32
; RV32I-SW-NO-NEXT: bgeu a1, a0, .LBB0_2
; RV32I-SW-NO-NEXT: # %bb.1: # %if.end
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: ret
; RV32I-SW-NO-NEXT: .LBB0_2: # %if.then
; RV32I-SW-NO-NEXT: call abort
;
; RV32I-SW-LABEL: eliminate_restore:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: li a1, 32
; RV32I-SW-NEXT: bgeu a1, a0, .LBB0_2
; RV32I-SW-NEXT: # %bb.1: # %if.end
; RV32I-SW-NEXT: ret
; RV32I-SW-NEXT: .LBB0_2: # %if.then
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: call abort
;
; RV32I-SW-SR-LABEL: eliminate_restore:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: li a1, 32
; RV32I-SW-SR-NEXT: bgeu a1, a0, .LBB0_2
; RV32I-SW-SR-NEXT: # %bb.1: # %if.end
; RV32I-SW-SR-NEXT: ret
; RV32I-SW-SR-NEXT: .LBB0_2: # %if.then
; RV32I-SW-SR-NEXT: call t0, __riscv_save_0
; RV32I-SW-SR-NEXT: call abort
;
; RV64I-SW-LABEL: eliminate_restore:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: sext.w a0, a0
; RV64I-SW-NEXT: li a1, 32
; RV64I-SW-NEXT: bgeu a1, a0, .LBB0_2
; RV64I-SW-NEXT: # %bb.1: # %if.end
; RV64I-SW-NEXT: ret
; RV64I-SW-NEXT: .LBB0_2: # %if.then
; RV64I-SW-NEXT: addi sp, sp, -16
; RV64I-SW-NEXT: sd ra, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: call abort
  %cmp = icmp ule i32 %n, 32
  br i1 %cmp, label %if.then, label %if.end

if.then:
  call void @abort()
  unreachable

if.end:
  ret void
}
declare void @notdead(ptr)
; A dynamic alloca forces a frame pointer (s0); with shrink wrapping the
; whole frame setup (including the fp) is sunk into %if.then.
define void @conditional_alloca(i32 %n) nounwind {
; RV32I-SW-NO-LABEL: conditional_alloca:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: addi s0, sp, 16
; RV32I-SW-NO-NEXT: li a1, 32
; RV32I-SW-NO-NEXT: bltu a1, a0, .LBB1_2
; RV32I-SW-NO-NEXT: # %bb.1: # %if.then
; RV32I-SW-NO-NEXT: addi a0, a0, 15
; RV32I-SW-NO-NEXT: andi a0, a0, -16
; RV32I-SW-NO-NEXT: sub a0, sp, a0
; RV32I-SW-NO-NEXT: mv sp, a0
; RV32I-SW-NO-NEXT: call notdead
; RV32I-SW-NO-NEXT: .LBB1_2: # %if.end
; RV32I-SW-NO-NEXT: addi sp, s0, -16
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: ret
;
; RV32I-SW-LABEL: conditional_alloca:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: li a1, 32
; RV32I-SW-NEXT: bltu a1, a0, .LBB1_2
; RV32I-SW-NEXT: # %bb.1: # %if.then
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: addi s0, sp, 16
; RV32I-SW-NEXT: addi a0, a0, 15
; RV32I-SW-NEXT: andi a0, a0, -16
; RV32I-SW-NEXT: sub a0, sp, a0
; RV32I-SW-NEXT: mv sp, a0
; RV32I-SW-NEXT: call notdead
; RV32I-SW-NEXT: addi sp, s0, -16
; RV32I-SW-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: addi sp, sp, 16
; RV32I-SW-NEXT: .LBB1_2: # %if.end
; RV32I-SW-NEXT: ret
;
; RV32I-SW-SR-LABEL: conditional_alloca:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: li a1, 32
; RV32I-SW-SR-NEXT: bltu a1, a0, .LBB1_2
; RV32I-SW-SR-NEXT: # %bb.1: # %if.then
; RV32I-SW-SR-NEXT: call t0, __riscv_save_1
; RV32I-SW-SR-NEXT: addi s0, sp, 16
; RV32I-SW-SR-NEXT: addi a0, a0, 15
; RV32I-SW-SR-NEXT: andi a0, a0, -16
; RV32I-SW-SR-NEXT: sub a0, sp, a0
; RV32I-SW-SR-NEXT: mv sp, a0
; RV32I-SW-SR-NEXT: call notdead
; RV32I-SW-SR-NEXT: addi sp, s0, -16
; RV32I-SW-SR-NEXT: tail __riscv_restore_1
; RV32I-SW-SR-NEXT: .LBB1_2: # %if.end
; RV32I-SW-SR-NEXT: ret
;
; RV64I-SW-LABEL: conditional_alloca:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: sext.w a1, a0
; RV64I-SW-NEXT: li a2, 32
; RV64I-SW-NEXT: bltu a2, a1, .LBB1_2
; RV64I-SW-NEXT: # %bb.1: # %if.then
; RV64I-SW-NEXT: addi sp, sp, -16
; RV64I-SW-NEXT: sd ra, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s0, 0(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: addi s0, sp, 16
; RV64I-SW-NEXT: slli a0, a0, 32
; RV64I-SW-NEXT: srli a0, a0, 32
; RV64I-SW-NEXT: addi a0, a0, 15
; RV64I-SW-NEXT: andi a0, a0, -16
; RV64I-SW-NEXT: sub a0, sp, a0
; RV64I-SW-NEXT: mv sp, a0
; RV64I-SW-NEXT: call notdead
; RV64I-SW-NEXT: addi sp, s0, -16
; RV64I-SW-NEXT: ld ra, 8(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s0, 0(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: addi sp, sp, 16
; RV64I-SW-NEXT: .LBB1_2: # %if.end
; RV64I-SW-NEXT: ret
  %cmp = icmp ule i32 %n, 32
  br i1 %cmp, label %if.then, label %if.end

if.then:
  %addr = alloca i8, i32 %n
  call void @notdead(ptr %addr)
  br label %if.end

if.end:
  ret void
}
; FIXME: Rematerialize "li s1, 57" for the second use instead of spilling s1,
; and then shrink wrap the result avoiding frame setup on the %bb.0 -> %exit
; edge.
define void @li_straightline_a(i32 zeroext %a, i32 zeroext %b) {
; RV32I-SW-NO-LABEL: li_straightline_a:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s1, 4(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: .cfi_offset ra, -4
; RV32I-SW-NO-NEXT: .cfi_offset s0, -8
; RV32I-SW-NO-NEXT: .cfi_offset s1, -12
; RV32I-SW-NO-NEXT: li s1, 57
; RV32I-SW-NO-NEXT: beq a0, s1, .LBB2_3
; RV32I-SW-NO-NEXT: # %bb.1: # %do_call
; RV32I-SW-NO-NEXT: mv s0, a1
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: beq s0, s1, .LBB2_3
; RV32I-SW-NO-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: .LBB2_3: # %exit
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s1, 4(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: .cfi_restore ra
; RV32I-SW-NO-NEXT: .cfi_restore s0
; RV32I-SW-NO-NEXT: .cfi_restore s1
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NO-NEXT: ret
;
; RV32I-SW-LABEL: li_straightline_a:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s1, 4(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: .cfi_offset ra, -4
; RV32I-SW-NEXT: .cfi_offset s0, -8
; RV32I-SW-NEXT: .cfi_offset s1, -12
; RV32I-SW-NEXT: li s1, 57
; RV32I-SW-NEXT: beq a0, s1, .LBB2_3
; RV32I-SW-NEXT: # %bb.1: # %do_call
; RV32I-SW-NEXT: mv s0, a1
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: beq s0, s1, .LBB2_3
; RV32I-SW-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: .LBB2_3: # %exit
; RV32I-SW-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s1, 4(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: .cfi_restore ra
; RV32I-SW-NEXT: .cfi_restore s0
; RV32I-SW-NEXT: .cfi_restore s1
; RV32I-SW-NEXT: addi sp, sp, 16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NEXT: ret
;
; RV32I-SW-SR-LABEL: li_straightline_a:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: call t0, __riscv_save_2
; RV32I-SW-SR-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-SR-NEXT: .cfi_offset ra, -4
; RV32I-SW-SR-NEXT: .cfi_offset s0, -8
; RV32I-SW-SR-NEXT: .cfi_offset s1, -12
; RV32I-SW-SR-NEXT: li s1, 57
; RV32I-SW-SR-NEXT: beq a0, s1, .LBB2_3
; RV32I-SW-SR-NEXT: # %bb.1: # %do_call
; RV32I-SW-SR-NEXT: mv s0, a1
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: beq s0, s1, .LBB2_3
; RV32I-SW-SR-NEXT: # %bb.2: # %do_call2
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: .LBB2_3: # %exit
; RV32I-SW-SR-NEXT: tail __riscv_restore_2
;
; RV64I-SW-LABEL: li_straightline_a:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: addi sp, sp, -32
; RV64I-SW-NEXT: .cfi_def_cfa_offset 32
; RV64I-SW-NEXT: sd ra, 24(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s0, 16(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s1, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: .cfi_offset ra, -8
; RV64I-SW-NEXT: .cfi_offset s0, -16
; RV64I-SW-NEXT: .cfi_offset s1, -24
; RV64I-SW-NEXT: li s1, 57
; RV64I-SW-NEXT: beq a0, s1, .LBB2_3
; RV64I-SW-NEXT: # %bb.1: # %do_call
; RV64I-SW-NEXT: mv s0, a1
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: beq s0, s1, .LBB2_3
; RV64I-SW-NEXT: # %bb.2: # %do_call2
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: .LBB2_3: # %exit
; RV64I-SW-NEXT: ld ra, 24(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s0, 16(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s1, 8(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: .cfi_restore ra
; RV64I-SW-NEXT: .cfi_restore s0
; RV64I-SW-NEXT: .cfi_restore s1
; RV64I-SW-NEXT: addi sp, sp, 32
; RV64I-SW-NEXT: .cfi_def_cfa_offset 0
; RV64I-SW-NEXT: ret
  %cmp0 = icmp eq i32 %a, 57
  br i1 %cmp0, label %exit, label %do_call

do_call:
  call i32 @foo()
  %cmp1 = icmp eq i32 %b, 57
  br i1 %cmp1, label %exit, label %do_call2

do_call2:
  call i32 @foo()
  br label %exit

exit:
  ret void
}
; FIXME: The "mv s0, a1" is only required along the do_call path, and can
; be sunk there. We can also shrink wrap to avoid the frame setup along
; the %bb.0 -> %exit edge.
define void @li_straightline_b(i32 zeroext %a, i32 zeroext %b) {
; RV32I-SW-NO-LABEL: li_straightline_b:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: .cfi_offset ra, -4
; RV32I-SW-NO-NEXT: .cfi_offset s0, -8
; RV32I-SW-NO-NEXT: mv s0, a1
; RV32I-SW-NO-NEXT: li a1, 57
; RV32I-SW-NO-NEXT: beq a0, a1, .LBB3_3
; RV32I-SW-NO-NEXT: # %bb.1: # %do_call
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: li a0, 57
; RV32I-SW-NO-NEXT: beq s0, a0, .LBB3_3
; RV32I-SW-NO-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: .LBB3_3: # %exit
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: .cfi_restore ra
; RV32I-SW-NO-NEXT: .cfi_restore s0
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NO-NEXT: ret
;
; RV32I-SW-LABEL: li_straightline_b:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: .cfi_offset ra, -4
; RV32I-SW-NEXT: .cfi_offset s0, -8
; RV32I-SW-NEXT: mv s0, a1
; RV32I-SW-NEXT: li a1, 57
; RV32I-SW-NEXT: beq a0, a1, .LBB3_3
; RV32I-SW-NEXT: # %bb.1: # %do_call
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: li a0, 57
; RV32I-SW-NEXT: beq s0, a0, .LBB3_3
; RV32I-SW-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: .LBB3_3: # %exit
; RV32I-SW-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: .cfi_restore ra
; RV32I-SW-NEXT: .cfi_restore s0
; RV32I-SW-NEXT: addi sp, sp, 16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NEXT: ret
;
; RV32I-SW-SR-LABEL: li_straightline_b:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: call t0, __riscv_save_1
; RV32I-SW-SR-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-SR-NEXT: .cfi_offset ra, -4
; RV32I-SW-SR-NEXT: .cfi_offset s0, -8
; RV32I-SW-SR-NEXT: mv s0, a1
; RV32I-SW-SR-NEXT: li a1, 57
; RV32I-SW-SR-NEXT: beq a0, a1, .LBB3_3
; RV32I-SW-SR-NEXT: # %bb.1: # %do_call
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: li a0, 57
; RV32I-SW-SR-NEXT: beq s0, a0, .LBB3_3
; RV32I-SW-SR-NEXT: # %bb.2: # %do_call2
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: .LBB3_3: # %exit
; RV32I-SW-SR-NEXT: tail __riscv_restore_1
;
; RV64I-SW-LABEL: li_straightline_b:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: addi sp, sp, -16
; RV64I-SW-NEXT: .cfi_def_cfa_offset 16
; RV64I-SW-NEXT: sd ra, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s0, 0(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: .cfi_offset ra, -8
; RV64I-SW-NEXT: .cfi_offset s0, -16
; RV64I-SW-NEXT: mv s0, a1
; RV64I-SW-NEXT: li a1, 57
; RV64I-SW-NEXT: beq a0, a1, .LBB3_3
; RV64I-SW-NEXT: # %bb.1: # %do_call
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: li a0, 57
; RV64I-SW-NEXT: beq s0, a0, .LBB3_3
; RV64I-SW-NEXT: # %bb.2: # %do_call2
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: .LBB3_3: # %exit
; RV64I-SW-NEXT: ld ra, 8(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s0, 0(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: .cfi_restore ra
; RV64I-SW-NEXT: .cfi_restore s0
; RV64I-SW-NEXT: addi sp, sp, 16
; RV64I-SW-NEXT: .cfi_def_cfa_offset 0
; RV64I-SW-NEXT: ret
  %cmp0 = icmp eq i32 %a, 57
  br i1 %cmp0, label %exit, label %do_call

do_call:
  call i32 @foo()
  br label %next

next:
  %cmp1 = icmp eq i32 %b, 57
  br i1 %cmp1, label %exit, label %do_call2

do_call2:
  call i32 @foo()
  br label %exit

exit:
  ret void
}
; A further variant of "b" to show that we can shrink wrap this case
; if the second use of 57 is remat, and we eliminate the second live
; argument.
define void @li_straightline_c(i32 zeroext %a) {
; RV32I-SW-NO-LABEL: li_straightline_c:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: .cfi_offset ra, -4
; RV32I-SW-NO-NEXT: li a1, 57
; RV32I-SW-NO-NEXT: beq a0, a1, .LBB4_3
; RV32I-SW-NO-NEXT: # %bb.1: # %do_call
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: li a1, 57
; RV32I-SW-NO-NEXT: beq a0, a1, .LBB4_3
; RV32I-SW-NO-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: .LBB4_3: # %exit
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: .cfi_restore ra
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NO-NEXT: ret
;
; RV32I-SW-LABEL: li_straightline_c:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: li a1, 57
; RV32I-SW-NEXT: beq a0, a1, .LBB4_4
; RV32I-SW-NEXT: # %bb.1: # %do_call
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: .cfi_offset ra, -4
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: li a1, 57
; RV32I-SW-NEXT: beq a0, a1, .LBB4_3
; RV32I-SW-NEXT: # %bb.2: # %do_call2
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: .LBB4_3:
; RV32I-SW-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: .cfi_restore ra
; RV32I-SW-NEXT: addi sp, sp, 16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NEXT: .LBB4_4: # %exit
; RV32I-SW-NEXT: ret
;
; RV32I-SW-SR-LABEL: li_straightline_c:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: li a1, 57
; RV32I-SW-SR-NEXT: beq a0, a1, .LBB4_4
; RV32I-SW-SR-NEXT: # %bb.1: # %do_call
; RV32I-SW-SR-NEXT: call t0, __riscv_save_0
; RV32I-SW-SR-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-SR-NEXT: .cfi_offset ra, -4
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: li a1, 57
; RV32I-SW-SR-NEXT: beq a0, a1, .LBB4_3
; RV32I-SW-SR-NEXT: # %bb.2: # %do_call2
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: .LBB4_3:
; RV32I-SW-SR-NEXT: tail __riscv_restore_0
; RV32I-SW-SR-NEXT: j .LBB4_4
; RV32I-SW-SR-NEXT: .LBB4_4: # %exit
; RV32I-SW-SR-NEXT: ret
;
; RV64I-SW-LABEL: li_straightline_c:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: li a1, 57
; RV64I-SW-NEXT: beq a0, a1, .LBB4_4
; RV64I-SW-NEXT: # %bb.1: # %do_call
; RV64I-SW-NEXT: addi sp, sp, -16
; RV64I-SW-NEXT: .cfi_def_cfa_offset 16
; RV64I-SW-NEXT: sd ra, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: .cfi_offset ra, -8
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: li a1, 57
; RV64I-SW-NEXT: beq a0, a1, .LBB4_3
; RV64I-SW-NEXT: # %bb.2: # %do_call2
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: .LBB4_3:
; RV64I-SW-NEXT: ld ra, 8(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: .cfi_restore ra
; RV64I-SW-NEXT: addi sp, sp, 16
; RV64I-SW-NEXT: .cfi_def_cfa_offset 0
; RV64I-SW-NEXT: .LBB4_4: # %exit
; RV64I-SW-NEXT: ret
  %cmp0 = icmp eq i32 %a, 57
  br i1 %cmp0, label %exit, label %do_call

do_call:
  %b = call i32 @foo()
  br label %next

next:
  %cmp1 = icmp eq i32 %b, 57
  br i1 %cmp1, label %exit, label %do_call2

do_call2:
  call i32 @foo()
  br label %exit

exit:
  ret void
}
; In this case, the second use is in a loop, so using a callee
; saved register to avoid a remat is the profitable choice.
; FIXME: We can shrink wrap the frame setup around the loop
; and avoid it along the %bb.0 -> %exit edge
define void @li_loop(i32 zeroext %a, i32 zeroext %b) {
; RV32I-SW-NO-LABEL: li_loop:
; RV32I-SW-NO: # %bb.0:
; RV32I-SW-NO-NEXT: addi sp, sp, -16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NO-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: sw s1, 4(sp) # 4-byte Folded Spill
; RV32I-SW-NO-NEXT: .cfi_offset ra, -4
; RV32I-SW-NO-NEXT: .cfi_offset s0, -8
; RV32I-SW-NO-NEXT: .cfi_offset s1, -12
; RV32I-SW-NO-NEXT: li s1, 57
; RV32I-SW-NO-NEXT: beq a0, s1, .LBB5_3
; RV32I-SW-NO-NEXT: # %bb.1: # %do_call.preheader
; RV32I-SW-NO-NEXT: mv s0, a1
; RV32I-SW-NO-NEXT: .LBB5_2: # %do_call
; RV32I-SW-NO-NEXT: # =>This Inner Loop Header: Depth=1
; RV32I-SW-NO-NEXT: call foo
; RV32I-SW-NO-NEXT: bne s0, s1, .LBB5_2
; RV32I-SW-NO-NEXT: .LBB5_3: # %exit
; RV32I-SW-NO-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: lw s1, 4(sp) # 4-byte Folded Reload
; RV32I-SW-NO-NEXT: .cfi_restore ra
; RV32I-SW-NO-NEXT: .cfi_restore s0
; RV32I-SW-NO-NEXT: .cfi_restore s1
; RV32I-SW-NO-NEXT: addi sp, sp, 16
; RV32I-SW-NO-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NO-NEXT: ret
;
; RV32I-SW-LABEL: li_loop:
; RV32I-SW: # %bb.0:
; RV32I-SW-NEXT: addi sp, sp, -16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: sw s1, 4(sp) # 4-byte Folded Spill
; RV32I-SW-NEXT: .cfi_offset ra, -4
; RV32I-SW-NEXT: .cfi_offset s0, -8
; RV32I-SW-NEXT: .cfi_offset s1, -12
; RV32I-SW-NEXT: li s1, 57
; RV32I-SW-NEXT: beq a0, s1, .LBB5_3
; RV32I-SW-NEXT: # %bb.1: # %do_call.preheader
; RV32I-SW-NEXT: mv s0, a1
; RV32I-SW-NEXT: .LBB5_2: # %do_call
; RV32I-SW-NEXT: # =>This Inner Loop Header: Depth=1
; RV32I-SW-NEXT: call foo
; RV32I-SW-NEXT: bne s0, s1, .LBB5_2
; RV32I-SW-NEXT: .LBB5_3: # %exit
; RV32I-SW-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: lw s1, 4(sp) # 4-byte Folded Reload
; RV32I-SW-NEXT: .cfi_restore ra
; RV32I-SW-NEXT: .cfi_restore s0
; RV32I-SW-NEXT: .cfi_restore s1
; RV32I-SW-NEXT: addi sp, sp, 16
; RV32I-SW-NEXT: .cfi_def_cfa_offset 0
; RV32I-SW-NEXT: ret
;
; RV32I-SW-SR-LABEL: li_loop:
; RV32I-SW-SR: # %bb.0:
; RV32I-SW-SR-NEXT: call t0, __riscv_save_2
; RV32I-SW-SR-NEXT: .cfi_def_cfa_offset 16
; RV32I-SW-SR-NEXT: .cfi_offset ra, -4
; RV32I-SW-SR-NEXT: .cfi_offset s0, -8
; RV32I-SW-SR-NEXT: .cfi_offset s1, -12
; RV32I-SW-SR-NEXT: li s1, 57
; RV32I-SW-SR-NEXT: beq a0, s1, .LBB5_3
; RV32I-SW-SR-NEXT: # %bb.1: # %do_call.preheader
; RV32I-SW-SR-NEXT: mv s0, a1
; RV32I-SW-SR-NEXT: .LBB5_2: # %do_call
; RV32I-SW-SR-NEXT: # =>This Inner Loop Header: Depth=1
; RV32I-SW-SR-NEXT: call foo
; RV32I-SW-SR-NEXT: bne s0, s1, .LBB5_2
; RV32I-SW-SR-NEXT: .LBB5_3: # %exit
; RV32I-SW-SR-NEXT: tail __riscv_restore_2
;
; RV64I-SW-LABEL: li_loop:
; RV64I-SW: # %bb.0:
; RV64I-SW-NEXT: addi sp, sp, -32
; RV64I-SW-NEXT: .cfi_def_cfa_offset 32
; RV64I-SW-NEXT: sd ra, 24(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s0, 16(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: sd s1, 8(sp) # 8-byte Folded Spill
; RV64I-SW-NEXT: .cfi_offset ra, -8
; RV64I-SW-NEXT: .cfi_offset s0, -16
; RV64I-SW-NEXT: .cfi_offset s1, -24
; RV64I-SW-NEXT: li s1, 57
; RV64I-SW-NEXT: beq a0, s1, .LBB5_3
; RV64I-SW-NEXT: # %bb.1: # %do_call.preheader
; RV64I-SW-NEXT: mv s0, a1
; RV64I-SW-NEXT: .LBB5_2: # %do_call
; RV64I-SW-NEXT: # =>This Inner Loop Header: Depth=1
; RV64I-SW-NEXT: call foo
; RV64I-SW-NEXT: bne s0, s1, .LBB5_2
; RV64I-SW-NEXT: .LBB5_3: # %exit
; RV64I-SW-NEXT: ld ra, 24(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s0, 16(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: ld s1, 8(sp) # 8-byte Folded Reload
; RV64I-SW-NEXT: .cfi_restore ra
; RV64I-SW-NEXT: .cfi_restore s0
; RV64I-SW-NEXT: .cfi_restore s1
; RV64I-SW-NEXT: addi sp, sp, 32
; RV64I-SW-NEXT: .cfi_def_cfa_offset 0
; RV64I-SW-NEXT: ret
  %cmp0 = icmp eq i32 %a, 57
  br i1 %cmp0, label %exit, label %do_call

do_call:
  call i32 @foo()
  %cmp1 = icmp eq i32 %b, 57
  br i1 %cmp1, label %exit, label %do_call

exit:
  ret void
}
declare zeroext i32 @foo()