Craig Topper c9714d2035
[RISCV] Add profitability checks to SelectAddrRegRegScale. (#150135)
-Only fold if the ADD can be folded into all uses.
-Don't reassociate an ADDI if the shl+add can be a shxadd or similar
instruction.
-Only reassociate a single ADDI. If there are 2 addis it's the same
number of instructions as shl+add. If there are more than 2 that it
would increase instructions over folding the addis into the
loads/stores.
2025-07-22 21:10:52 -07:00

516 lines
14 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \
; RUN: | FileCheck %s -check-prefixes=RV32I
; RUN: llc -mtriple=riscv32 --mattr=+zba -verify-machineinstrs < %s \
; RUN: | FileCheck %s -check-prefixes=RV32IZBA
; RUN: llc -mtriple=riscv32 -mattr=+zba,+experimental-xqcisls -verify-machineinstrs < %s \
; RUN: | FileCheck %s -check-prefixes=RV32IZBAXQCISLS
define i32 @lb_ri(i8* %a, i32 %b) {
; RV32I-LABEL: lb_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 3
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lb a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lb_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh3add a0, a1, a0
; RV32IZBA-NEXT: lb a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lb_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrb a0, a0, a1, 3
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %b, 3
%1 = getelementptr i8, i8* %a, i32 %shl
%2 = load i8, i8* %1
%3 = sext i8 %2 to i32
ret i32 %3
}
define i32 @lbu_ri(i8* %a, i32 %b) {
; RV32I-LABEL: lbu_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 2
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lbu a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lbu_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh2add a0, a1, a0
; RV32IZBA-NEXT: lbu a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lbu_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrbu a0, a0, a1, 2
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %b, 2
%1 = getelementptr i8, i8* %a, i32 %shl
%2 = load i8, i8* %1
%3 = zext i8 %2 to i32
ret i32 %3
}
define i32 @lh_ri(i16* %a, i32 %b) {
; RV32I-LABEL: lh_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 5
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lh a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lh_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: slli a1, a1, 5
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lh a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lh_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrh a0, a0, a1, 5
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %b, 4
%1 = getelementptr i16, i16* %a, i32 %shl
%2 = load i16, i16* %1
%3 = sext i16 %2 to i32
ret i32 %3
}
define i32 @lhu_ri(i16* %a, i32 %b) {
; RV32I-LABEL: lhu_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 6
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lhu a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lhu_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: slli a1, a1, 6
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lhu a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lhu_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrhu a0, a0, a1, 6
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %b, 5
%1 = getelementptr i16, i16* %a, i32 %shl
%2 = load i16, i16* %1
%3 = zext i16 %2 to i32
ret i32 %3
}
define i32 @lw_ri(i32* %a, i32 %b) {
; RV32I-LABEL: lw_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 6
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lw a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lw_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: slli a1, a1, 6
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lw a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lw_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrw a0, a0, a1, 6
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %b, 4
%1 = getelementptr i32, i32* %a, i32 %shl
%2 = load i32, i32* %1
ret i32 %2
}
define void @sb_ri(i8* %a, i8 %b, i32 %c) {
; RV32I-LABEL: sb_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a2, a2, 7
; RV32I-NEXT: add a0, a0, a2
; RV32I-NEXT: sb a1, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: sb_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: slli a2, a2, 7
; RV32IZBA-NEXT: add a0, a0, a2
; RV32IZBA-NEXT: sb a1, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: sb_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.srb a1, a0, a2, 7
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %c, 7
%1 = getelementptr i8, i8* %a, i32 %shl
store i8 %b, i8* %1
ret void
}
define void @sh_ri(i16* %a, i16 %b, i32 %c) {
; RV32I-LABEL: sh_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a2, a2, 3
; RV32I-NEXT: add a0, a0, a2
; RV32I-NEXT: sh a1, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: sh_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh3add a0, a2, a0
; RV32IZBA-NEXT: sh a1, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: sh_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.srh a1, a0, a2, 3
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %c, 2
%1 = getelementptr i16, i16* %a, i32 %shl
store i16 %b, i16* %1
ret void
}
define void @sw_ri(i32* %a, i32 %b, i32 %c) {
; RV32I-LABEL: sw_ri:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a2, a2, 3
; RV32I-NEXT: add a0, a0, a2
; RV32I-NEXT: sw a1, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: sw_ri:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh3add a0, a2, a0
; RV32IZBA-NEXT: sw a1, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: sw_ri:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.srw a1, a0, a2, 3
; RV32IZBAXQCISLS-NEXT: ret
%shl = shl i32 %c, 1
%1 = getelementptr i32, i32* %a, i32 %shl
store i32 %b, i32* %1
ret void
}
define i8 @lrb_anyext(ptr %a, i32 %b) {
; RV32I-LABEL: lrb_anyext:
; RV32I: # %bb.0:
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lbu a0, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrb_anyext:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lbu a0, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrb_anyext:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrbu a0, a0, a1, 0
; RV32IZBAXQCISLS-NEXT: ret
%1 = getelementptr i8, ptr %a, i32 %b
%2 = load i8, ptr %1, align 1
ret i8 %2
}
define i32 @lrb(ptr %a, i32 %b) {
; RV32I-LABEL: lrb:
; RV32I: # %bb.0:
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lb a0, 0(a0)
; RV32I-NEXT: add a0, a0, a0
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrb:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lb a0, 0(a0)
; RV32IZBA-NEXT: add a0, a0, a0
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrb:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrb a0, a0, a1, 0
; RV32IZBAXQCISLS-NEXT: add a0, a0, a0
; RV32IZBAXQCISLS-NEXT: ret
%1 = getelementptr i8, ptr %a, i32 %b
%2 = load i8, ptr %1, align 1
%3 = sext i8 %2 to i32
%4 = add i32 %3, %3
ret i32 %4
}
define i32 @lrbu(ptr %a, i32 %b) {
; RV32I-LABEL: lrbu:
; RV32I: # %bb.0:
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lbu a0, 0(a0)
; RV32I-NEXT: add a0, a0, a0
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrbu:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: lbu a0, 0(a0)
; RV32IZBA-NEXT: add a0, a0, a0
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrbu:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: qc.lrbu a0, a0, a1, 0
; RV32IZBAXQCISLS-NEXT: add a0, a0, a0
; RV32IZBAXQCISLS-NEXT: ret
%1 = getelementptr i8, ptr %a, i32 %b
%2 = load i8, ptr %1, align 1
%3 = zext i8 %2 to i32
%4 = add i32 %3, %3
ret i32 %4
}
define i64 @lrd(ptr %a, i32 %b) {
; RV32I-LABEL: lrd:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 3
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: lw a1, 0(a0)
; RV32I-NEXT: lw a2, 4(a0)
; RV32I-NEXT: add a0, a1, a1
; RV32I-NEXT: sltu a1, a0, a1
; RV32I-NEXT: add a2, a2, a2
; RV32I-NEXT: add a1, a2, a1
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrd:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh3add a0, a1, a0
; RV32IZBA-NEXT: lw a1, 0(a0)
; RV32IZBA-NEXT: lw a2, 4(a0)
; RV32IZBA-NEXT: add a0, a1, a1
; RV32IZBA-NEXT: sltu a1, a0, a1
; RV32IZBA-NEXT: add a2, a2, a2
; RV32IZBA-NEXT: add a1, a2, a1
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrd:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: sh3add a0, a1, a0
; RV32IZBAXQCISLS-NEXT: lw a1, 0(a0)
; RV32IZBAXQCISLS-NEXT: lw a2, 4(a0)
; RV32IZBAXQCISLS-NEXT: add a0, a1, a1
; RV32IZBAXQCISLS-NEXT: sltu a1, a0, a1
; RV32IZBAXQCISLS-NEXT: add a2, a2, a2
; RV32IZBAXQCISLS-NEXT: add a1, a2, a1
; RV32IZBAXQCISLS-NEXT: ret
%1 = getelementptr i64, ptr %a, i32 %b
%2 = load i64, ptr %1, align 8
%3 = add i64 %2, %2
ret i64 %3
}
define i64 @lrd_2(ptr %a, i32 %b) {
; RV32I-LABEL: lrd_2:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 3
; RV32I-NEXT: add a0, a1, a0
; RV32I-NEXT: lw a1, 96(a0)
; RV32I-NEXT: lw a2, 100(a0)
; RV32I-NEXT: add a0, a1, a1
; RV32I-NEXT: sltu a1, a0, a1
; RV32I-NEXT: add a2, a2, a2
; RV32I-NEXT: add a1, a2, a1
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrd_2:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: sh3add a0, a1, a0
; RV32IZBA-NEXT: lw a1, 96(a0)
; RV32IZBA-NEXT: lw a2, 100(a0)
; RV32IZBA-NEXT: add a0, a1, a1
; RV32IZBA-NEXT: sltu a1, a0, a1
; RV32IZBA-NEXT: add a2, a2, a2
; RV32IZBA-NEXT: add a1, a2, a1
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrd_2:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: sh3add a0, a1, a0
; RV32IZBAXQCISLS-NEXT: lw a1, 96(a0)
; RV32IZBAXQCISLS-NEXT: lw a2, 100(a0)
; RV32IZBAXQCISLS-NEXT: add a0, a1, a1
; RV32IZBAXQCISLS-NEXT: sltu a1, a0, a1
; RV32IZBAXQCISLS-NEXT: add a2, a2, a2
; RV32IZBAXQCISLS-NEXT: add a1, a2, a1
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i32 %b, 12
%2 = getelementptr i64, ptr %a, i32 %1
%3 = load i64, ptr %2, align 8
%4 = add i64 %3, %3
ret i64 %4
}
define void @srb(ptr %a, i32 %b, i8 %c) {
; RV32I-LABEL: srb:
; RV32I: # %bb.0:
; RV32I-NEXT: add a2, a2, a2
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: sb a2, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: srb:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a2, a2, a2
; RV32IZBA-NEXT: add a0, a0, a1
; RV32IZBA-NEXT: sb a2, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: srb:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: add a2, a2, a2
; RV32IZBAXQCISLS-NEXT: qc.srb a2, a0, a1, 0
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i8 %c, %c
%2 = getelementptr i8, ptr %a, i32 %b
store i8 %1, ptr %2, align 1
ret void
}
define void @srh(ptr %a, i32 %b, i16 %c) {
; RV32I-LABEL: srh:
; RV32I: # %bb.0:
; RV32I-NEXT: add a2, a2, a2
; RV32I-NEXT: slli a1, a1, 1
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: sh a2, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: srh:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a2, a2, a2
; RV32IZBA-NEXT: sh1add a0, a1, a0
; RV32IZBA-NEXT: sh a2, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: srh:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: add a2, a2, a2
; RV32IZBAXQCISLS-NEXT: qc.srh a2, a0, a1, 1
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i16 %c, %c
%2 = getelementptr i16, ptr %a, i32 %b
store i16 %1, ptr %2, align 2
ret void
}
define void @srw(ptr %a, i32 %b, i32 %c) {
; RV32I-LABEL: srw:
; RV32I: # %bb.0:
; RV32I-NEXT: add a2, a2, a2
; RV32I-NEXT: slli a1, a1, 2
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: sw a2, 0(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: srw:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a2, a2, a2
; RV32IZBA-NEXT: sh2add a0, a1, a0
; RV32IZBA-NEXT: sw a2, 0(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: srw:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: add a2, a2, a2
; RV32IZBAXQCISLS-NEXT: qc.srw a2, a0, a1, 2
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i32 %c, %c
%2 = getelementptr i32, ptr %a, i32 %b
store i32 %1, ptr %2, align 4
ret void
}
define void @srd(ptr %a, i32 %b, i64 %c) {
; RV32I-LABEL: srd:
; RV32I: # %bb.0:
; RV32I-NEXT: add a4, a2, a2
; RV32I-NEXT: add a3, a3, a3
; RV32I-NEXT: slli a1, a1, 3
; RV32I-NEXT: sltu a2, a4, a2
; RV32I-NEXT: add a0, a0, a1
; RV32I-NEXT: add a2, a3, a2
; RV32I-NEXT: sw a4, 0(a0)
; RV32I-NEXT: sw a2, 4(a0)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: srd:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: add a4, a2, a2
; RV32IZBA-NEXT: add a3, a3, a3
; RV32IZBA-NEXT: sh3add a0, a1, a0
; RV32IZBA-NEXT: sltu a1, a4, a2
; RV32IZBA-NEXT: add a1, a3, a1
; RV32IZBA-NEXT: sw a4, 0(a0)
; RV32IZBA-NEXT: sw a1, 4(a0)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: srd:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: add a4, a2, a2
; RV32IZBAXQCISLS-NEXT: add a3, a3, a3
; RV32IZBAXQCISLS-NEXT: sh3add a0, a1, a0
; RV32IZBAXQCISLS-NEXT: sltu a1, a4, a2
; RV32IZBAXQCISLS-NEXT: add a1, a3, a1
; RV32IZBAXQCISLS-NEXT: sw a4, 0(a0)
; RV32IZBAXQCISLS-NEXT: sw a1, 4(a0)
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i64 %c, %c
%2 = getelementptr i64, ptr %a, i32 %b
store i64 %1, ptr %2, align 8
ret void
}
define i64 @lrd_large_shift(ptr %a, i32 %b) {
; RV32I-LABEL: lrd_large_shift:
; RV32I: # %bb.0:
; RV32I-NEXT: slli a1, a1, 5
; RV32I-NEXT: add a1, a1, a0
; RV32I-NEXT: lw a0, 384(a1)
; RV32I-NEXT: lw a1, 388(a1)
; RV32I-NEXT: ret
;
; RV32IZBA-LABEL: lrd_large_shift:
; RV32IZBA: # %bb.0:
; RV32IZBA-NEXT: slli a1, a1, 5
; RV32IZBA-NEXT: add a1, a1, a0
; RV32IZBA-NEXT: lw a0, 384(a1)
; RV32IZBA-NEXT: lw a1, 388(a1)
; RV32IZBA-NEXT: ret
;
; RV32IZBAXQCISLS-LABEL: lrd_large_shift:
; RV32IZBAXQCISLS: # %bb.0:
; RV32IZBAXQCISLS-NEXT: slli a1, a1, 5
; RV32IZBAXQCISLS-NEXT: add a1, a1, a0
; RV32IZBAXQCISLS-NEXT: lw a0, 384(a1)
; RV32IZBAXQCISLS-NEXT: lw a1, 388(a1)
; RV32IZBAXQCISLS-NEXT: ret
%1 = add i32 %b, 12
%2 = shl i32 %1, 2
%3 = getelementptr i64, ptr %a, i32 %2
%4 = load i64, ptr %3, align 8
ret i64 %4
}