
#121386 Introduced cttz intrinsics which caused a regression where vscale/vscale divisions could no longer be constant folded. This fold was suggested as a fix in #126411. https://alive2.llvm.org/ce/z/gWbtPw
137 lines
4.2 KiB
LLVM
137 lines
4.2 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
|
|
; RUN: opt < %s -passes=instcombine -S | FileCheck %s
|
|
|
|
define i32 @shl_cttz_false(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @shl_cttz_false(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 true)
|
|
; CHECK-NEXT: [[RES:%.*]] = shl i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
%res = shl i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
; Make sure that noundef is dropped.
|
|
|
|
define i32 @shl_cttz_false_noundef(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @shl_cttz_false_noundef(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 true)
|
|
; CHECK-NEXT: [[RES:%.*]] = shl i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call noundef i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
%res = shl i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @shl_ctlz_false(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @shl_ctlz_false(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.ctlz.i32(i32 [[Y]], i1 true)
|
|
; CHECK-NEXT: [[RES:%.*]] = shl i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.ctlz.i32(i32 %y, i1 false)
|
|
%res = shl i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @lshr_cttz_false(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @lshr_cttz_false(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 true)
|
|
; CHECK-NEXT: [[RES:%.*]] = lshr i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
%res = lshr i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @ashr_cttz_false(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @ashr_cttz_false(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 true)
|
|
; CHECK-NEXT: [[RES:%.*]] = ashr i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
%res = ashr i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @shl_cttz_false_multiuse(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @shl_cttz_false_multiuse(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 false)
|
|
; CHECK-NEXT: call void @use(i32 [[CTTZ]])
|
|
; CHECK-NEXT: [[RES:%.*]] = shl i32 [[X]], [[CTTZ]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
call void @use(i32 %cttz)
|
|
%res = shl i32 %x, %cttz
|
|
ret i32 %res
|
|
}
|
|
|
|
define i32 @shl_cttz_as_lhs(i32 %x, i32 %y) {
|
|
; CHECK-LABEL: define i32 @shl_cttz_as_lhs(
|
|
; CHECK-SAME: i32 [[X:%.*]], i32 [[Y:%.*]]) {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[CTTZ:%.*]] = call range(i32 0, 33) i32 @llvm.cttz.i32(i32 [[Y]], i1 false)
|
|
; CHECK-NEXT: [[RES:%.*]] = shl i32 [[CTTZ]], [[X]]
|
|
; CHECK-NEXT: ret i32 [[RES]]
|
|
;
|
|
entry:
|
|
%cttz = call i32 @llvm.cttz.i32(i32 %y, i1 false)
|
|
%res = shl i32 %cttz, %x
|
|
ret i32 %res
|
|
}
|
|
|
|
define i64 @fold_cttz_64() vscale_range(1,16) {
|
|
; CHECK-LABEL: define i64 @fold_cttz_64(
|
|
; CHECK-SAME: ) #[[ATTR0:[0-9]+]] {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: ret i64 4
|
|
;
|
|
entry:
|
|
%vscale = tail call i64 @llvm.vscale.i64()
|
|
%shl0 = shl nuw nsw i64 %vscale, 4
|
|
%shl1 = shl nuw nsw i64 %vscale, 2
|
|
%cttz = tail call range(i64 2, 65) i64 @llvm.cttz.i64(i64 %shl1, i1 true)
|
|
%div1 = lshr i64 %shl0, %cttz
|
|
ret i64 %div1
|
|
}
|
|
|
|
define i32 @fold_cttz_32() vscale_range(1,16) {
|
|
; CHECK-LABEL: define i32 @fold_cttz_32(
|
|
; CHECK-SAME: ) #[[ATTR0]] {
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: ret i32 4
|
|
;
|
|
entry:
|
|
%vscale = tail call i32 @llvm.vscale.i32()
|
|
%shl0 = shl nuw nsw i32 %vscale, 4
|
|
%shl1 = shl nuw nsw i32 %vscale, 2
|
|
%cttz = tail call range(i32 2, 65) i32 @llvm.cttz.i32(i32 %shl1, i1 true)
|
|
%div1 = lshr i32 %shl0, %cttz
|
|
ret i32 %div1
|
|
}
|
|
|
|
declare void @use(i32)
|