Generalize VPWidenSelectRecipe codegen to consider single-scalar conditions instead of just loop-invariant ones. If the condition is a single-scalar, we can simply use a scalar condition. PR: https://github.com/llvm/llvm-project/pull/165506
80 lines
3.9 KiB
LLVM
80 lines
3.9 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
|
; RUN: opt < %s -force-vector-width=2 -force-vector-interleave=1 -force-widen-divrem-via-safe-divisor=0 -passes=loop-vectorize -S | FileCheck %s
|
|
|
|
; Test case for PR44488. Checks that the correct predicates are created for
|
|
; branches where true and false successors are equal. See the checks involving
|
|
; CMP1 and CMP2.
|
|
|
|
@v_38 = global i16 12061, align 1
|
|
@v_39 = global i16 11333, align 1
|
|
|
|
define i16 @test_true_and_false_branch_equal() {
|
|
; CHECK-LABEL: @test_true_and_false_branch_equal(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: br label [[VECTOR_PH:%.*]]
|
|
; CHECK: vector.ph:
|
|
; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
|
|
; CHECK: vector.body:
|
|
; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[PRED_SREM_CONTINUE2:%.*]] ]
|
|
; CHECK-NEXT: [[TMP0:%.*]] = load i16, ptr @v_38, align 1
|
|
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x i16> poison, i16 [[TMP0]], i64 0
|
|
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x i16> [[BROADCAST_SPLATINSERT]], <2 x i16> poison, <2 x i32> zeroinitializer
|
|
; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <2 x i16> [[BROADCAST_SPLAT]], zeroinitializer
|
|
; CHECK-NEXT: [[TMP3:%.*]] = extractelement <2 x i1> [[TMP2]], i32 0
|
|
; CHECK-NEXT: br i1 [[TMP3]], label [[PRED_SREM_IF:%.*]], label [[PRED_SREM_CONTINUE:%.*]]
|
|
; CHECK: pred.srem.if:
|
|
; CHECK-NEXT: [[TMP4:%.*]] = srem i16 5786, [[TMP0]]
|
|
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <2 x i16> poison, i16 [[TMP4]], i32 0
|
|
; CHECK-NEXT: br label [[PRED_SREM_CONTINUE]]
|
|
; CHECK: pred.srem.continue:
|
|
; CHECK-NEXT: [[TMP6:%.*]] = phi <2 x i16> [ poison, [[VECTOR_BODY]] ], [ [[TMP5]], [[PRED_SREM_IF]] ]
|
|
; CHECK-NEXT: [[TMP7:%.*]] = extractelement <2 x i1> [[TMP2]], i32 1
|
|
; CHECK-NEXT: br i1 [[TMP7]], label [[PRED_SREM_IF1:%.*]], label [[PRED_SREM_CONTINUE2]]
|
|
; CHECK: pred.srem.if1:
|
|
; CHECK-NEXT: [[TMP8:%.*]] = srem i16 5786, [[TMP0]]
|
|
; CHECK-NEXT: [[TMP9:%.*]] = insertelement <2 x i16> [[TMP6]], i16 [[TMP8]], i32 1
|
|
; CHECK-NEXT: br label [[PRED_SREM_CONTINUE2]]
|
|
; CHECK: pred.srem.continue2:
|
|
; CHECK-NEXT: [[TMP10:%.*]] = phi <2 x i16> [ [[TMP6]], [[PRED_SREM_CONTINUE]] ], [ [[TMP9]], [[PRED_SREM_IF1]] ]
|
|
; CHECK-NEXT: [[TMP13:%.*]] = extractelement <2 x i1> [[TMP2]], i32 0
|
|
; CHECK-NEXT: [[PREDPHI:%.*]] = select i1 [[TMP13]], <2 x i16> [[TMP10]], <2 x i16> splat (i16 5786)
|
|
; CHECK-NEXT: [[TMP11:%.*]] = extractelement <2 x i16> [[PREDPHI]], i32 1
|
|
; CHECK-NEXT: store i16 [[TMP11]], ptr @v_39, align 1
|
|
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2
|
|
; CHECK-NEXT: [[TMP12:%.*]] = icmp eq i32 [[INDEX_NEXT]], 12
|
|
; CHECK-NEXT: br i1 [[TMP12]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
|
|
; CHECK: middle.block:
|
|
; CHECK-NEXT: br label [[FOR_LATCH:%.*]]
|
|
; CHECK: exit:
|
|
; CHECK-NEXT: [[RV:%.*]] = load i16, ptr @v_39, align 1
|
|
; CHECK-NEXT: ret i16 [[RV]]
|
|
;
|
|
entry:
|
|
br label %for.body
|
|
|
|
for.body: ; preds = %entry, %for.latch
|
|
%i.07 = phi i16 [ 99, %entry ], [ %inc7, %for.latch ]
|
|
%lv = load i16, ptr @v_38, align 1
|
|
%cmp1 = icmp eq i16 %lv, 32767
|
|
br i1 %cmp1, label %cond.end, label %cond.end
|
|
|
|
cond.end: ; preds = %for.body, %for.body
|
|
%cmp2 = icmp eq i16 %lv, 0
|
|
br i1 %cmp2, label %for.latch, label %cond.false4
|
|
|
|
cond.false4: ; preds = %cond.end
|
|
%rem = srem i16 5786, %lv
|
|
br label %for.latch
|
|
|
|
for.latch: ; preds = %cond.end, %cond.false4
|
|
%cond6 = phi i16 [ %rem, %cond.false4 ], [ 5786, %cond.end ]
|
|
store i16 %cond6, ptr @v_39, align 1
|
|
%inc7 = add nsw i16 %i.07, 1
|
|
%cmp = icmp slt i16 %inc7, 111
|
|
br i1 %cmp, label %for.body, label %exit
|
|
|
|
exit: ; preds = %for.latch
|
|
%rv = load i16, ptr @v_39, align 1
|
|
ret i16 %rv
|
|
}
|