
Before D135808, There would be endless loop interchange posibility (no proper priority was there in profitability check. Any profitable check may leads to loop-interchange). With this patch, there is no endless interchange (priority in profitable check is defined. Order of decision is 'Cache cost' check, 'InstrOrderCost', 'Vectorization'). Corrected the dependency checking inside isProfitableForVectorization(), corrected the checking of bad order loops in isProfitablePerInstrOrderCost(). Reviewed By: Meinersbur, bmahjour, #loopoptwg Differential Revision: https://reviews.llvm.org/D135808
210 lines
8.4 KiB
LLVM
210 lines
8.4 KiB
LLVM
; RUN: opt < %s -passes=loop-interchange -cache-line-size=64 -loop-interchange-threshold=-100 -verify-loop-lcssa -S | FileCheck %s
|
|
|
|
; Test case for PR41725. The induction variables in the latches escape the
|
|
; loops and we must move some PHIs around.
|
|
|
|
@a = common dso_local global i64 0, align 4
|
|
@b = common dso_local global i64 0, align 4
|
|
@c = common dso_local global [10 x [10 x i32 ]] zeroinitializer, align 16
|
|
|
|
|
|
define void @test_lcssa_indvars1() {
|
|
; CHECK-LABEL: @test_lcssa_indvars1()
|
|
; CHECK-LABEL: inner.body:
|
|
; CHECK-NEXT: %iv.inner = phi i64 [ %[[IVNEXT:[0-9]+]], %inner.body.split ], [ 5, %inner.body.preheader ]
|
|
|
|
; CHECK-LABEL: inner.body.split:
|
|
; CHECK-NEXT: %0 = phi i64 [ %iv.outer.next, %outer.latch ]
|
|
; CHECK-NEXT: %[[IVNEXT]] = add nsw i64 %iv.inner, -1
|
|
; CHECK-NEXT: %[[COND:[0-9]+]] = icmp eq i64 %iv.inner, 0
|
|
; CHECK-NEXT: br i1 %[[COND]], label %exit, label %inner.body
|
|
|
|
; CHECK-LABEL: exit:
|
|
; CHECK-NEXT: %v4.lcssa = phi i64 [ %0, %inner.body.split ]
|
|
; CHECK-NEXT: %v8.lcssa.lcssa = phi i64 [ %[[IVNEXT]], %inner.body.split ]
|
|
; CHECK-NEXT: store i64 %v8.lcssa.lcssa, ptr @b, align 4
|
|
; CHECK-NEXT: store i64 %v4.lcssa, ptr @a, align 4
|
|
|
|
entry:
|
|
br label %outer.header
|
|
|
|
outer.header: ; preds = %outer.latch, %entry
|
|
%iv.outer = phi i64 [ 0, %entry ], [ %iv.outer.next, %outer.latch ]
|
|
br label %inner.body
|
|
|
|
inner.body: ; preds = %inner.body, %outer.header
|
|
%iv.inner = phi i64 [ 5, %outer.header ], [ %iv.inner.next, %inner.body ]
|
|
%v7 = getelementptr inbounds [10 x [10 x i32]], ptr @c, i64 0, i64 %iv.inner, i64 %iv.outer
|
|
store i32 0, ptr %v7, align 4
|
|
%iv.inner.next = add nsw i64 %iv.inner, -1
|
|
%v9 = icmp eq i64 %iv.inner, 0
|
|
br i1 %v9, label %outer.latch, label %inner.body
|
|
|
|
outer.latch: ; preds = %inner.body
|
|
%v8.lcssa = phi i64 [ %iv.inner.next, %inner.body ]
|
|
%iv.outer.next = add nuw nsw i64 %iv.outer, 1
|
|
%v5 = icmp ult i64 %iv.outer, 2
|
|
br i1 %v5, label %outer.header, label %exit
|
|
|
|
exit: ; preds = %outer.latch
|
|
%v4.lcssa = phi i64 [ %iv.outer.next, %outer.latch ]
|
|
%v8.lcssa.lcssa = phi i64 [ %v8.lcssa, %outer.latch ]
|
|
store i64 %v8.lcssa.lcssa, ptr @b, align 4
|
|
store i64 %v4.lcssa, ptr @a, align 4
|
|
ret void
|
|
}
|
|
|
|
|
|
define void @test_lcssa_indvars2() {
|
|
; CHECK-LABEL: @test_lcssa_indvars2()
|
|
; CHECK-LABEL: inner.body:
|
|
; CHECK-NEXT: %iv.inner = phi i64 [ %[[IVNEXT:[0-9]+]], %inner.body.split ], [ 5, %inner.body.preheader ]
|
|
|
|
; CHECK-LABEL: inner.body.split:
|
|
; CHECK-NEXT: %0 = phi i64 [ %iv.outer, %outer.latch ]
|
|
; CHECK-NEXT: %[[IVNEXT]] = add nsw i64 %iv.inner, -1
|
|
; CHECK-NEXT: %[[COND:[0-9]+]] = icmp eq i64 %[[IVNEXT]], 0
|
|
; CHECK-NEXT: br i1 %[[COND]], label %exit, label %inner.body
|
|
|
|
; CHECK-LABEL: exit:
|
|
; CHECK-NEXT: %v4.lcssa = phi i64 [ %0, %inner.body.split ]
|
|
; CHECK-NEXT: %v8.lcssa.lcssa = phi i64 [ %iv.inner, %inner.body.split ]
|
|
; CHECK-NEXT: store i64 %v8.lcssa.lcssa, ptr @b, align 4
|
|
; CHECK-NEXT: store i64 %v4.lcssa, ptr @a, align 4
|
|
|
|
entry:
|
|
br label %outer.header
|
|
|
|
outer.header: ; preds = %outer.latch, %entry
|
|
%iv.outer = phi i64 [ 0, %entry ], [ %iv.outer.next, %outer.latch ]
|
|
br label %inner.body
|
|
|
|
inner.body: ; preds = %inner.body, %outer.header
|
|
%iv.inner = phi i64 [ 5, %outer.header ], [ %iv.inner.next, %inner.body ]
|
|
%v7 = getelementptr inbounds [10 x [10 x i32]], ptr @c, i64 0, i64 %iv.inner, i64 %iv.outer
|
|
store i32 0, ptr %v7, align 4
|
|
%iv.inner.next = add nsw i64 %iv.inner, -1
|
|
%v9 = icmp eq i64 %iv.inner.next, 0
|
|
br i1 %v9, label %outer.latch, label %inner.body
|
|
|
|
outer.latch: ; preds = %inner.body
|
|
%v8.lcssa = phi i64 [ %iv.inner, %inner.body ]
|
|
%iv.outer.next = add nuw nsw i64 %iv.outer, 1
|
|
%v5 = icmp ult i64 %iv.outer.next, 2
|
|
br i1 %v5, label %outer.header, label %exit
|
|
|
|
exit: ; preds = %outer.latch
|
|
%v4.lcssa = phi i64 [ %iv.outer, %outer.latch ]
|
|
%v8.lcssa.lcssa = phi i64 [ %v8.lcssa, %outer.latch ]
|
|
store i64 %v8.lcssa.lcssa, ptr @b, align 4
|
|
store i64 %v4.lcssa, ptr @a, align 4
|
|
ret void
|
|
}
|
|
|
|
define void @test_lcssa_indvars3() {
|
|
; CHECK-LABEL: @test_lcssa_indvars3()
|
|
; CHECK-LABEL: inner.body:
|
|
; CHECK-NEXT: %iv.inner = phi i64 [ %[[IVNEXT:[0-9]+]], %inner.body.split ], [ 5, %inner.body.preheader ]
|
|
|
|
; CHECK-LABEL: inner.body.split:
|
|
; CHECK-NEXT: %0 = phi i64 [ %iv.outer.next, %outer.latch ]
|
|
; CHECK-NEXT: %[[IVNEXT]] = add nsw i64 %iv.inner, -1
|
|
; CHECK-NEXT: %[[COND:[0-9]+]] = icmp eq i64 %iv.inner, 0
|
|
; CHECK-NEXT: br i1 %[[COND]], label %exit, label %inner.body
|
|
|
|
; CHECK-LABEL: exit:
|
|
; CHECK-NEXT: %v4.lcssa = phi i64 [ %0, %inner.body.split ]
|
|
; CHECK-NEXT: %v8.lcssa.lcssa = phi i64 [ %[[IVNEXT]], %inner.body.split ]
|
|
; CHECK-NEXT: %v8.lcssa.lcssa.2 = phi i64 [ %[[IVNEXT]], %inner.body.split ]
|
|
; CHECK-NEXT: %r1 = add i64 %v8.lcssa.lcssa, %v8.lcssa.lcssa.2
|
|
; CHECK-NEXT: store i64 %r1, ptr @b, align 4
|
|
; CHECK-NEXT: store i64 %v4.lcssa, ptr @a, align 4
|
|
|
|
|
|
entry:
|
|
br label %outer.header
|
|
|
|
outer.header: ; preds = %outer.latch, %entry
|
|
%iv.outer = phi i64 [ 0, %entry ], [ %iv.outer.next, %outer.latch ]
|
|
br label %inner.body
|
|
|
|
inner.body: ; preds = %inner.body, %outer.header
|
|
%iv.inner = phi i64 [ 5, %outer.header ], [ %iv.inner.next, %inner.body ]
|
|
%v7 = getelementptr inbounds [10 x [10 x i32]], ptr @c, i64 0, i64 %iv.inner, i64 %iv.outer
|
|
store i32 0, ptr %v7, align 4
|
|
%iv.inner.next = add nsw i64 %iv.inner, -1
|
|
%v9 = icmp eq i64 %iv.inner, 0
|
|
br i1 %v9, label %outer.latch, label %inner.body
|
|
|
|
outer.latch: ; preds = %inner.body
|
|
%v8.lcssa = phi i64 [ %iv.inner.next, %inner.body ]
|
|
;%const.lcssa = phi i64 [ 111, %inner.body ]
|
|
%iv.outer.next = add nuw nsw i64 %iv.outer, 1
|
|
%v5 = icmp ult i64 %iv.outer, 2
|
|
br i1 %v5, label %outer.header, label %exit
|
|
|
|
exit: ; preds = %outer.latch
|
|
%v4.lcssa = phi i64 [ %iv.outer.next, %outer.latch ]
|
|
%v8.lcssa.lcssa = phi i64 [ %v8.lcssa, %outer.latch ]
|
|
%v8.lcssa.lcssa.2 = phi i64 [ %v8.lcssa, %outer.latch ]
|
|
%r1 = add i64 %v8.lcssa.lcssa, %v8.lcssa.lcssa.2
|
|
store i64 %r1, ptr @b, align 4
|
|
store i64 %v4.lcssa, ptr @a, align 4
|
|
ret void
|
|
}
|
|
|
|
|
|
; Make sure we do not crash for loops without reachable exits.
|
|
define void @no_reachable_exits() {
|
|
; Check we do not crash.
|
|
; CHECK-LABEL: @no_reachable_exits(
|
|
; CHECK-NEXT: bb:
|
|
; CHECK-NEXT: br label [[OUTER_PH:%.*]]
|
|
; CHECK: outer.ph:
|
|
; CHECK-NEXT: br label [[OUTER_HEADER:%.*]]
|
|
; CHECK: outer.header:
|
|
; CHECK-NEXT: [[TMP2:%.*]] = phi i32 [ 0, [[OUTER_PH]] ], [ [[TMP8:%.*]], [[OUTER_LATCH:%.*]] ]
|
|
; CHECK-NEXT: br i1 undef, label [[INNER_PH:%.*]], label [[OUTER_LATCH]]
|
|
; CHECK: inner.ph:
|
|
; CHECK-NEXT: br label [[INNER_BODY:%.*]]
|
|
; CHECK: inner.body:
|
|
; CHECK-NEXT: [[TMP31:%.*]] = phi i32 [ 0, [[INNER_PH]] ], [ [[TMP6:%.*]], [[INNER_BODY]] ]
|
|
; CHECK-NEXT: [[TMP5:%.*]] = load ptr, ptr undef, align 8
|
|
; CHECK-NEXT: [[TMP6]] = add nsw i32 [[TMP31]], 1
|
|
; CHECK-NEXT: br i1 false, label [[INNER_BODY]], label [[OUTER_LATCH_LOOPEXIT:%.*]]
|
|
; CHECK: outer.latch.loopexit:
|
|
; CHECK-NEXT: br label [[OUTER_LATCH]]
|
|
; CHECK: outer.latch:
|
|
; CHECK-NEXT: [[TMP8]] = add nsw i32 [[TMP2]], 1
|
|
; CHECK-NEXT: br i1 false, label [[OUTER_HEADER]], label [[EXIT:%.*]]
|
|
; CHECK: exit:
|
|
; CHECK-NEXT: unreachable
|
|
|
|
|
|
bb:
|
|
br label %outer.ph
|
|
|
|
outer.ph: ; preds = %bb
|
|
br label %outer.header
|
|
|
|
outer.header: ; preds = %outer.ph, %outer.latch
|
|
%tmp2 = phi i32 [ 0, %outer.ph ], [ %tmp8, %outer.latch ]
|
|
br i1 undef, label %inner.ph, label %outer.latch
|
|
|
|
inner.ph: ; preds = %outer.header
|
|
br label %inner.body
|
|
|
|
inner.body: ; preds = %inner.ph, %inner.body
|
|
%tmp31 = phi i32 [ 0, %inner.ph ], [ %tmp6, %inner.body]
|
|
%tmp5 = load ptr, ptr undef, align 8
|
|
%tmp6 = add nsw i32 %tmp31, 1
|
|
br i1 undef, label %inner.body, label %outer.latch
|
|
|
|
outer.latch: ; preds = %inner.body, %outer.header
|
|
%tmp8 = add nsw i32 %tmp2, 1
|
|
br i1 undef, label %outer.header, label %exit
|
|
|
|
exit: ; preds = %outer.latch
|
|
unreachable
|
|
}
|