
As specified in #53942, DA assumes base pointer invariance in its process. Some cases were fixed by #116628. However, that PR only addressed the parts related to AliasAnalysis, so the original issue persists in later stages, especially when the AliasAnalysis results in `MustAlias`. This patch insert an explicit loop-invariant checks for the base pointer and skips analysis when it is not loop-invariant. Fix the cases added in #148240.
317 lines
11 KiB
LLVM
317 lines
11 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 5
|
|
; RUN: opt < %s -disable-output "-passes=print<da>" -aa-pipeline=basic-aa 2>&1 \
|
|
; RUN: | FileCheck %s
|
|
|
|
; Check that dependence analysis correctly handles flip-flop of base addresses.
|
|
; Bug 41488 - https://github.com/llvm/llvm-project/issues/41488
|
|
|
|
define float @bug41488_test1(float %f) {
|
|
; CHECK-LABEL: 'bug41488_test1'
|
|
; CHECK-NEXT: Src: %0 = load float, ptr %p, align 4 --> Dst: %0 = load float, ptr %p, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: %0 = load float, ptr %p, align 4 --> Dst: store float %f, ptr %q, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store float %f, ptr %q, align 4 --> Dst: store float %f, ptr %q, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
%g = alloca float, align 4
|
|
%h = alloca float, align 4
|
|
br label %for.body
|
|
|
|
for.body:
|
|
%p = phi float* [ %g, %entry ], [ %q, %for.body ]
|
|
%q = phi float* [ %h, %entry ], [ %p, %for.body ]
|
|
%0 = load float, float* %p, align 4
|
|
store float %f, float* %q, align 4
|
|
%branch_cond = fcmp ugt float %0, 0.0
|
|
br i1 %branch_cond, label %for.cond.cleanup, label %for.body
|
|
|
|
for.cond.cleanup:
|
|
ret float %f
|
|
}
|
|
|
|
define void @bug41488_test2(i32 %n) {
|
|
; CHECK-LABEL: 'bug41488_test2'
|
|
; CHECK-NEXT: Src: %0 = load float, ptr %p, align 4 --> Dst: %0 = load float, ptr %p, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: %0 = load float, ptr %p, align 4 --> Dst: store float 0.000000e+00, ptr %q, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store float 0.000000e+00, ptr %q, align 4 --> Dst: store float 0.000000e+00, ptr %q, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
%g = alloca float, align 4
|
|
%h = alloca float, align 4
|
|
br label %for.body
|
|
|
|
for.body:
|
|
%i = phi i32 [0, %entry ], [ %inc, %for.body ]
|
|
%p = phi float* [ %g, %entry ], [ %q, %for.body ]
|
|
%q = phi float* [ %h, %entry ], [ %p, %for.body ]
|
|
%0 = load float, float* %p, align 4
|
|
store float 0.0, float* %q, align 4
|
|
%inc = add nuw i32 %i, 1
|
|
%branch_cond = icmp ult i32 %i, %n
|
|
br i1 %branch_cond, label %for.body, label %for.cond.cleanup
|
|
|
|
for.cond.cleanup:
|
|
ret void
|
|
}
|
|
|
|
; Bug 53942 - https://github.com/llvm/llvm-project/issues/53942
|
|
|
|
define void @bug53942_foo(i32 noundef %n, ptr noalias nocapture noundef writeonly %A, ptr noalias nocapture noundef %B) {
|
|
; CHECK-LABEL: 'bug53942_foo'
|
|
; CHECK-NEXT: Src: %.pre = load double, ptr %B, align 8 --> Dst: %.pre = load double, ptr %B, align 8
|
|
; CHECK-NEXT: da analyze - consistent input [S]!
|
|
; CHECK-NEXT: Src: %.pre = load double, ptr %B, align 8 --> Dst: store double %.pre, ptr %arrayidx2, align 8
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store double %.pre, ptr %arrayidx2, align 8 --> Dst: store double %.pre, ptr %arrayidx2, align 8
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
%cmp8 = icmp sgt i32 %n, 1
|
|
br i1 %cmp8, label %for.body.preheader, label %for.cond.cleanup
|
|
|
|
for.body.preheader: ; preds = %entry
|
|
%wide.trip.count = zext nneg i32 %n to i64
|
|
br label %for.body
|
|
|
|
for.cond.cleanup: ; preds = %for.body, %entry
|
|
ret void
|
|
|
|
for.body: ; preds = %for.body.preheader, %for.body
|
|
%indvars.iv = phi i64 [ 1, %for.body.preheader ], [ %indvars.iv.next, %for.body ]
|
|
%ptr1.011 = phi ptr [ %A, %for.body.preheader ], [ %ptr2.09, %for.body ]
|
|
%ptr2.09 = phi ptr [ %B, %for.body.preheader ], [ %ptr1.011, %for.body ]
|
|
%.pre = load double, ptr %B, align 8
|
|
%arrayidx2 = getelementptr inbounds double, ptr %ptr1.011, i64 %indvars.iv
|
|
store double %.pre, ptr %arrayidx2, align 8
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
%exitcond.not = icmp eq i64 %indvars.iv.next, %wide.trip.count
|
|
br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
|
|
}
|
|
|
|
|
|
; Bug 53942 - https://github.com/llvm/llvm-project/issues/53942
|
|
|
|
define void @bug53942_bar(i32 noundef %n, ptr noalias noundef %A, ptr noalias noundef %B) {
|
|
; CHECK-LABEL: 'bug53942_bar'
|
|
; CHECK-NEXT: Src: %0 = load double, ptr %arrayidx, align 8 --> Dst: %0 = load double, ptr %arrayidx, align 8
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: %0 = load double, ptr %arrayidx, align 8 --> Dst: store double %0, ptr %arrayidx8, align 8
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store double %0, ptr %arrayidx8, align 8 --> Dst: store double %0, ptr %arrayidx8, align 8
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
br label %for.cond
|
|
|
|
for.cond: ; preds = %for.inc, %entry
|
|
%i.0 = phi i32 [ 1, %entry ], [ %inc, %for.inc ]
|
|
%cmp = icmp slt i32 %i.0, %n
|
|
br i1 %cmp, label %for.body, label %for.cond.cleanup
|
|
|
|
for.cond.cleanup: ; preds = %for.cond
|
|
br label %for.end
|
|
|
|
for.body: ; preds = %for.cond
|
|
%and = and i32 %i.0, 2
|
|
%tobool.not = icmp eq i32 %and, 0
|
|
br i1 %tobool.not, label %cond.false, label %cond.true
|
|
|
|
cond.true: ; preds = %for.body
|
|
br label %cond.end
|
|
|
|
cond.false: ; preds = %for.body
|
|
br label %cond.end
|
|
|
|
cond.end: ; preds = %cond.false, %cond.true
|
|
%cond = phi ptr [ %A, %cond.true ], [ %B, %cond.false ]
|
|
%and1 = and i32 %i.0, 2
|
|
%tobool2.not = icmp eq i32 %and1, 0
|
|
br i1 %tobool2.not, label %cond.false4, label %cond.true3
|
|
|
|
cond.true3: ; preds = %cond.end
|
|
br label %cond.end5
|
|
|
|
cond.false4: ; preds = %cond.end
|
|
br label %cond.end5
|
|
|
|
cond.end5: ; preds = %cond.false4, %cond.true3
|
|
%cond6 = phi ptr [ %B, %cond.true3 ], [ %A, %cond.false4 ]
|
|
%sub = add nsw i32 %i.0, -1
|
|
%idxprom = sext i32 %sub to i64
|
|
%arrayidx = getelementptr inbounds double, ptr %cond6, i64 %idxprom
|
|
%0 = load double, ptr %arrayidx, align 8
|
|
%idxprom7 = zext nneg i32 %i.0 to i64
|
|
%arrayidx8 = getelementptr inbounds double, ptr %cond, i64 %idxprom7
|
|
store double %0, ptr %arrayidx8, align 8
|
|
br label %for.inc
|
|
|
|
for.inc: ; preds = %cond.end5
|
|
%inc = add nuw nsw i32 %i.0, 1
|
|
br label %for.cond
|
|
|
|
for.end: ; preds = %for.cond.cleanup
|
|
ret void
|
|
}
|
|
|
|
; Pseudo-code for the following IR:
|
|
;
|
|
; void f(int A[][42]) {
|
|
; for (int i = 0; i < 100; i++)
|
|
; for (int j = 0; j < 41; j++)
|
|
; (j % 2 == 0 ? A[i][j] : A[i][j+1]) = 1;
|
|
; }
|
|
;
|
|
; There are loop-carried dependencies between the store instruction. For
|
|
; example, the value of %ptr0 when (i, j) = (0, 1) is %A+8, which is the same
|
|
; as when (i, j) = (0, 2).
|
|
|
|
define void @non_invariant_baseptr_with_identical_obj(ptr %A) {
|
|
; CHECK-LABEL: 'non_invariant_baseptr_with_identical_obj'
|
|
; CHECK-NEXT: Src: store i32 1, ptr %idx, align 4 --> Dst: store i32 1, ptr %idx, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
br label %loop.i.header
|
|
|
|
loop.i.header:
|
|
%i = phi i32 [ 0, %entry ], [ %i.inc, %loop.i.latch ]
|
|
%A1 = getelementptr i32, ptr %A, i32 1
|
|
br label %loop.j
|
|
|
|
loop.j:
|
|
%j = phi i32 [ 0, %loop.i.header ], [ %j.inc, %loop.j ]
|
|
%ptr0 = phi ptr [ %A, %loop.i.header ], [ %ptr1, %loop.j ]
|
|
%ptr1 = phi ptr [ %A1, %loop.i.header ], [ %ptr0, %loop.j ]
|
|
%idx = getelementptr [42 x i32], ptr %ptr0, i32 %i, i32 %j
|
|
store i32 1, ptr %idx
|
|
%j.inc = add i32 %j, 1
|
|
%cmp.j = icmp slt i32 %j.inc, 41
|
|
br i1 %cmp.j, label %loop.j, label %loop.i.latch
|
|
|
|
loop.i.latch:
|
|
%i.inc = add i32 %i, 1
|
|
%cmp.i = icmp slt i32 %i.inc, 100
|
|
br i1 %cmp.i, label %loop.i.header, label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
; Pseudo-code for the following IR:
|
|
;
|
|
; void f(int A[][42][42]) {
|
|
; for (int i = 0; i < 100; i++)
|
|
; for (int j = 0; j < 41; j++) {
|
|
; int *ptr0 = (j % 2 == 0 ? A[i][j] : A[i][j+1]);
|
|
; for (int k = 0; k < 42; k++)
|
|
; ptr0[k] = 1;
|
|
; }
|
|
; }
|
|
;
|
|
; Similar to the above case, but ptr0 is loop-invariant with respsect to the
|
|
; k-loop.
|
|
;
|
|
; Same as the above case, there are loop-carried dependencies between the
|
|
; store.
|
|
|
|
define void @non_invariant_baseptr_with_identical_obj2(ptr %A) {
|
|
; CHECK-LABEL: 'non_invariant_baseptr_with_identical_obj2'
|
|
; CHECK-NEXT: Src: store i32 1, ptr %idx, align 4 --> Dst: store i32 1, ptr %idx, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
br label %loop.i.header
|
|
|
|
loop.i.header:
|
|
%i = phi i32 [ 0, %entry ], [ %i.inc, %loop.i.latch ]
|
|
%A1 = getelementptr i32, ptr %A, i32 1
|
|
br label %loop.j.header
|
|
|
|
loop.j.header:
|
|
%j = phi i32 [ 0, %loop.i.header ], [ %j.inc, %loop.j.latch ]
|
|
%ptr0 = phi ptr [ %A, %loop.i.header ], [ %ptr1, %loop.j.latch ]
|
|
%ptr1 = phi ptr [ %A1, %loop.i.header ], [ %ptr0, %loop.j.latch ]
|
|
br label %loop.k
|
|
|
|
loop.k:
|
|
%k = phi i32 [ 0, %loop.j.header ], [ %k.inc, %loop.k ]
|
|
%idx = getelementptr [42 x [42 x i32]], ptr %ptr0, i32 %i, i32 %k, i32 %j
|
|
store i32 1, ptr %idx
|
|
%k.inc = add i32 %k, 1
|
|
%cmp.k = icmp slt i32 %k.inc, 42
|
|
br i1 %cmp.k, label %loop.k, label %loop.j.latch
|
|
|
|
loop.j.latch:
|
|
%j.inc = add i32 %j, 1
|
|
%cmp.j = icmp slt i32 %j.inc, 41
|
|
br i1 %cmp.j, label %loop.j.header, label %loop.i.latch
|
|
|
|
loop.i.latch:
|
|
%i.inc = add i32 %i, 1
|
|
%cmp.i = icmp slt i32 %i.inc, 100
|
|
br i1 %cmp.i, label %loop.i.header, label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
; Pseudo-code that is approximately semantically equivalent to the below IR:
|
|
;
|
|
; void f(int A[][32]) {
|
|
; for (int i = 0; i < 100; i++)
|
|
; for (int j = 0; j < 15; j++) {
|
|
; int offset = (j % 2 == 0) ? 1 : 0;
|
|
; A[i][2 * j + offset + 0] = 1;
|
|
; A[i][2 * j + offset + 1] = 1;
|
|
; }
|
|
; }
|
|
;
|
|
; There are loop-carried dependencies between the two stores. For example,
|
|
; A[0][2] is accessed from both the former one when (i, j) = (0, 1) and the
|
|
; latter one when (i, j) = (0, 0).
|
|
;
|
|
define void @non_invariant_baseptr_with_identical_obj3(ptr %A) {
|
|
; CHECK-LABEL: 'non_invariant_baseptr_with_identical_obj3'
|
|
; CHECK-NEXT: Src: store i32 1, ptr %idx0, align 4 --> Dst: store i32 1, ptr %idx0, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store i32 1, ptr %idx0, align 4 --> Dst: store i32 1, ptr %idx1, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
; CHECK-NEXT: Src: store i32 1, ptr %idx1, align 4 --> Dst: store i32 1, ptr %idx1, align 4
|
|
; CHECK-NEXT: da analyze - confused!
|
|
;
|
|
entry:
|
|
br label %loop.i.header
|
|
|
|
loop.i.header:
|
|
%i = phi i32 [ 0, %entry ], [ %i.inc, %loop.i.latch ]
|
|
%A1 = getelementptr i32, ptr %A, i32 1
|
|
br label %loop.j
|
|
|
|
loop.j:
|
|
%j = phi i32 [ 0, %loop.i.header ], [ %j.inc, %loop.j ]
|
|
%ptr0 = phi ptr [ %A1, %loop.i.header ], [ %ptr1, %loop.j ]
|
|
%ptr1 = phi ptr [ %A, %loop.i.header ], [ %ptr0, %loop.j ]
|
|
%j2_0 = shl i32 %j, 1
|
|
%j2_1 = add i32 %j2_0, 1
|
|
%idx0 = getelementptr [32 x i32], ptr %ptr0, i32 %i, i32 %j2_0
|
|
%idx1 = getelementptr [32 x i32], ptr %ptr0, i32 %i, i32 %j2_1
|
|
store i32 1, ptr %idx0
|
|
store i32 1, ptr %idx1
|
|
%j.inc = add i32 %j, 1
|
|
%cmp.j = icmp slt i32 %j.inc, 15
|
|
br i1 %cmp.j, label %loop.j, label %loop.i.latch
|
|
|
|
loop.i.latch:
|
|
%i.inc = add i32 %i, 1
|
|
%cmp.i = icmp slt i32 %i.inc, 100
|
|
br i1 %cmp.i, label %loop.i.header, label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|