llvm-project/llvm/test/Transforms/LoopVectorize/interleaved-accesses-max-dependences.ll
Anna Thomas 3cf24dbbdd [LV] Complete load groups and release store groups. Try 2.
This is a complete fix for CompleteLoadGroups introduced in
D154309. We need to check for dependency between A and every member of
the load Group of B.
This patch also fixes another miscompile seen when we incorrectly sink stores
below a depending load (see testcase in
interleaved-accesses-sink-store-across-load.ll). This is fixed by
releasing store groups correctly.

This change was previously reverted (e85fd3cbdd68) due to Asan failure with
use-after-free error. A testcase is added and the bug is fixed in this
version of the patch.

Differential Revision: https://reviews.llvm.org/D155520
2023-08-08 18:10:23 -04:00

29 lines
1.0 KiB
LLVM

; RUN: opt -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=1 -enable-interleaved-mem-accesses=true -max-dependences=0 -S %s | FileCheck %s
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
; None of these stores have dependences between them, so we can successfully
; interleave them even though the max-dependences threshold is 0.
define void @three_interleaved_stores(ptr %arr) {
; CHECK-LABEL: define void @three_interleaved_stores
; CHECK: store <12 x i8>
entry:
br label %loop
loop:
%i = phi i64 [ 0, %entry ], [ %i.next, %loop ]
%i.plus.1 = add nuw nsw i64 %i, 1
%i.plus.2 = add nuw nsw i64 %i, 2
%gep.i.plus.0 = getelementptr inbounds i8, ptr %arr, i64 %i
%gep.i.plus.1 = getelementptr inbounds i8, ptr %arr, i64 %i.plus.1
%gep.i.plus.2 = getelementptr inbounds i8, ptr %arr, i64 %i.plus.2
store i8 1, ptr %gep.i.plus.0
store i8 1, ptr %gep.i.plus.1
store i8 1, ptr %gep.i.plus.2
%i.next = add nuw nsw i64 %i, 3
%icmp = icmp ugt i64 %i, 1032
br i1 %icmp, label %exit, label %loop
exit:
ret void
}